losses.py

import random
import chainer
import chainer.functions as F
from chainer import Variable,cuda

class ImagePool():
    def __init__(self, pool_size):
        self.pool_size = pool_size
        if self.pool_size > 0:
            self.num_imgs = 0
            self.images = []

    def query(self, images):
        if self.pool_size == 0:
            return images
        return_images = []
        xp = cuda.get_array_module(images)
        for image in images:
            image = xp.expand_dims(image, axis=0)
            if self.num_imgs < self.pool_size:
                self.num_imgs = self.num_imgs + 1
                self.images.append(image)
                return_images.append(image)
            else:
                if random.choice([True, False]):
                    random_id = random.randint(0, self.pool_size - 1)
                    tmp = xp.copy(self.images[random_id])
                    self.images[random_id] = image
                    return_images.append(tmp)
                else:
                    return_images.append(image)
        return_images = xp.concatenate(return_images)
        return return_images

def add_noise(h, sigma): 
    xp = cuda.get_array_module(h.data)
    if chainer.config.train and sigma>0:
        return h + sigma * xp.random.randn(*h.data.shape).astype(h.dtype)
    else:
        return h

## contrastive loss of a batch
def contrastive_loss(x,t, margin=0.2):
    xp = x.xp
    d = F.sum((F.expand_dims(x, axis=0)-F.expand_dims(x, axis=1))**2, axis=-1)
    lb = (xp.expand_dims(t.array, axis=0) == xp.expand_dims(t.array, axis=1))
    pos = F.expand_dims(d[lb], axis=1)
    neg = F.expand_dims(d[xp.logical_not(lb)], axis=0)
    return F.average(F.relu(pos - neg + margin))    

## binary focal loss (x has to be [0,1])
def sigmoid_focalloss(x, t, class_weight, gamma=2, eps=1e-7):
    p = F.clip(x, x_min=eps, x_max=1-eps)
    tf = t.astype(p.dtype)
    p = tf * p + (1-tf) * (1-p)
    w = class_weight[t]
    return F.sum(-((1 - p) ** gamma) * w * F.log(p))

## multi-class focal loss
def softmax_focalloss(x, t, class_num=4, gamma=2, eps=1e-7):
    p = F.clip(F.softmax(x), x_min=eps, x_max=1-eps)
    q = -x.xp.eye(class_num)[t] * F.log(p)
    return F.sum(q * ((1 - p) ** gamma))

## discriminator CE loss for fake (all values should be zero)
def cross_entropy_dis_fake(y_fake):
    batchsize,_,w,h = y_fake.data.shape
    return(F.sum(F.softplus(-y_fake)) / batchsize / w / h)

## apply average filter and take difference
def loss_avg(x,y, ksize=3, norm='l2', weight=None):
    if ksize>1:
        ax = F.average_pooling_2d(x,ksize,1,0)
        ay = F.average_pooling_2d(y,ksize,1,0)
    else:
        ax = x
        ay = y
    if weight:
        if norm=='l1':        
            return F.average(F.absolute(ax-ay)*(weight*ay+1))
        else:
            return F.average(((ax-ay)**2)*(weight*ay+1))
    else:
        if norm=='l1':        
            return F.mean_absolute_error(ax,ay)
        else:
            return F.mean_squared_error(ax,ay)

## apply pre-trained CNN and take difference
def loss_perceptual(x,y,model,layer='conv4_2',grey=False):
    with chainer.using_config('train', False) and chainer.no_backprop_mode():
        if grey:
            loss = 0
            for i in range(x.shape[1]):
                xp = cuda.get_array_module(x.data)
                xx=x[:,i:(i+1),:,:]
                vx = model(F.concat([xx,xx,xx]), layers=[layer])[layer]
                yy=y[:,i:(i+1),:,:]
                vy = model(F.concat([yy,yy,yy]), layers=[layer])[layer]
                loss += F.mean_squared_error(vx,vy)
            loss /= x.shape[1]
        else:
            vx = model(x, layers=[layer])[layer]
            vy = model(y, layers=[layer])[layer]
            loss = F.mean_squared_error(vx,vy)
    return(loss)

## compute gradient and take difference
def loss_grad(x, y, method='diff',norm='l1'):
    if method=="diff":
        dxx = x[:, :, 1:, :] - x[:, :, :-1, :]
        dyx = y[:, :, 1:, :] - y[:, :, :-1, :]
        dxy = x[:, :, :, 1:] - x[:, :, :, :-1]
        dyy = y[:, :, :, 1:] - y[:, :, :, :-1]
    elif method=="sobel": # apply Sobel's filter
        xp = cuda.get_array_module(x.data)
        grad = xp.tile(xp.asarray([[[[1,0,-1],[2,0,-2],[1,0,-1]]]],dtype=x.dtype),(x.data.shape[1],1,1))
        dxx = F.convolution_2d(x,grad)
        dyx = F.convolution_2d(y,grad)
        dxy = F.convolution_2d(x,xp.transpose(grad,(0,1,3,2)))
        dyy = F.convolution_2d(y,xp.transpose(grad,(0,1,3,2)))
    if norm=='l1':
        return F.mean_absolute_error(dxx,dyx)+F.mean_absolute_error(dxy,dyy)
    else:
        return F.mean_squared_error(dxx,dyx)+F.mean_squared_error(dxy,dyy)

# compare only pixels with x < threshold.
def loss_comp_low(x,y,threshold,norm='l1'):
    mask = ((x.array <= threshold)^(y.array <= threshold)).astype(x.xp.float32) ## XOR
    if norm=='l1':
        return(F.average( mask * F.absolute_error(x,y) ))
    else:
        return(F.average( mask * F.squared_error(x,y) ))

def loss_func_comp(y, val, noise=0):
    xp = cuda.get_array_module(y.data)
    if noise>0:
        val += random.normalvariate(0,noise)   ## jitter for the target value
#        val += random.uniform(-noise, noise)   ## jitter for the target value
    shape = y.data.shape
    if y.shape[1] == 2:  ## weighted discriminator
        shape = (shape[0],1,shape[2],shape[3])
        target = xp.full(shape, val, dtype=y.dtype)
        W = F.tanh(y[:,1,:,:])+1
        return F.average( ((y[:,0,:,:]-target)**2) * W )  ## weighted loss
    else:
        target = xp.full(shape, val, dtype=y.dtype)
        return F.mean_squared_error(y, target)

def loss_func_reg(y,norm='l1'):
    if norm=='l1':
        return(F.average(F.absolute(y)))
    else:
        return(F.average(y**2))

def total_variation(x,tau=1e-6, method="usual"):
    xp = cuda.get_array_module(x.data)
    if method=="abs":
        dx = x[:, :, 1:, :] - x[:, :, :-1, :]
        dy = x[:, :, :, 1:] - x[:, :, :, :-1]
        return F.average(F.absolute(dx))+F.average(F.absolute(dy))
    elif method=="sobel":
        wh = xp.tile(xp.asarray([[[[1,0],[-1,0]]]], dtype=x.dtype),(x.data.shape[1],1,1))
        ww = xp.tile(xp.asarray([[[[1, -1],[0, 0]]]], dtype=x.dtype),(x.data.shape[1],1,1))
        dx = F.convolution_2d(x, W=wh)
        dy = F.convolution_2d(x, W=ww)
        d = F.sqrt(dx**2 + dy**2 + xp.full(dx.data.shape, tau**2, dtype=dx.dtype))
        return(F.average(d))
    elif method=="usual":
        xp = cuda.get_array_module(x.data)
        dx = x[:, :, 1:, :-1] - x[:, :, :-1, :-1]
        dy = x[:, :, :-1, 1:] - x[:, :, :-1, :-1]
        d = F.sqrt(dx**2 + dy**2 + xp.full(dx.data.shape, tau**2, dtype=dx.dtype))
        return(F.average(d))

def total_variation_ch(x):
    xp = cuda.get_array_module(x.data)
    dx = x[:, 1:, :, :] - x[:, :-1, :, :]
    return F.average(F.absolute(dx))