**CMU 16-726 Learning-based Image Synthesis**
**Assignment #4**
*Title: "Neural Style Transfer"*
*Name: Soyong Shin (soyongs@andrew.cmu.edu)*
(##) Contents
* Part 1 Introduction and Overview
* Part 2 Content Reconstruction
* Part 3 Texture Synthesis
* Part 4 Neural Style Transfer
(##) Part 1 Introduction and Overview
**1.1 Introduction**
![figure [sample_transfer]: Sample image of Neural Style Transfer](report/Figure1.png)
In this assignment, I implemented an algorithm that transfers the style of one image onto another while preserving the content of the target image.
This method, called "Neural Style Transfer," consists of two parts: content reconstruction and texture synthesis.
Content reconstruction builds an image from noise that shares the content of a target image, while texture synthesis
generates an image that shares the style of a target image.
By integrating the two methods, we obtain an overall architecture that takes two images (one for the style and the other for the content) and
returns a new image combining the content of one input with the style of the other (see Figure 1).
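Concretely, following Gatys et al., the output image $x$ is obtained by directly optimizing its pixels to minimize a weighted combination of the two losses with respect to the content image $c$ and the style image $s$:

$$ x^{*} = \arg\min_{x} \; \alpha \, \mathcal{L}_{content}(x, c) + \beta \, \mathcal{L}_{style}(x, s), $$

where the weights $\alpha$ and $\beta$ control the trade-off between content fidelity and style strength.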
------------------------------------------------------------------------------------------------------------------------------------------------------------
**1.2 Neural network (VGG-19)**
This algorithm uses the feature extractor of the **VGG-19** network, which consists of 5 convolutional blocks.
The outputs of the convolutional blocks are features at different levels of abstraction ($L \in \{1, 2, 3, 4, 5\}$).
To reconstruct content and synthesize texture, the algorithm computes the content and style losses on features at selected levels, where the choice of level $L$ is one of the hyper-parameters of the algorithm.
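When multiple levels are selected, a natural choice, and the one assumed in the sketches below, is to sum the per-level terms. With $\mathcal{C}$ and $\mathcal{S}$ the sets of levels chosen for content and style respectively,

$$ \mathcal{L}_{content} = \sum_{L \in \mathcal{C}} \mathcal{L}_{content}^{L}, \qquad \mathcal{L}_{style} = \sum_{L \in \mathcal{S}} \mathcal{L}_{style}^{L}. $$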
![figure [vgg19_network]: Network Architecture of VGG-19 (Feature Extractor)](report/Figure2.png)
Figure 2 shows the architecture and diagram of the VGG-19 feature extractor.
From here on, $F^L$ denotes the feature at level $L$, i.e., the output of the intermediate convolutional block marked "Level $L$" in the diagram.
Note that this VGG-19 feature extractor is pre-trained on the ImageNet dataset.
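For reference, a minimal sketch of how such a pre-trained extractor is obtained with *torchvision* (`vgg19(pretrained=True)` and its `features` sub-module are standard torchvision API; freezing the parameters reflects that only the image, not the network, is optimized):

```python
import torchvision.models as models

# VGG-19 pre-trained on ImageNet; keep only the convolutional
# feature extractor (the `features` sub-module) in eval mode
cnn = models.vgg19(pretrained=True).features.eval()

# Freeze the network: only the input image will be optimized
for param in cnn.parameters():
    param.requires_grad_(False)
```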
------------------------------------------------------------------------------------------------------------------------------------------------------------
**1.3 Code Implementation**
To experiment with features at different levels, I duplicate the VGG-19 feature extractor while inserting content and style losses at the chosen intermediate feature levels.
Each convolutional layer (*Conv2D*) comes before its activation function (*ReLU*), and I implemented a function ***get_model_and_losses*** that inserts the
losses right after the final convolutional layer of each convolutional block (i.e., between that layer and its ReLU). The implementation is as below:
```python
import copy

import torch
import torch.nn as nn
import torch.nn.functional as F


def get_model_and_losses(cnn, style_img, content_img,
                         content_layers=content_layers_default,
                         style_layers=style_layers_default):
    """Duplicate the CNN model while inserting losses at the given feature levels.

    Args:
        cnn: VGG-19 feature extractor pre-trained on ImageNet
        style_img: image from which the texture (style) is synthesized
        content_img: image from which the content is reconstructed
        content_layers: feature levels to use for content reconstruction
        style_layers: feature levels to use for texture synthesis

    Returns:
        model: duplicated model with losses inserted
        style_losses: loss layers for texture synthesis
        content_losses: loss layers for content reconstruction
    """
    cnn = copy.deepcopy(cnn)
    content_losses = []
    style_losses = []

    normalization = Normalization()
    model = nn.Sequential(normalization)

    block_idx, layer_idx = 1, 1
    # Final convolutional layer of each VGG-19 block (2, 2, 4, 4, 4 convs)
    end_of_blocks = ['conv_1_2', 'conv_2_2', 'conv_3_4', 'conv_4_4', 'conv_5_4']

    for layer in cnn.children():
        if isinstance(layer, nn.Conv2d):
            # 2D convolutional layer
            name = 'conv_%d_%d' % (block_idx, layer_idx)
        elif isinstance(layer, nn.ReLU):
            # ReLU layer; replaced with an out-of-place version so the loss
            # modules see the conv activations before they are overwritten
            name = 'relu_%d_%d' % (block_idx, layer_idx)
            layer = nn.ReLU(inplace=False)

            if 'conv_%d_%d' % (block_idx, layer_idx) in end_of_blocks:
                # The current conv layer is the final layer of its block, so
                # the content and style losses are added here (right after
                # the conv layer, before its ReLU).
                if 'conv_%d' % block_idx in content_layers:
                    # add content loss layer
                    target = model(content_img).detach()
                    content_loss = ContentLoss(target)
                    model.add_module('content_loss_%d' % block_idx, content_loss)
                    content_losses.append(content_loss)

                if 'conv_%d' % block_idx in style_layers:
                    # add style loss layer
                    target = model(style_img).detach()
                    style_loss = StyleLoss(target)
                    model.add_module('style_loss_%d' % block_idx, style_loss)
                    style_losses.append(style_loss)

                # Stop copying layers once the deepest requested level is done
                # (lexicographic max works since block indices are single digits)
                if max(content_layers + style_layers) == 'conv_%d' % block_idx:
                    break
            layer_idx += 1
        elif isinstance(layer, nn.MaxPool2d):
            # pooling layer: move on to the next block
            name = 'pool_%d' % block_idx
            block_idx += 1
            layer_idx = 1
        else:
            raise NameError("unexpected layer type: %s" % layer.__class__.__name__)

        model.add_module(name, layer)

    return model, style_losses, content_losses
```
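For context, here is a sketch of how ***get_model_and_losses*** plugs into the optimization loop. It follows the standard LBFGS closure pattern; the layer selections, loss weights, step count, and noise initialization below are illustrative assumptions, not the exact settings of my experiments:

```python
model, style_losses, content_losses = get_model_and_losses(
    cnn, style_img, content_img,
    content_layers=['conv_4'],
    style_layers=['conv_1', 'conv_2', 'conv_3', 'conv_4', 'conv_5'])

# Start from noise and optimize the image pixels directly
input_img = torch.randn_like(content_img).requires_grad_(True)
optimizer = torch.optim.LBFGS([input_img])

style_weight, content_weight = 1e6, 1.0  # illustrative trade-off

for _ in range(300):
    def closure():
        with torch.no_grad():
            input_img.clamp_(0, 1)  # keep pixels in a valid range
        optimizer.zero_grad()
        model(input_img)  # loss modules record their values during this pass
        loss = (style_weight * sum(sl.loss for sl in style_losses)
                + content_weight * sum(cl.loss for cl in content_losses))
        loss.backward()
        return loss
    optimizer.step(closure)
```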
```python
class ContentLoss(nn.Module):
    def __init__(self, target):
        super(ContentLoss, self).__init__()
        # Standardize the target feature map with its own
        # per-channel mean and std
        _target = target.detach()
        self.mean = _target.mean((2, 3), keepdim=True)
        self.std = _target.std((2, 3), keepdim=True)
        self.target = (_target - self.mean) / self.std

    def forward(self, input):
        # Compute the loss against the standardized input,
        # then pass the input through unchanged
        self.loss = F.mse_loss((input - self.mean) / self.std, self.target)
        return input
```
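In equation form: with $\mu$ and $\sigma$ the per-channel mean and standard deviation of the *target* feature map, and $\hat{F}^{L}(\cdot) = (F^{L}(\cdot) - \mu)/\sigma$ the standardized features, the module computes

$$ \mathcal{L}_{content}^{L} = \frac{1}{N} \big\| \hat{F}^{L}(x) - \hat{F}^{L}(c) \big\|_{2}^{2}, $$

where $N$ is the number of elements in the feature map (the mean reduction of `F.mse_loss`). The layer stores its value in `self.loss` and returns its input unchanged, so it can be inserted into the duplicated `nn.Sequential` without altering the forward pass.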
```python
def gram_matrix(activations):
    a, b, c, d = activations.size()  # a = batch size (= 1), b = channels
    features = activations.view(a * b, c * d)

    # Gram matrix: inner products between the vectorized feature maps
    gram = torch.mm(features, features.t())

    # Normalize by the total number of elements
    normalized_gram = gram.div(a * b * c * d)
    return normalized_gram


class StyleLoss(nn.Module):
    def __init__(self, target_feature):
        super(StyleLoss, self).__init__()
        # Standardize the target feature map with its own per-channel
        # mean and std before taking the Gram matrix
        _target = target_feature.detach()
        self.mean = _target.mean((2, 3), keepdim=True)
        self.std = _target.std((2, 3), keepdim=True)
        self.target = gram_matrix((_target - self.mean) / self.std)

    def forward(self, input):
        normalized_gram = gram_matrix((input - self.mean) / self.std)
        self.loss = F.mse_loss(normalized_gram, self.target)
        return input
```
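The Gram matrix here is the standard one from Gatys et al.: with the standardized activations reshaped to $F \in \mathbb{R}^{ab \times cd}$ (rows are the $ab$ feature channels, columns the $cd$ spatial locations, with $a = 1$),

$$ G = \frac{1}{abcd} F F^{\top}, \qquad \mathcal{L}_{style}^{L} = \frac{1}{(ab)^{2}} \big\| G(x) - G(s) \big\|_{2}^{2}. $$

Because $G$ aggregates correlations between feature channels over all spatial positions, matching Gram matrices reproduces the texture statistics of the style image while discarding its spatial layout.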