PaddlePaddle / PaddleGAN

Commit d77cf3bc
Author: lijianshe02
Date: October 14, 2020
Parent: 3d86ec00

    refine psgan code according to the reviewer's comment

Showing 13 changed files with 105 additions and 316 deletions (+105 -316).
applications/run.sh                        +0    -9
configs/makeup.yaml                        +4   -18
ppgan/datasets/makeup_dataset.py           +2   -20
ppgan/faceutils/dlibutils/__init__.py      +1    -3
ppgan/faceutils/dlibutils/dlib_utils.py    +0    -1
ppgan/faceutils/image.py                   +0   -17
ppgan/faceutils/mask/__init__.py           +1    -1
ppgan/faceutils/mask/face_parser.py        +0    -4
ppgan/faceutils/mask/model.py              +6   -26
ppgan/models/discriminators/nlayers.py     +70  -25
ppgan/models/makeup_model.py               +6    -7
ppgan/models/vgg.py                        +12 -185
ppgan/modules/norm.py                      +3    -0
applications/run.sh (deleted, mode 100644 → 0) @ 3d86ec00

-# Model notes
-# Currently includes DAIN (frame interpolation), DeOldify (colorization), DeepRemaster (denoising and colorization), EDVR (video super-resolution over consecutive frames), and RealSR (single-image super-resolution)
-# Argument notes
-# input: path to the input video
-# output: path where the output video is saved
-# proccess_order: the models to apply, in order
-python tools/video-enhance.py \
-    --input input.mp4 \
-    --output output \
-    --proccess_order DeOldify RealSR
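For reference, the same invocation can be driven from Python; a minimal sketch, mirroring the deleted script's flags (tool path and flag spelling, including "proccess_order", are exactly as in the repo):

import subprocess

# Sketch: run the enhancement pipeline the deleted shell script wrapped.
subprocess.run([
    'python', 'tools/video-enhance.py',
    '--input', 'input.mp4',
    '--output', 'output',
    '--proccess_order', 'DeOldify', 'RealSR',  # models applied in order
], check=True)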
configs/makeup.yaml @ d77cf3bc

 # copyright (c) 2020 PaddlePaddle Authors. All Rights Reserve.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-epochs: 200
-isTrain: False
-output_dir: tmp
+epochs: 100
+isTrain: True
+output_dir: degrade_match
-checkpoints_dir: checkpoints
-lambda_A: 10.0
-lambda_B: 10.0
...
@@ -31,7 +17,7 @@ model:
   ndf: 64
   n_layers: 3
   input_nc: 3
-  norm_type: batch
+  norm_type: spectral
   gan_mode: lsgan
 dataset:
...
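The norm_type switch is what selects the spectral-norm discriminator below. A minimal sketch of reading that value from the config (the exact key nesting under model: is an assumption; the diff only shows the keys themselves):

import yaml

# Sketch, assuming the file is plain YAML and norm_type sits under the
# discriminator block of model: (nesting is an assumption).
with open('configs/makeup.yaml') as f:
    cfg = yaml.safe_load(f)

norm_type = cfg['model']['discriminator']['norm_type']  # 'spectral' after this commit
assert norm_type in ('batch', 'instance', 'spectral', 'none')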
ppgan/datasets/makeup_dataset.py @ d77cf3bc

...
@@ -17,7 +17,6 @@ import os.path
 from .base_dataset import BaseDataset, get_transform
 from .transforms.makeup_transforms import get_makeup_transform
 import paddle.vision.transforms as T
 from .image_folder import make_dataset
 from PIL import Image
 import random
 import numpy as np
...
@@ -28,15 +27,6 @@ from .builder import DATASETS
 @DATASETS.register()
 class MakeupDataset(BaseDataset):
-    """
-    This dataset class can load unaligned/unpaired datasets.
-
-    It requires two directories to host training images from domain A '/path/to/data/trainA'
-    and from domain B '/path/to/data/trainB' respectively.
-    You can train the model with the dataset flag '--dataroot /path/to/data'.
-    Similarly, you need to prepare two directories:
-    '/path/to/data/testA' and '/path/to/data/testB' during test time.
-    """
     def __init__(self, cfg):
         """Initialize this dataset class.
...
@@ -83,16 +73,12 @@ class MakeupDataset(BaseDataset):
             getattr(self, cls + "_lmks_filenames").append(splits[2])

     def __getitem__(self, index):
-        """Return a data point and its metadata information.
+        """Return MANet and MDNet needed params.

         Parameters:
             index (int) -- a random integer for data indexing

-        Returns a dictionary that contains A, B, A_paths and B_paths
-            A (tensor) -- an image in the input domain
-            B (tensor) -- its corresponding image in the target domain
-            A_paths (str) -- image paths
-            B_paths (str) -- image paths
+        Returns a dictionary that contains needed params.
         """
         try:
             index_A = random.randint(
...
@@ -125,15 +111,11 @@ class MakeupDataset(BaseDataset):
                 self.image_path,
                 getattr(self, self.cls_B + "_mask_filenames")[index_B])).convert('L'))
-        #image_A.paste((200,200,200), (0,0), Image.fromarray(np.uint8(255*(np.array(mask_A)==0))))
-        #image_B.paste((200,200,200), (0,0), Image.fromarray(np.uint8(255*(np.array(mask_B)==0))))
         image_A = np.array(image_A)
         image_B = np.array(image_B)
-        print('image shape: ', image_A.shape)
         image_A = self.transform(image_A)
         image_B = self.transform(image_B)
-        print('image shape: ', image_A.shape)
         mask_A = cv2.resize(mask_A, (256, 256), interpolation=cv2.INTER_NEAREST)
...
ppgan/faceutils/dlibutils/__init__.py @ d77cf3bc

 #!/usr/bin/python
 # -*- encoding: utf-8 -*-
-from .main import detect, crop, landmarks, crop_from_array
+from .dlib_utils import detect, crop, landmarks, crop_from_array
ppgan/faceutils/dlibutils/main.py → ppgan/faceutils/dlibutils/dlib_utils.py @ d77cf3bc

...
@@ -61,7 +61,6 @@ def crop(image: Image, face, up_ratio, down_ratio, width_ratio):
     face_expand = dlib.rectangle(img_left, img_top, img_right, img_bottom)
     center = face_expand.center()
     width, height = image.size
-    # import ipdb; ipdb.set_trace()
     crop_left = img_left
     crop_top = img_top
     crop_right = img_right
...
ppgan/faceutils/image.py @ d77cf3bc

...
@@ -3,16 +3,6 @@ import cv2
 from io import BytesIO


-def load_image(path):
-    with path.open("rb") as reader:
-        data = np.fromstring(reader.read(), dtype=np.uint8)
-        img = cv2.imdecode(data, cv2.IMREAD_COLOR)
-        if img is None:
-            return
-        img = img[..., ::-1]
-    return img


 def resize_by_max(image, max_side=512, force=False):
     h, w = image.shape[:2]
     if max(h, w) < max_side and not force:
...
@@ -22,10 +12,3 @@ def resize_by_max(image, max_side=512, force=False):
     w = int(w / ratio + 0.5)
     h = int(h / ratio + 0.5)
     return cv2.resize(image, (w, h))


-def image2buffer(image):
-    is_success, buffer = cv2.imencode(".jpg", image)
-    if not is_success:
-        return None
-    return BytesIO(buffer)
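The surviving helper, resize_by_max, shrinks an image only when its longer side exceeds max_side, preserving the aspect ratio. A minimal usage sketch (the sample file name is hypothetical):

import cv2
from ppgan.faceutils.image import resize_by_max

# Sketch: cap the longer side of an image at 512 px.
image = cv2.imread('face.jpg')             # H x W x 3 BGR array (path hypothetical)
small = resize_by_max(image, max_side=512)
# The longer side of `small` is now at most ~512 px, aspect ratio kept;
# inputs already below max_side pass through unchanged unless force=True.
print(small.shape)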
ppgan/faceutils/mask/__init__.py @ d77cf3bc

...
@@ -12,4 +12,4 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
-from .main import FaceParser
+from .face_parser import FaceParser
ppgan/faceutils/mask/main.py → ppgan/faceutils/mask/face_parser.py @ d77cf3bc

...
@@ -67,9 +67,5 @@ class FaceParser:
             for j in range(w):
                 result[i][j] = self.mapper[parse_np[i][j]]
-        with open('/workspace/PaddleGAN/mapper_out.pkl', 'rb') as f:
-            torch_out = pickle.load(f)
-        cm = np.allclose(torch_out, result)
-        print('cm out: ', cm)
         result = paddle.to_tensor(result).astype('float32')
         return result
ppgan/faceutils/mask/model.py @ d77cf3bc

...
@@ -40,7 +40,6 @@ class ConvBNReLU(paddle.nn.Layer):
             bias_attr=False)
         self.bn = nn.BatchNorm2d(out_chan)
         self.relu = nn.ReLU()
-        #self.init_weight()

     def forward(self, x):
         x = self.conv(x)
...
@@ -57,7 +56,6 @@ class BiSeNetOutput(paddle.nn.Layer):
             n_classes, kernel_size=1, bias_attr=False)
-        #self.init_weight()

     def forward(self, x):
         x = self.conv(x)
...
@@ -75,11 +73,9 @@ class AttentionRefinementModule(paddle.nn.Layer):
             bias_attr=False)
         self.bn_atten = nn.BatchNorm(out_chan)
         self.sigmoid_atten = nn.Sigmoid()
-        #self.init_weight()

     def forward(self, x):
         feat = self.conv(x)
-        #atten = F.avg_pool2d(feat, feat.size()[2:])
         atten = F.avg_pool2d(feat, feat.shape[2:])
         atten = self.conv_atten(atten)
         atten = self.bn_atten(atten)
...
@@ -87,12 +83,6 @@ class AttentionRefinementModule(paddle.nn.Layer):
         out = feat * atten
         return out

-    #def init_weight(self):
-    #    for ly in self.children():
-    #        if isinstance(ly, nn.Conv2d):
-    #            nn.init.kaiming_normal_(ly.weight, a=1)
-    #            if not ly.bias is None: nn.init.constant_(ly.bias, 0)

 class ContextPath(paddle.nn.Layer):
     def __init__(self, *args, **kwargs):
...
@@ -104,37 +94,30 @@ class ContextPath(paddle.nn.Layer):
         self.conv_head16 = ConvBNReLU(128, 128, ks=3, stride=1, padding=1)
         self.conv_avg = ConvBNReLU(512, 128, ks=1, stride=1, padding=0)
-        #self.init_weight()

     def forward(self, x):
         H0, W0 = x.shape[2:]
         feat8, feat16, feat32 = self.resnet(x)
         H8, W8 = feat8.shape[2:]
         H16, W16 = feat16.shape[2:]
         H32, W32 = feat32.shape[2:]
-        print('feat32.shape: ', feat32.shape[2:])
         avg = F.avg_pool2d(feat32, feat32.shape[2:])
         avg = self.conv_avg(avg)
-        #avg_up = F.interpolate(avg, (H32, W32), mode='nearest')
-        avg_up = F.resize_nearest(avg, out_shape=(H32, W32))
+        avg_up = F.interpolate(avg, size=(H32, W32), mode='nearest')
         feat32_arm = self.arm32(feat32)
         feat32_sum = feat32_arm + avg_up
-        #feat32_up = F.interpolate(feat32_sum, (H16, W16), mode='nearest')
-        feat32_up = F.resize_nearest(feat32_sum, out_shape=(H16, W16))
+        feat32_up = F.interpolate(feat32_sum, size=(H16, W16), mode='nearest')
         feat32_up = self.conv_head32(feat32_up)
         feat16_arm = self.arm16(feat16)
         feat16_sum = feat16_arm + feat32_up
-        #feat16_up = F.interpolate(feat16_sum, (H8, W8), mode='nearest')
-        feat16_up = F.resize_nearest(feat16_sum, out_shape=(H8, W8))
+        feat16_up = F.interpolate(feat16_sum, size=(H8, W8), mode='nearest')
         feat16_up = self.conv_head16(feat16_up)

         return feat8, feat16_up, feat32_up  # x8, x8, x16

 ### This is not used, since I replace this with the resnet feature with the same size
 class SpatialPath(paddle.nn.Layer):
     def __init__(self, *args, **kwargs):
         super(SpatialPath, self).__init__()
...
@@ -142,7 +125,6 @@ class SpatialPath(paddle.nn.Layer):
         self.conv2 = ConvBNReLU(64, 64, ks=3, stride=2, padding=1)
         self.conv3 = ConvBNReLU(64, 64, ks=3, stride=2, padding=1)
         self.conv_out = ConvBNReLU(64, 128, ks=1, stride=1, padding=0)
-        #self.init_weight()

     def forward(self, x):
         feat = self.conv1(x)
...
@@ -174,7 +156,6 @@ class FeatureFusionModule(paddle.nn.Layer):
     def forward(self, fsp, fcp):
         fcat = paddle.concat([fsp, fcp], axis=1)
         feat = self.convblk(fcat)
-        #atten = F.avg_pool2d(feat, feat.size()[2:])
         atten = F.avg_pool2d(feat, feat.shape[2:])
         atten = self.conv1(atten)
         atten = self.relu(atten)
...
@@ -189,7 +170,6 @@ class BiSeNet(paddle.nn.Layer):
     def __init__(self, n_classes, *args, **kwargs):
         super(BiSeNet, self).__init__()
         self.cp = ContextPath()
-        ## here self.sp is deleted
         self.ffm = FeatureFusionModule(256, 256)
         self.conv_out = BiSeNetOutput(256, 256, n_classes)
         self.conv_out16 = BiSeNetOutput(128, 64, n_classes)
...
@@ -206,9 +186,9 @@ class BiSeNet(paddle.nn.Layer):
         feat_out16 = self.conv_out16(feat_cp8)
         feat_out32 = self.conv_out32(feat_cp16)
-        feat_out = F.resize_bilinear(feat_out, out_shape=(H, W))
-        feat_out16 = F.resize_bilinear(feat_out16, out_shape=(H, W))
-        feat_out32 = F.resize_bilinear(feat_out32, out_shape=(H, W))
+        feat_out = F.interpolate(feat_out, size=(H, W))
+        feat_out16 = F.interpolate(feat_out16, size=(H, W))
+        feat_out32 = F.interpolate(feat_out32, size=(H, W))
         return feat_out, feat_out16, feat_out32
...
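The recurring change in this file swaps the legacy fluid resize ops (F.resize_nearest / F.resize_bilinear with their out_shape argument) for the Paddle 2.0 paddle.nn.functional.interpolate API. A minimal standalone sketch of the new call:

import paddle
import paddle.nn.functional as F

# Sketch of the Paddle 2.0 resize API used above.
x = paddle.randn([1, 128, 16, 16])             # N, C, H, W feature map
up_nearest = F.interpolate(x, size=(32, 32), mode='nearest')
up_bilinear = F.interpolate(x, size=(32, 32), mode='bilinear')
print(up_nearest.shape, up_bilinear.shape)     # [1, 128, 32, 32] each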
ppgan/models/discriminators/nlayers.py @ d77cf3bc

...
@@ -25,7 +25,7 @@ from .builder import DISCRIMINATORS
 @DISCRIMINATORS.register()
-class NLayerDiscriminator(paddle.nn.Layer):
+class NLayerDiscriminator(nn.Layer):
     """Defines a PatchGAN discriminator"""

     def __init__(self, input_nc, ndf=64, n_layers=3, norm_type='instance'):
         """Construct a PatchGAN discriminator
...
@@ -47,53 +47,98 @@ class NLayerDiscriminator(paddle.nn.Layer):
         kw = 4
         padw = 1
-        #sequence = [Conv2d(input_nc, ndf, kernel_size=kw, stride=2, padding=padw), nn.LeakyReLU(0.01)]
-        sequence = [
-            Spectralnorm(
-                Conv2d(input_nc, ndf, kernel_size=kw, stride=2, padding=padw)),
-            nn.LeakyReLU(0.01)
-        ]
+        if norm_type == 'spectral':
+            sequence = [
+                Spectralnorm(
+                    Conv2d(input_nc, ndf, kernel_size=kw, stride=2,
+                           padding=padw)),
+                nn.LeakyReLU(0.01)
+            ]
+        else:
+            sequence = [
+                Conv2d(input_nc, ndf, kernel_size=kw, stride=2, padding=padw,
+                       bias_attr=use_bias),
+                nn.LeakyReLU(0.2)
+            ]
         nf_mult = 1
         nf_mult_prev = 1
         for n in range(1, n_layers):  # gradually increase the number of filters
             nf_mult_prev = nf_mult
             nf_mult = min(2**n, 8)
-            sequence += [
-                Spectralnorm(
-                    Conv2d(ndf * nf_mult_prev, ndf * nf_mult, kernel_size=kw,
-                           stride=2, padding=padw)),
-                nn.LeakyReLU(0.01)
-            ]
+            if norm_type == 'spectral':
+                sequence += [
+                    Spectralnorm(
+                        Conv2d(ndf * nf_mult_prev, ndf * nf_mult,
+                               kernel_size=kw, stride=2, padding=padw)),
+                    nn.LeakyReLU(0.01)
+                ]
+            else:
+                sequence += [
+                    Conv2d(ndf * nf_mult_prev, ndf * nf_mult, kernel_size=kw,
+                           stride=2, padding=padw, bias_attr=use_bias),
+                    norm_layer(ndf * nf_mult),
+                    nn.LeakyReLU(0.2)
+                ]
         nf_mult_prev = nf_mult
         nf_mult = min(2**n_layers, 8)
-        sequence += [
-            #Conv2d(ndf * nf_mult_prev, ndf * nf_mult, kernel_size=kw, stride=1, padding=padw, bias_attr=use_bias),
-            Spectralnorm(
-                Conv2d(ndf * nf_mult_prev, ndf * nf_mult, kernel_size=kw,
-                       stride=1, padding=padw)),
-            #norm_layer(ndf * nf_mult),
-            nn.LeakyReLU(0.01)
-        ]
+        if norm_type == 'spectral':
+            sequence += [
+                Spectralnorm(
+                    Conv2d(ndf * nf_mult_prev, ndf * nf_mult, kernel_size=kw,
+                           stride=1, padding=padw)),
+                nn.LeakyReLU(0.01)
+            ]
+        else:
+            sequence += [
+                Conv2d(ndf * nf_mult_prev, ndf * nf_mult, kernel_size=kw,
+                       stride=1, padding=padw, bias_attr=use_bias),
+                norm_layer(ndf * nf_mult),
+                nn.LeakyReLU(0.2)
+            ]
-        #sequence += [Conv2d(ndf * nf_mult, 1, kernel_size=kw, stride=1, padding=padw)]  # output 1 channel prediction map
-        sequence += [
-            Spectralnorm(
-                Conv2d(ndf * nf_mult, 1, kernel_size=kw, stride=1,
-                       padding=padw, bias_attr=False))
-        ]  # output 1 channel prediction map
+        if norm_type == 'spectral':
+            sequence += [
+                Spectralnorm(
+                    Conv2d(ndf * nf_mult, 1, kernel_size=kw, stride=1,
+                           padding=padw, bias_attr=False))
+            ]  # output 1 channel prediction map
+        else:
+            sequence += [
+                Conv2d(ndf * nf_mult, 1, kernel_size=kw, stride=1,
+                       padding=padw, bias_attr=False)
+            ]  # output 1 channel prediction map
         self.model = nn.Sequential(*sequence)

     def forward(self, input):
...
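With this change one class covers both the spectral-norm PSGAN discriminator and the classic normalized PatchGAN. A minimal construction sketch (argument values mirror configs/makeup.yaml above; the import path follows this module's location):

import paddle
from ppgan.models.discriminators.nlayers import NLayerDiscriminator

# Sketch: the same class, built both ways via norm_type.
d_spectral = NLayerDiscriminator(input_nc=3, ndf=64, n_layers=3,
                                 norm_type='spectral')   # PSGAN setting
d_instance = NLayerDiscriminator(input_nc=3, ndf=64, n_layers=3,
                                 norm_type='instance')   # classic PatchGAN

score_map = d_spectral(paddle.randn([1, 3, 256, 256]))   # patch-level real/fake map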
ppgan/models/makeup_model.py @ d77cf3bc

...
@@ -132,7 +132,6 @@ class MakeupModel(BaseModel):
         The option 'direction' can be used to swap domain A and domain B.
         """
         self.real_A = paddle.to_tensor(input['image_A'])
-        print('real_a shape: ', self.real_A.shape)
         self.real_B = paddle.to_tensor(input['image_B'])
         self.c_m = paddle.to_tensor(input['consis_mask'])
         self.P_A = paddle.to_tensor(input['P_A'])
...
@@ -338,9 +337,9 @@ class MakeupModel(BaseModel):
         g_B_eye_loss_his = self.criterionL1(fake_B_eye_masked, fake_match_eye_B)
-        self.loss_G_A_his = (g_A_eye_loss_his + g_A_lip_loss_his +
-                             g_A_skin_loss_his * 0.1) * 0.1
-        self.loss_G_B_his = (g_B_eye_loss_his + g_B_lip_loss_his +
-                             g_B_skin_loss_his * 0.1) * 0.1
+        self.loss_G_A_his = (g_A_eye_loss_his + g_A_lip_loss_his +
+                             g_A_skin_loss_his * 0.1) * 0.01
+        self.loss_G_B_his = (g_B_eye_loss_his + g_B_lip_loss_his +
+                             g_B_skin_loss_his * 0.1) * 0.01
         #self.loss_G_A_his = self.criterionL1(tmp_1, tmp_2) * 2048 * 255
         #tmp_3 = self.hm_gt_B*self.hm_mask_weight_B
...
@@ -361,8 +360,8 @@ class MakeupModel(BaseModel):
                                           vgg_r) * lambda_B * lambda_vgg
-        self.loss_rec = (self.loss_cycle_A + self.loss_cycle_B +
-                         self.loss_A_vgg + self.loss_B_vgg) * 0.1
-        self.loss_idt = (self.loss_idt_A + self.loss_idt_B) * 0.1
+        self.loss_rec = (self.loss_cycle_A + self.loss_cycle_B +
+                         self.loss_A_vgg + self.loss_B_vgg) * 0.2
+        self.loss_idt = (self.loss_idt_A + self.loss_idt_B) * 0.2

         # bg consistency loss
         mask_A_consis = paddle.cast(
...
@@ -370,8 +369,8 @@ class MakeupModel(BaseModel):
             (self.mask_A == 10), dtype='float32') + paddle.cast(
                 (self.mask_A == 8), dtype='float32')
         mask_A_consis = paddle.unsqueeze(paddle.clip(mask_A_consis, 0, 1), 1)
-        self.loss_G_bg_consis = self.criterionL1(self.real_A * mask_A_consis,
-                                                 self.fake_A * mask_A_consis)
+        self.loss_G_bg_consis = self.criterionL1(self.real_A * mask_A_consis,
+                                                 self.fake_A * mask_A_consis) * 0.1

         # combined loss and calculate gradients
...
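The net effect is a re-weighting of the generator objective: the histogram-matching terms drop from 0.1 to 0.01, reconstruction and identity rise from 0.1 to 0.2, and the background-consistency L1 is newly scaled by 0.1. A schematic summary with dummy scalar stand-ins (the real terms are tensors computed in MakeupModel; the final combination line is elided in the diff, so only the per-term weights are shown):

# Schematic of the new loss weights (dummy values; not the real tensors).
g_eye = g_lip = g_skin = 1.0
loss_G_A_his = (g_eye + g_lip + g_skin * 0.1) * 0.01   # was * 0.1
cycle_A = cycle_B = vgg_A = vgg_B = 1.0
loss_rec = (cycle_A + cycle_B + vgg_A + vgg_B) * 0.2   # was * 0.1
idt_A = idt_B = 1.0
loss_idt = (idt_A + idt_B) * 0.2                       # was * 0.1
bg_l1 = 1.0
loss_G_bg_consis = bg_l1 * 0.1                         # L1 term newly scaled by 0.1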
ppgan/models/vgg.py @ d77cf3bc

...
@@ -14,211 +14,38 @@
 import paddle
 import paddle.nn as nn
 import paddle.nn.functional as F
 from paddle.utils.download import get_weights_path_from_url
+from paddle.vision.models.vgg import make_layers

-__all__ = ['VGG', 'vgg11', 'vgg13', 'vgg16', 'vgg19']
+cfg = [
+    64, 64, 'M', 128, 128, 'M', 256, 256, 256, 'M', 512, 512, 512, 'M', 512,
+    512, 512, 'M'
+]

 model_urls = {
     'vgg16': ('https://paddle-hapi.bj.bcebos.com/models/vgg16.pdparams',
-              'c788f453a3b999063e8da043456281ee')
+              '89bbffc0f87d260be9b8cdc169c991c4')
 }


-class Classifier(paddle.nn.Layer):
-    def __init__(self, num_classes, classifier_activation='softmax'):
-        super(Classifier, self).__init__()
-        self.linear1 = nn.Linear(512 * 7 * 7, 4096)
-        self.linear2 = nn.Linear(4096, 4096)
-        self.linear3 = nn.Linear(4096, num_classes)
-        self.relu = nn.ReLU()
-        self.dropout = nn.Dropout(0.5)
-        self.softmax = nn.Softmax()
-
-    def forward(self, x):
-        x = self.linear1(x)
-        x = self.relu(x)
-        x = self.dropout(x)
-        x = self.linear2(x)
-        x = self.relu(x)
-        x = self.dropout(x)
-        out = self.linear3(x)
-        out = self.softmax(out)
-        return out
-
-
-class VGG(paddle.nn.Layer):
-    """VGG model from
-    `"Very Deep Convolutional Networks For Large-Scale Image Recognition" <https://arxiv.org/pdf/1409.1556.pdf>`_
-
-    Args:
-        features (nn.Layer): vgg features create by function make_layers.
-        num_classes (int): output dim of last fc layer. If num_classes <=0, last fc layer
-            will not be defined. Default: 1000.
-        classifier_activation (str): activation for the last fc layer. Default: 'softmax'.
-
-    Examples:
-        .. code-block:: python
-
-            from paddle.incubate.hapi.vision.models import VGG
-            from paddle.incubate.hapi.vision.models.vgg import make_layers
-
-            vgg11_cfg = [64, 'M', 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M']
-
-            features = make_layers(vgg11_cfg)
-
-            vgg11 = VGG(features)
-    """
-    def __init__(self, features, num_classes=1000,
-                 classifier_activation='softmax'):
+class VGG(nn.Layer):
+    def __init__(self, features):
         super(VGG, self).__init__()
         self.features = features
-        self.num_classes = num_classes
-
-        if num_classes > 0:
-            classifier = Classifier(num_classes, classifier_activation)
-            self.classifier = self.add_sublayer("classifier",
-                                                nn.Sequential(classifier))

     def forward(self, x):
         x = self.features(x)
         #if self.num_classes > 0:
         #    x = fluid.layers.flatten(x, 1)
         #    x = self.classifier(x)
         return x


-def make_layers(cfg, batch_norm=False):
-    layers = []
-    in_channels = 3
-
-    for v in cfg:
-        if v == 'M':
-            layers += [nn.MaxPool2d(kernel_size=2, stride=2)]
-        else:
-            if batch_norm:
-                conv2d = nn.Conv2d(in_channels, v, kernel_size=3, padding=1)
-                layers += [conv2d, nn.BatchNorm2d(v), nn.ReLU()]
-            else:
-                conv2d = nn.Conv2d(in_channels, v, kernel_size=3, padding=1)
-                layers += [conv2d, nn.ReLU()]
-            in_channels = v
-
-    return nn.Sequential(*layers)
-
-
-cfgs = {
-    'A': [64, 'M', 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M'],
-    'B': [64, 64, 'M', 128, 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M'],
-    'D': [64, 64, 'M', 128, 128, 'M', 256, 256, 256, 'M', 512, 512, 512, 'M', 512, 512, 512, 'M'],
-    'E': [64, 64, 'M', 128, 128, 'M', 256, 256, 256, 256, 'M', 512, 512, 512, 512, 'M', 512, 512, 512, 512, 'M'],
-}
-
-
-def _vgg(arch, cfg, batch_norm, pretrained, **kwargs):
-    model = VGG(make_layers(cfgs[cfg], batch_norm=batch_norm),
-                num_classes=1000,
-                **kwargs)
-
+def vgg16(pretrained=False):
+    features = make_layers(cfg)
+    model = VGG(features)
     if pretrained:
-        #assert arch in model_urls, "{} model do not have a pretrained model now, you should set pretrained=False".format(
-        #    arch)
-        #weight_path = get_weights_path_from_url(model_urls[arch][0],
-        #                                        model_urls[arch][1])
-        #assert weight_path.endswith(
-        #    '.pdparams'), "suffix of weight must be .pdparams"
-        weight_path = './vgg16.pdparams'
+        weight_path = get_weights_path_from_url(model_urls['vgg16'][0],
+                                                model_urls['vgg16'][1])
         param, _ = paddle.load(weight_path)
         model.load_dict(param)

     return model
-
-
-def vgg11(pretrained=False, batch_norm=False, **kwargs):
-    """VGG 11-layer model
-
-    Args:
-        pretrained (bool): If True, returns a model pre-trained on ImageNet. Default: False.
-        batch_norm (bool): If True, returns a model with batch_norm layer. Default: False.
-
-    Examples:
-        .. code-block:: python
-
-            from paddle.incubate.hapi.vision.models import vgg11
-
-            # build model
-            model = vgg11()
-
-            # build vgg11 model with batch_norm
-            model = vgg11(batch_norm=True)
-    """
-    model_name = 'vgg11'
-    if batch_norm:
-        model_name += ('_bn')
-    return _vgg(model_name, 'A', batch_norm, pretrained, **kwargs)
-
-
-def vgg13(pretrained=False, batch_norm=False, **kwargs):
-    """VGG 13-layer model
-
-    Args:
-        pretrained (bool): If True, returns a model pre-trained on ImageNet. Default: False.
-        batch_norm (bool): If True, returns a model with batch_norm layer. Default: False.
-
-    Examples:
-        .. code-block:: python
-
-            from paddle.incubate.hapi.vision.models import vgg13
-
-            # build model
-            model = vgg13()
-
-            # build vgg13 model with batch_norm
-            model = vgg13(batch_norm=True)
-    """
-    model_name = 'vgg13'
-    if batch_norm:
-        model_name += ('_bn')
-    return _vgg(model_name, 'B', batch_norm, pretrained, **kwargs)
-
-
-def vgg16(pretrained=False, batch_norm=False, **kwargs):
-    """VGG 16-layer model
-
-    Args:
-        pretrained (bool): If True, returns a model pre-trained on ImageNet. Default: False.
-        batch_norm (bool): If True, returns a model with batch_norm layer. Default: False.
-
-    Examples:
-        .. code-block:: python
-
-            from paddle.incubate.hapi.vision.models import vgg16
-
-            # build model
-            model = vgg16()
-
-            # build vgg16 model with batch_norm
-            model = vgg16(batch_norm=True)
-    """
-    model_name = 'vgg16'
-    if batch_norm:
-        model_name += ('_bn')
-    return _vgg(model_name, 'D', batch_norm, pretrained, **kwargs)
-
-
-def vgg19(pretrained=False, batch_norm=False, **kwargs):
-    """VGG 19-layer model
-
-    Args:
-        pretrained (bool): If True, returns a model pre-trained on ImageNet. Default: False.
-        batch_norm (bool): If True, returns a model with batch_norm layer. Default: False.
-
-    Examples:
-        .. code-block:: python
-
-            from paddle.incubate.hapi.vision.models import vgg19
-
-            # build model
-            model = vgg19()
-
-            # build vgg19 model with batch_norm
-            model = vgg19(batch_norm=True)
-    """
-    model_name = 'vgg19'
-    if batch_norm:
-        model_name += ('_bn')
-    return _vgg(model_name, 'E', batch_norm, pretrained, **kwargs)
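After the rewrite, vgg16 is a bare convolutional feature extractor with no classifier head, which is all a perceptual loss needs. A minimal usage sketch (pretrained=False to skip the weight download):

import paddle
from ppgan.models.vgg import vgg16

# Sketch: the simplified VGG returns conv features only.
model = vgg16(pretrained=False)
model.eval()

x = paddle.randn([1, 3, 224, 224])
feats = model(x)        # output of the last conv/pool stage, no FC head
print(feats.shape)      # [1, 512, 7, 7] for a 224x224 input (five /2 pools)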
ppgan/modules/norm.py
浏览文件 @
d77cf3bc
import
paddle
import
functools
import
paddle.nn
as
nn
from
.nn
import
Spectralnorm
class
Identity
(
nn
.
Layer
):
...
...
@@ -35,6 +36,8 @@ def build_norm_layer(norm_type='instance'):
bias_attr
=
paddle
.
ParamAttr
(
initializer
=
nn
.
initializer
.
Constant
(
0.0
),
learning_rate
=
0.0
,
trainable
=
False
))
elif
norm_type
==
'spectral'
:
norm_layer
=
functools
.
partial
(
Spectralnorm
)
elif
norm_type
==
'none'
:
def
norm_layer
(
x
):
...
...
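build_norm_layer returns a factory keyed by norm_type; for 'spectral' the factory wraps an existing layer rather than creating a standalone norm, matching how nlayers.py applies Spectralnorm directly to a Conv2d. A minimal sketch of that usage:

import paddle.nn as nn
from ppgan.modules.norm import build_norm_layer

# Sketch: the 'spectral' factory wraps a layer in spectral normalization.
norm_layer = build_norm_layer('spectral')
conv = nn.Conv2d(3, 64, kernel_size=4, stride=2, padding=1)
sn_conv = norm_layer(conv)   # Spectralnorm-wrapped convolution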