files

3 years ago · 3ed918cf34
12 changed files with 244 additions and 0 deletions
--- a/copy.md
+++ b/copy.md
@ -0,0 +1,54 @@
+# AnimeGanV2 Style-Transfer Operator
+
+Authors: filip
+
+## Overview
+
+AnimeGanV2 is a style-transfer network that transforms images so that they look like frames from an anime movie.
+
+## Interface
+
+```python
+__init__(self, model_name: str, framework: str = 'pytorch')
+```
+
+**Args:**
+
+- model_name:
+  - which weights to use for inference.
+  - supports 'celeba', 'facepaintv1', 'facepaintv2', 'hayao', 'paprika', 'shinkai'
+- framework:
+  - the framework of the model
+  - supported types: `str`, default is 'pytorch'
+
+```python
+__call__(self,  image: 'towhee.types.Image')
+```
+
+**Args:**
+
+- image:
+  - the input image
+  - supported types: `towhee.types.Image`
+
+**Returns:**
+
+The Operator returns a tuple `Tuple[('styled_image', numpy.ndarray)]` containing the following fields:
+
+- styled_image:
+  - styled photo
+  - data type: `numpy.ndarray`
+  - shape: (3, H, W), where H and W are the height and width of the input image
+  - format: RGB
+  - values: [0,1]
+
+## Requirements
+
+You can install the required Python packages from [requirements.txt](./requirements.txt).
+
+
+## Reference
+
+Jie Chen, Gang Liu, Xin Chen
+"AnimeGAN: A Novel Lightweight GAN for Photo Animation."
+ISICA 2019: Artificial Intelligence Algorithms and Applications pp 242-256, 2019.
--- a/init.py
+++ b/init.py
@ -0,0 +1,3 @@
+from .animegan import Animegan
+def animegan(name):
+    return Animegan(name)
--- a/animegan.py
+++ b/animegan.py
@ -0,0 +1,34 @@
+import os
+from pathlib import Path
+from torchvision import transforms
+
+from towhee import register
+from towhee.operator import Operator, OperatorFlag
+from towhee.types import arg, to_image_color
+from towhee._types import Image
+import warnings
+warnings.filterwarnings('ignore')
+
+@register(output_schema=['styled_image'], flag=OperatorFlag.STATELESS | OperatorFlag.REUSEABLE,)
+class Animegan(Operator):
+    """
+    PyTorch model for image embedding.
+    """
+    def __init__(self, model_name: str, framework: str = 'pytorch') -> None:
+        super().__init__()
+        if framework == 'pytorch':
+            import importlib.util
+            path = os.path.join(str(Path(__file__).parent), 'pytorch', 'model.py')
+            opname = os.path.basename(str(Path(__file__))).split('.')[0]
+            spec = importlib.util.spec_from_file_location(opname, path)
+            module = importlib.util.module_from_spec(spec)
+            spec.loader.exec_module(module)
+        self.model = module.Model(model_name)
+        self.tfms = transforms.Compose([
+                                        transforms.ToTensor()
+                                    ])
+    @arg(1, to_image_color('RGB') )
+    def __call__(self, image):
+        img = self.tfms(image).unsqueeze(0)
+        styled_image = self.model(img)
+        return Image(styled_image, 'RGB')
--- a/pytorch/init.py
+++ b/pytorch/init.py
--- a/pytorch/model.py
+++ b/pytorch/model.py
@ -0,0 +1,133 @@
+from torch import nn, load, Tensor
+import os
+from pathlib import Path
+
+
+class ConvNormLReLU(nn.Sequential):
+    def __init__(self, in_ch, out_ch, kernel_size=3, stride=1, padding=1, pad_mode="reflect", groups=1, bias=False):
+        
+        pad_layer = {
+            "zero":    nn.ZeroPad2d,
+            "same":    nn.ReplicationPad2d,
+            "reflect": nn.ReflectionPad2d,
+        }
+        if pad_mode not in pad_layer:
+            raise NotImplementedError
+            
+        super(ConvNormLReLU, self).__init__(
+            pad_layer[pad_mode](padding),
+            nn.Conv2d(in_ch, out_ch, kernel_size=kernel_size, stride=stride, padding=0, groups=groups, bias=bias),
+            nn.GroupNorm(num_groups=1, num_channels=out_ch, affine=True),
+            nn.LeakyReLU(0.2, inplace=True)
+        )
+
+
+class InvertedResBlock(nn.Module):
+    def __init__(self, in_ch, out_ch, expansion_ratio=2):
+        super(InvertedResBlock, self).__init__()
+
+        self.use_res_connect = in_ch == out_ch
+        bottleneck = int(round(in_ch*expansion_ratio))
+        layers = []
+        if expansion_ratio != 1:
+            layers.append(ConvNormLReLU(in_ch, bottleneck, kernel_size=1, padding=0))
+        
+        # dw
+        layers.append(ConvNormLReLU(bottleneck, bottleneck, groups=bottleneck, bias=True))
+        # pw
+        layers.append(nn.Conv2d(bottleneck, out_ch, kernel_size=1, padding=0, bias=False))
+        layers.append(nn.GroupNorm(num_groups=1, num_channels=out_ch, affine=True))
+
+        self.layers = nn.Sequential(*layers)
+        
+    def forward(self, input):
+        out = self.layers(input)
+        if self.use_res_connect:
+            out = input + out
+        return out
+
+    
+class Generator(nn.Module):
+    def __init__(self, ):
+        super().__init__()
+        
+        self.block_a = nn.Sequential(
+            ConvNormLReLU(3,  32, kernel_size=7, padding=3),
+            ConvNormLReLU(32, 64, stride=2, padding=(0,1,0,1)),
+            ConvNormLReLU(64, 64)
+        )
+        
+        self.block_b = nn.Sequential(
+            ConvNormLReLU(64,  128, stride=2, padding=(0,1,0,1)),            
+            ConvNormLReLU(128, 128)
+        )
+        
+        self.block_c = nn.Sequential(
+            ConvNormLReLU(128, 128),
+            InvertedResBlock(128, 256, 2),
+            InvertedResBlock(256, 256, 2),
+            InvertedResBlock(256, 256, 2),
+            InvertedResBlock(256, 256, 2),
+            ConvNormLReLU(256, 128),
+        )    
+        
+        self.block_d = nn.Sequential(
+            ConvNormLReLU(128, 128),
+            ConvNormLReLU(128, 128)
+        )
+
+        self.block_e = nn.Sequential(
+            ConvNormLReLU(128, 64),
+            ConvNormLReLU(64,  64),
+            ConvNormLReLU(64,  32, kernel_size=7, padding=3)
+        )
+
+        self.out_layer = nn.Sequential(
+            nn.Conv2d(32, 3, kernel_size=1, stride=1, padding=0, bias=False),
+            nn.Tanh()
+        )
+        
+    def forward(self, input, align_corners=True):
+        out = self.block_a(input)
+        half_size = out.size()[-2:]
+        out = self.block_b(out)
+        out = self.block_c(out)
+        
+        if align_corners:
+            out = nn.functional.interpolate(out, half_size, mode="bilinear", align_corners=True)
+        else:
+            out = nn.functional.interpolate(out, scale_factor=2, mode="bilinear", align_corners=False)
+        out = self.block_d(out)
+
+        if align_corners:
+            out = nn.functional.interpolate(out, input.size()[-2:], mode="bilinear", align_corners=True)
+        else:
+            out = nn.functional.interpolate(out, scale_factor=2, mode="bilinear", align_corners=False)
+        out = self.block_e(out)
+
+        out = self.out_layer(out)
+        return out
+
+class Model():
+    def __init__(self, model_name) -> None:
+        self._model = Generator()
+        path = os.path.join(str(Path(__file__).parent), 'weights', model_name + '.pt')
+        ckpt = load(path)
+        self._model.load_state_dict(ckpt)
+        self._model.eval()
+        
+
+    def __call__(self, img_tensor: Tensor):
+        img_tensor = img_tensor * 2 - 1
+        out = self._model(img_tensor).detach()
+        out = out.squeeze(0).clip(-1, 1) * 0.5 + 0.5
+        return out.numpy()
+ 
+    def train(self):
+         """
+         For training model
+         """
+         pass
+
+    
+        
--- a/pytorch/weights/celeba.pt
+++ b/pytorch/weights/celeba.pt
--- a/pytorch/weights/facepaintv1.pt
+++ b/pytorch/weights/facepaintv1.pt
--- a/pytorch/weights/facepaintv2.pt
+++ b/pytorch/weights/facepaintv2.pt
--- a/pytorch/weights/hayao.pt
+++ b/pytorch/weights/hayao.pt
--- a/pytorch/weights/paprika.pt
+++ b/pytorch/weights/paprika.pt
--- a/pytorch/weights/shinkai.pt
+++ b/pytorch/weights/shinkai.pt
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1,2 @@
+pathlib
+torchvision