update

Signed-off-by: junjie.jiang <junjie.jiang@zilliz.com>
3 years ago · e582a9204c
4 changed files with 92 additions and 1 deletions
--- a/README.md
+++ b/README.md
@ -1,2 +1,2 @@
-# clip-vision
+# clip_vision

--- a/init.py
+++ b/init.py
@ -0,0 +1,19 @@
+# Copyright 2021 Zilliz. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+
+from .clip_vision import ClipVision
+
+def clip_vision(**kwargs):
+    return ClipVision(**kwargs)
--- a/clip_vision.py
+++ b/clip_vision.py
@ -0,0 +1,71 @@
+# Copyright 2021 Zilliz. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import torch
+import numpy as np
+from torchvision import transforms as T
+
+from towhee.operator import NNOperator
+from towhee.models import clip
+
+
+class Model:
+    def __init__(self, model_name, device='cpu'):
+        self.model = clip.create_model(model_name=model_name, pretrained=True, device=device).visual
+        self.model.eval()
+
+    def __call__(self, data: 'Tensor'):
+        return self.model(data)
+
+
+class ClipVision(NNOperator):
+    def __init__(self, model_name='clip_vit_b32'):
+        super().__init__()
+        
+        self.tfms = torch.nn.Sequential(
+            T.Resize(224, interpolation=T.InterpolationMode.BICUBIC),
+            T.CenterCrop(224),
+            T.ConvertImageDtype(torch.float),
+            T.Normalize(
+                (0.48145466, 0.4578275, 0.40821073), (0.26862954, 0.26130258, 0.27577711))
+        ).to(self.device)
+        self.model = Model(model_name, self.device)
+
+    @property
+    def device(self):
+        if self._device_id < 0:
+            return 'cpu'
+        else:
+            return self._device_id
+
+    def __call__(self, image: 'Image'):
+        img = np.transpose(image, [2, 0, 1])
+        data = torch.from_numpy(img)
+        data = data.to(self.device)
+        image_tensor = self.tfms(img)
+        features = self.model(image_tensor)
+        return features.detach().cpu().numpy().flatten()
+
+    def save_model(self, model_type, output_file, args=None):
+        if model_type != 'onnx':
+            return False
+        x = torch.randn((1, 3, 224, 224))
+
+        torch.onnx.export(self.model, x, output_file, input_names=['INPUT0'],
+                          output_names=['OUTPUT0'],  dynamic_axes={'INPUT0': [0]})
+        return True
+
+    @property
+    def supported_formats(self):
+        return ['onnx']
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1 @@
+onnxruntime