diff --git a/clip.py b/clip.py index a52aa9b..1db657c 100644 --- a/clip.py +++ b/clip.py @@ -49,7 +49,7 @@ class Clip(NNOperator): vec = self._inference_from_text(data) else: raise ValueError("modality[{}] not implemented.".format(self._modality)) - return vec.detach().cpu().numpy() + return vec.detach().cpu().numpy().flatten() def _inference_from_text(self, text): text = self.tokenize(text).to(self.device)