|
|
|
# Copyright 2021 Zilliz. All rights reserved.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
|
|
|
|
|
|
|
from openai import Embedding
|
|
|
|
from tenacity import retry, stop_after_attempt, wait_random_exponential
|
|
|
|
from towhee.operator.base import PyOperator
|
|
|
|
|
|
|
|
|
|
|
|
class AzureOpenaiEmbeding(PyOperator):
|
|
|
|
def __init__(self,
|
|
|
|
model_name='text-embedding-ada-002',
|
|
|
|
api_type: str = 'azure',
|
|
|
|
api_version: str = '2023-07-01-preview',
|
|
|
|
api_key=None,
|
|
|
|
api_base=None):
|
|
|
|
self._engine = model_name
|
|
|
|
self._api_type = api_type
|
|
|
|
self._api_version = api_version
|
|
|
|
self._api_key = api_key
|
|
|
|
self._api_base = api_base
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
@retry(wait=wait_random_exponential(min=1, max=20), stop=stop_after_attempt(6))
|
|
|
|
def _call(self, text):
|
|
|
|
text = text.replace("\n", " ")
|
|
|
|
return Embedding.create(input=[text],
|
|
|
|
engine=self._engine,
|
|
|
|
api_key=self._api_key,
|
|
|
|
api_type=self._api_type,
|
|
|
|
api_version=self._api_version,
|
|
|
|
api_base=self._api_base
|
|
|
|
)["data"][0]["embedding"]
|
|
|
|
|
|
|
|
def __call__(self, text):
|
|
|
|
return self._call(text)
|
|
|
|
|
|
|
|
@staticmethod
|
|
|
|
def supported_model_names():
|
|
|
|
model_list = [
|
|
|
|
'text-embedding-ada-002',
|
|
|
|
'text-similarity-davinci-001',
|
|
|
|
'text-similarity-curie-001',
|
|
|
|
'text-similarity-babbage-001',
|
|
|
|
'text-similarity-ada-001'
|
|
|
|
]
|
|
|
|
model_list.sort()
|
|
|
|
return model_list
|
|
|
|
|