Add files

Signed-off-by: Jael Gu <mengjia.gu@zilliz.com>
3 years ago · ef9429c86b
4 changed files with 177 additions and 1 deletions
--- a/README.md
+++ b/README.md
@ -1,2 +1,85 @@
 # Ernie
 # 文心一言
 *author: Jael*
 <br />
 ## Description
 A LLM operator generates answer given prompt in messages using a large language model or service.
 This operator is implemented with Ernie Bot from [Baidu](https://cloud.baidu.com/wenxin.html).
 Please note you will need [Ernie API key & Secret key](https://ai.baidu.com/ai-doc/REFERENCE/Lkru0zoz4) to access the service.
 <br />
 ## Code Example
 Use the default model to continue the conversation from given messages.
 *Write a pipeline with explicit inputs/outputs name specifications:*
 ```python
 from towhee import pipe, ops
 p = (
    pipe.input('messages')
        .map('messages', 'answer', ops.LLM.Ernie(api_key=ERNIE_API_KEY, secret_key=ERNIE_SECRET_KEY))
        .output('messages', 'answer')
 )
 messages=[
        {'question': 'Zilliz Cloud 是什么？', 'answer': 'Zilliz Cloud 是一种全托管的向量检索服务。'},
        {'question': '它和 Milvus 的关系是什么？'}
    ]
 answer = p(messages).get()[0]
 ```
 <br />
 ## Factory Constructor
 Create the operator via the following factory method:
 ***LLM.Ernie(api_key: str, secret_key: str)***
 **Parameters:**
 ***api_key***: *str=None*
 The Ernie API key in string, defaults to None. If None, it will use the environment variable `ERNIE_API_KEY`.
 ***secret_key***: *str=None*
 The Ernie Secret key in string, defaults to None. If None, it will use the environment variable `ERNIE_SECRET_KEY`.
 ***\*\*kwargs***
 Other OpenAI parameters such as temperature, etc.
 <br />
 ## Interface
 The operator takes a piece of text in string as input.
 It returns answer in json.
 ***\_\_call\_\_(txt)***
 **Parameters:**
 ***messages***: *list*
 	A list of messages to set up chat.
 Must be a list of dictionaries with key value from "question", "answer". For example, [{"question": "a past question?", "answer": "a past answer."}, {"question": "current question?"}].
 It also accepts the orignal Ernie message format like [{"role": "user", "content": "a question?"}, {"role": "assistant", "content": "an answer."}]
 **Returns**:
 *answer: str*
 	The next answer generated by role "assistant".
 <br />
--- a/init.py
+++ b/init.py
@ -0,0 +1,5 @@
 from .ernie_chat import ErnieChat
 def Ernie(*args, **kwargs):
    return ErnieChat(*args, **kwargs)
--- a/ernie_chat.py
+++ b/ernie_chat.py
@ -0,0 +1,87 @@
 # Copyright 2021 Zilliz. All rights reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import os
 import requests
 import json
 from typing import List
 from towhee.operator.base import PyOperator
 class ErnieChat(PyOperator):
    '''Wrapper of OpenAI Chat API'''
    def __init__(self,
                 api_key: str = None,
                 secret_key: str = None,
                 **kwargs
                 ):
        self.api_key = api_key or os.getenv('ERNIE_API_KEY')
        self.secret_key = secret_key or os.getenv('ERNIE_SECRET_KEY')
        self.kwargs = kwargs
        try:
            self.access_token = self.get_access_token(api_key=self.api_key, secret_key=self.secret_key)
        except Exception as e:
            raise RuntimeError(f'Failed to get access token: {e}')
        self.url = 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/completions?access_token=' \
            + self.access_token
    def __call__(self, messages: List[dict]):
        messages = self.parse_inputs(messages)
        self.kwargs['messages'] = messages
        payload = json.dumps(self.kwargs)
        headers = {
            'Content-Type': 'application/json'
        }
        response = requests.request('POST', self.url, headers=headers, data=payload)
        # if self.kwargs.get('stream', False):
        #     return self.stream_output(response)
        answer = response.json()['result']
        return answer
    def parse_inputs(self, messages: List[dict]):
        assert isinstance(messages, list), \
            'Inputs must be a list of dictionaries with keys from ["question", "answer"] or ["role", "content"].'
        new_messages = []
        for m in messages:
            if ('role' and 'content' in m) and (m['role'] in ['assistant', 'user']):
                new_messages.append(m)
            else:
                for k, v in m.items():
                    if k == 'question':
                        new_m = {'role': 'user', 'content': v}
                    elif k == 'answer':
                        new_m = {'role': 'assistant', 'content': v}
                    else:
                        'Invalid message key: only accept key value from ["question", "answer"].'
                    new_messages.append(new_m)
        return new_messages
    def stream_output(self, response):
         # todo
         pass
    @staticmethod
    def get_access_token(api_key, secret_key):
        url = 'https://aip.baidubce.com/oauth/2.0/token'
        params = {
            'grant_type': 'client_credentials',
            'client_id': api_key,
            'client_secret': secret_key
            }
        return str(requests.post(url, params=params).json().get('access_token'))
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1 @@
 requests