
commit 28419844ff (main)
Author: Jael Gu (2 years ago)

    Update

    Signed-off-by: Jael Gu <mengjia.gu@zilliz.com>
Changed files:
  1. README.md (8 changes)
  2. auto_transformers.py (56 changes)

README.md (8 changes)

@@ -48,7 +48,7 @@ Create the operator via the following factory method:
 The model name in string, defaults to None.
 If None, the operator will be initialized without specified model.
-Supported model names:
+Please note only supported models are tested by us:
 <details><summary>Albert</summary>
@@ -309,6 +309,12 @@ If None, the operator will download and load pretrained model by `model_name` fr
 <br />
+
+***device***: *str*
+
+The device in string, defaults to None. If None, it will enable "cuda" automatically when cuda is available.
+
+<br />
 ***tokenizer***: *object*
 The method to tokenize input text, defaults to None.
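
For context, a minimal usage sketch of the parameters documented above. This assumes AutoTransformers can be imported from auto_transformers.py and accepts the documented keyword arguments; the model name is only a placeholder, not part of this commit.

# Minimal sketch, assuming AutoTransformers is importable locally and takes the
# keyword arguments documented in README.md.
from transformers import AutoTokenizer
from auto_transformers import AutoTransformers

# Optional custom tokenizer; if left as None, one is loaded by model_name.
custom_tokenizer = AutoTokenizer.from_pretrained('bert-base-uncased')

op = AutoTransformers(
    model_name='bert-base-uncased',   # placeholder; use a tested model name
    device=None,                      # None enables "cuda" automatically when available
    tokenizer=custom_tokenizer,       # defaults to None
)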

auto_transformers.py (56 changes)

@@ -37,14 +37,33 @@ warnings.filterwarnings('ignore')
 os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'
 t_logging.set_verbosity_error()
 
+
+def create_model(model_name, checkpoint_path, device):
+    model = AutoModel.from_pretrained(model_name).to(device)
+    if hasattr(model, 'pooler') and model.pooler:
+        model.pooler = None
+    if checkpoint_path:
+        try:
+            state_dict = torch.load(checkpoint_path, map_location=device)
+            model.load_state_dict(state_dict)
+        except Exception:
+            log.error(f'Fail to load weights from {checkpoint_path}')
+    model.eval()
+    return model
+
+
 # @accelerate
 class Model:
-    def __init__(self, model):
-        self.model = model
+    def __init__(self, model_name, checkpoint_path, device):
+        self.device = device
+        self.model = create_model(model_name, checkpoint_path, device)
 
     def __call__(self, *args, **kwargs):
-        outs = self.model(*args, **kwargs, return_dict=True)
+        new_args = []
+        for x in args:
+            new_args.append(x.to(self.device))
+        new_kwargs = {}
+        for k, v in kwargs.items():
+            new_kwargs[k] = v.to(self.device)
+        outs = self.model(*new_args, **new_kwargs, return_dict=True)
         return outs['last_hidden_state']
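
The reworked Model wrapper builds the underlying transformer via create_model and moves every input tensor to its device inside __call__, so callers can tokenize without worrying about device placement. A minimal sketch of the equivalent flow with plain transformers and torch calls (the model name is a placeholder, not part of this commit):

# Sketch of the device-handling pattern introduced above, written with plain
# transformers/torch calls rather than the Model wrapper itself.
import torch
from transformers import AutoModel, AutoTokenizer

device = 'cuda' if torch.cuda.is_available() else 'cpu'
tokenizer = AutoTokenizer.from_pretrained('bert-base-uncased')
model = AutoModel.from_pretrained('bert-base-uncased').to(device).eval()

# Tokenize on CPU; tensors are moved to the model's device just before the call.
inputs = tokenizer('Hello, Towhee!', padding=True, truncation=True, return_tensors='pt')
inputs = {k: v.to(device) for k, v in inputs.items()}

with torch.no_grad():
    outs = model(**inputs, return_dict=True)
features = outs['last_hidden_state']  # what Model.__call__ returns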
@@ -75,17 +94,13 @@ class AutoTransformers(NNOperator):
         self.checkpoint_path = checkpoint_path
         if self.model_name:
-            model_list = self.supported_model_names()
-            assert model_name in model_list, f"Invalid model name: {model_name}. Supported model names: {model_list}"
-            self.model = Model(self._model)
-            if tokenizer is None:
-                try:
-                    self.tokenizer = AutoTokenizer.from_pretrained(model_name)
-                except Exception as e:
-                    log.error(f'Fail to load default tokenizer by name: {self.model_name}')
-                    raise e
-            else:
+            # model_list = self.supported_model_names()
+            # assert model_name in model_list, f"Invalid model name: {model_name}. Supported model names: {model_list}"
+            self.model = Model(model_name=self.model_name, checkpoint_path=self.checkpoint_path, device=self.device)
+            if tokenizer:
                 self.tokenizer = tokenizer
+            else:
+                self.tokenizer = AutoTokenizer.from_pretrained(self.model_name)
             if not self.tokenizer.pad_token:
                 self.tokenizer.pad_token = '[PAD]'
         else:
@@ -98,7 +113,7 @@ class AutoTransformers(NNOperator):
         else:
             txt = data
         try:
-            inputs = self.tokenizer(txt, padding=True, truncation=True, return_tensors="pt").to(self.device)
+            inputs = self.tokenizer(txt, padding=True, truncation=True, return_tensors='pt')
         except Exception as e:
             log.error(f'Fail to tokenize inputs: {e}')
             raise e
@@ -116,17 +131,7 @@ class AutoTransformers(NNOperator):
     @property
     def _model(self):
-        model = AutoModel.from_pretrained(self.model_name).to(self.device)
-        if hasattr(model, 'pooler') and model.pooler:
-            model.pooler = None
-        if self.checkpoint_path:
-            try:
-                state_dict = torch.load(self.checkpoint_path, map_location=self.device)
-                model.load_state_dict(state_dict)
-            except Exception:
-                log.error(f'Fail to load weights from {self.checkpoint_path}')
-        model.eval()
-        return model
+        return self.model.model
 
     def save_model(self, model_type: str = 'pytorch', output_file: str = 'default'):
         if output_file == 'default':
@@ -160,6 +165,7 @@ class AutoTransformers(NNOperator):
         elif model_type == 'onnx':
             from transformers.onnx.features import FeaturesManager
             from transformers.onnx import export
+            self._model = self._model.to('cpu')
             model_kind, model_onnx_config = FeaturesManager.check_supported_model_or_raise(
                 self._model, feature='default')
             onnx_config = model_onnx_config(self._model.config)
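
The ONNX branch now moves the model to CPU before export. For reference, a standalone sketch of the same transformers.onnx export path, assuming a transformers release that still ships transformers.onnx (newer versions defer to optimum); the model name and output path are placeholders:

# Standalone sketch of the transformers.onnx export path used above.
from pathlib import Path
from transformers import AutoModel, AutoTokenizer
from transformers.onnx import export
from transformers.onnx.features import FeaturesManager

model = AutoModel.from_pretrained('bert-base-uncased').to('cpu').eval()
tokenizer = AutoTokenizer.from_pretrained('bert-base-uncased')

# Pick the ONNX config registered for this architecture.
model_kind, model_onnx_config = FeaturesManager.check_supported_model_or_raise(
    model, feature='default')
onnx_config = model_onnx_config(model.config)

# Export with the config's default opset to a local file.
export(tokenizer, model, onnx_config, onnx_config.default_onnx_opset, Path('model.onnx'))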
