oleksandrfluxon
committed on
Commit
•
0519c83
1
Parent(s):
cd7796f
Update handler.py
Browse files — handler.py (+1, -2)
handler.py
CHANGED
@@ -7,7 +7,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer, AutoConfig
|
|
7 |
class EndpointHandler:
|
8 |
def __init__(self, path=""):
|
9 |
# load model and tokenizer from path
|
10 |
-
self.tokenizer = AutoTokenizer.from_pretrained("EleutherAI/gpt-neox-20b")
|
11 |
|
12 |
config = AutoConfig.from_pretrained(path, trust_remote_code=True)
|
13 |
# config.attn_config['attn_impl'] = 'triton'
|
@@ -22,7 +22,6 @@ class EndpointHandler:
|
|
22 |
)
|
23 |
# self.device = "cuda" if torch.cuda.is_available() else "cpu"
|
24 |
self.device = 'cuda'
|
25 |
-
print('===> device', device)
|
26 |
|
27 |
def __call__(self, data: Dict[str, Any]) -> Dict[str, str]:
|
28 |
# process input
|
|
|
7 |
class EndpointHandler:
|
8 |
def __init__(self, path=""):
|
9 |
# load model and tokenizer from path
|
10 |
+
self.tokenizer = AutoTokenizer.from_pretrained("EleutherAI/gpt-neox-20b", padding_side="left")
|
11 |
|
12 |
config = AutoConfig.from_pretrained(path, trust_remote_code=True)
|
13 |
# config.attn_config['attn_impl'] = 'triton'
|
|
|
22 |
)
|
23 |
# self.device = "cuda" if torch.cuda.is_available() else "cpu"
|
24 |
self.device = 'cuda'
|
|
|
25 |
|
26 |
def __call__(self, data: Dict[str, Any]) -> Dict[str, str]:
|
27 |
# process input
|