Kowsher
/

TokenTrails

Text Generation

text-generation-inference

Model card · Files and versions

Kowsher committed on Jul 18, 2023

Commit

cd690fb

·

1 Parent(s): 231705d

Update handler.py

Files changed (1) hide show

handler.py +5 -3

handler.py CHANGED Viewed

@@ -1,16 +1,18 @@
 import torch
 from typing import Any, Dict
-from transformers import AutoModelForCausalLM, AutoTokenizer
 from transformers.models.auto import modeling_auto
 class EndpointHandler:
     def __init__(self, path=""):
         # load model and tokenizer from path
-        self.tokenizer = AutoTokenizer.from_pretrained(path)
         self.model = AutoModelForCausalLM.from_pretrained(
-            path, device_map="auto", torch_dtype=torch.float16, trust_remote_code=True
         )
         self.device = "cuda" if torch.cuda.is_available() else "cpu"

 import torch
 from typing import Any, Dict
+from transformers import AutoModelForCausalLM, AutoTokenizer, AutoConfig
 from transformers.models.auto import modeling_auto
 class EndpointHandler:
     def __init__(self, path=""):
+        print('starting machine')
+        config = AutoConfig.from_pretrained("Kowsher/Egol_model", trust_remote_code=True)
         # load model and tokenizer from path
+        self.tokenizer = AutoTokenizer.from_pretrained(path, trust_remote_code=True)
         self.model = AutoModelForCausalLM.from_pretrained(
+            path, device_map="auto", torch_dtype=torch.float16, config = config, trust_remote_code=True
         )
         self.device = "cuda" if torch.cuda.is_available() else "cpu"