Update handler.py
Browse files - handler.py +1 -1
handler.py
CHANGED
|
@@ -10,7 +10,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "8192"))
|
|
| 10 |
|
| 11 |
class EndpointHandler:
|
| 12 |
def __init__(self, path=""):
|
| 13 |
-
self.model_name_or_path = "
|
| 14 |
self.tokenizer = AutoTokenizer.from_pretrained(self.model_name_or_path, use_fast=True, flash_atten=True)
|
| 15 |
self.model = AutoModelForCausalLM.from_pretrained(
|
| 16 |
self.model_name_or_path, torch_dtype=torch.bfloat16,
|
|
|
|
| 10 |
|
| 11 |
class EndpointHandler:
|
| 12 |
def __init__(self, path=""):
|
| 13 |
+
self.model_name_or_path = "threadshare/Peach-9B-8k-Roleplay"
|
| 14 |
self.tokenizer = AutoTokenizer.from_pretrained(self.model_name_or_path, use_fast=True, flash_atten=True)
|
| 15 |
self.model = AutoModelForCausalLM.from_pretrained(
|
| 16 |
self.model_name_or_path, torch_dtype=torch.bfloat16,
|