Spaces:
Sleeping
Sleeping
Commit ·
ce2f7c2
1
Parent(s): a97164c
fix
Browse files
app.py
CHANGED
|
@@ -15,9 +15,16 @@ from transformers import (
|
|
| 15 |
import torch.nn.functional as F
|
| 16 |
from collections import defaultdict
|
| 17 |
HF_TOKEN = os.getenv("HF_token")
|
| 18 |
-
CHAT_MODEL_ID = "
|
| 19 |
EMB_MODEL_ID = "mixedbread-ai/mxbai-embed-large-v1"
|
| 20 |
MAX_PROMPT_TOKENS = 8192
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 21 |
|
| 22 |
# ---------- new defaults & helper ------------------
|
| 23 |
DEFAULT_TEMP = 0.7
|
|
|
|
| 15 |
import torch.nn.functional as F
|
| 16 |
from collections import defaultdict
|
| 17 |
HF_TOKEN = os.getenv("HF_token")
|
| 18 |
+
CHAT_MODEL_ID = "meta-llama/Llama-3.1-8B-Instruct"
|
| 19 |
EMB_MODEL_ID = "mixedbread-ai/mxbai-embed-large-v1"
|
| 20 |
MAX_PROMPT_TOKENS = 8192
|
| 21 |
+
import transformers
|
| 22 |
+
pipeline = transformers.pipeline(
|
| 23 |
+
"text-generation",
|
| 24 |
+
model=CHAT_MODEL_ID,
|
| 25 |
+
model_kwargs={"torch_dtype": torch.bfloat16},
|
| 26 |
+
device_map="auto",
|
| 27 |
+
)
|
| 28 |
|
| 29 |
# ---------- new defaults & helper ------------------
|
| 30 |
DEFAULT_TEMP = 0.7
|