Cyantist8208 committed on
Commit
ce2f7c2
·
1 Parent(s): a97164c
Files changed (1) hide show
  1. app.py +8 -1
app.py CHANGED
@@ -15,9 +15,16 @@ from transformers import (
15
  import torch.nn.functional as F
16
  from collections import defaultdict
17
  HF_TOKEN = os.getenv("HF_token")
18
- CHAT_MODEL_ID = "NousResearch/Meta-Llama-3-8B-Instruct"
19
  EMB_MODEL_ID = "mixedbread-ai/mxbai-embed-large-v1"
20
  MAX_PROMPT_TOKENS = 8192
 
 
 
 
 
 
 
21
 
22
  # ---------- new defaults & helper ------------------
23
  DEFAULT_TEMP = 0.7
 
15
  import torch.nn.functional as F
16
  from collections import defaultdict
17
  HF_TOKEN = os.getenv("HF_token")
18
+ CHAT_MODEL_ID = "meta-llama/Llama-3.1-8B-Instruct"
19
  EMB_MODEL_ID = "mixedbread-ai/mxbai-embed-large-v1"
20
  MAX_PROMPT_TOKENS = 8192
21
+ import transformers
22
+ pipeline = transformers.pipeline(
23
+ "text-generation",
24
+ model=CHAT_MODEL_ID,
25
+ model_kwargs={"torch_dtype": torch.bfloat16},
26
+ device_map="auto",
27
+ )
28
 
29
  # ---------- new defaults & helper ------------------
30
  DEFAULT_TEMP = 0.7