Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -33,8 +33,8 @@ def load_pipeline():
|
|
| 33 |
index.add(kb_embeddings)
|
| 34 |
|
| 35 |
# 3. Load Generative LLM (CPU mode)
|
| 36 |
-
llama_tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2.5-
|
| 37 |
-
llama_model = AutoModelForCausalLM.from_pretrained("Qwen/Qwen2.5-
|
| 38 |
|
| 39 |
return distil_tokenizer, distil_model, kb, embedder, index, llama_tokenizer, llama_model
|
| 40 |
|
|
|
|
| 33 |
index.add(kb_embeddings)
|
| 34 |
|
| 35 |
# 3. Load Generative LLM (CPU mode)
|
| 36 |
+
llama_tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2.5-0.5B-Instruct")
|
| 37 |
+
llama_model = AutoModelForCausalLM.from_pretrained("Qwen/Qwen2.5-0.5B-Instruct", device_map="cpu")
|
| 38 |
|
| 39 |
return distil_tokenizer, distil_model, kb, embedder, index, llama_tokenizer, llama_model
|
| 40 |
|