Update main.py
Browse files
main.py
CHANGED
|
@@ -5,7 +5,7 @@ device = "cuda" # the device to load the model onto
|
|
| 5 |
|
| 6 |
from ctransformers import AutoModelForCausalLM
|
| 7 |
|
| 8 |
-
llm = AutoModelForCausalLM.from_pretrained("TheBloke/Mistral-7B-v0.1-GGUF", model_file="mistral-7b-v0.1.Q4_K_M.gguf", model_type="mistral", gpu_layers=
|
| 9 |
|
| 10 |
|
| 11 |
@app.route('/recommend', methods=['POST'])
|
|
|
|
| 5 |
|
| 6 |
from ctransformers import AutoModelForCausalLM
|
| 7 |
|
| 8 |
+
llm = AutoModelForCausalLM.from_pretrained("TheBloke/Mistral-7B-v0.1-GGUF", model_file="mistral-7b-v0.1.Q4_K_M.gguf", model_type="mistral", gpu_layers=00)
|
| 9 |
|
| 10 |
|
| 11 |
@app.route('/recommend', methods=['POST'])
|