Springboardmen committed on
Commit
4ad42f2
·
verified ·
1 Parent(s): f179e9f

Update model_loader.py

Browse files
Files changed (1) hide show
  1. model_loader.py +20 -13
model_loader.py CHANGED
@@ -1,13 +1,20 @@
1
- from transformers import AutoTokenizer, AutoModelForCausalLM
2
- import torch
3
-
4
- MODEL_NAME = "mistralai/Mistral-7B-Instruct-v0.2"
5
-
6
def load_model():
    """Load the tokenizer and causal language model named by MODEL_NAME.

    Returns:
        A ``(tokenizer, model)`` tuple, in that order.
    """
    tok = AutoTokenizer.from_pretrained(MODEL_NAME)

    # Half-precision weights, with device_map="auto" passed through to
    # from_pretrained unchanged.
    model_kwargs = {"torch_dtype": torch.float16, "device_map": "auto"}
    lm = AutoModelForCausalLM.from_pretrained(MODEL_NAME, **model_kwargs)

    return tok, lm
 
 
 
 
 
 
 
 
1
+ import requests
2
+ import os
3
+ from dotenv import load_dotenv
4
+
5
# Run load_dotenv() before HF_TOKEN is read from the environment below.
load_dotenv()

# Inference endpoint for the mistralai/Mistral-7B-Instruct-v0.2 model.
API_URL = "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2"

# Authorization header built from the HF_TOKEN environment variable.
# NOTE: if HF_TOKEN is unset this becomes the literal string "Bearer None".
headers = {"Authorization": "Bearer " + str(os.environ.get("HF_TOKEN"))}
9
+
10
def query_model(prompt, *, max_new_tokens=800, temperature=0.7, timeout=60):
    """POST *prompt* to API_URL and return the generated text.

    Args:
        prompt: Text sent as the ``"inputs"`` field of the request.
        max_new_tokens: Value sent as ``parameters.max_new_tokens``.
        temperature: Value sent as ``parameters.temperature``.
        timeout: Seconds passed to ``requests.post`` as its timeout.

    Returns:
        The ``"generated_text"`` field of the first item in the JSON response.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        requests.RequestException: On connection failures or timeouts.
        RuntimeError: If the response body does not have the expected
            ``[{"generated_text": ...}]`` shape.
    """
    payload = {
        "inputs": prompt,
        "parameters": {
            "max_new_tokens": max_new_tokens,
            "temperature": temperature,
        },
    }

    # requests has no default timeout; without one a stalled connection
    # would block the caller forever.
    response = requests.post(
        API_URL, headers=headers, json=payload, timeout=timeout
    )
    # Fail with the HTTP status instead of an opaque KeyError when the
    # endpoint returns an error object rather than a list of generations.
    response.raise_for_status()

    data = response.json()
    try:
        return data[0]["generated_text"]
    except (KeyError, IndexError, TypeError) as exc:
        raise RuntimeError(
            f"Unexpected response from inference API: {data!r}"
        ) from exc