Module_2 / model_api.py
srbhavya01's picture
Update model_api.py
c06dc28 verified
raw
history blame
718 Bytes
from huggingface_hub import InferenceClient
import os
def query_model(
    prompt,
    *,
    model="Qwen/Qwen2.5-7B-Instruct",
    system_prompt="You are a professional fitness trainer.",
    max_tokens=1500,
    temperature=0.7,
):
    """Send *prompt* to a hosted chat model and return the reply text.

    The request is a two-message chat: a system message (*system_prompt*)
    followed by a user message containing *prompt*. The access token is read
    from the ``HF_TOKEN`` environment variable on every call.

    Args:
        prompt: The user message to send. ``None`` and empty or
            whitespace-only strings are rejected without contacting the API.
        model: Model identifier passed to the chat-completion call.
        system_prompt: Content of the system message.
        max_tokens: Forwarded as ``max_tokens`` to the chat-completion call.
        temperature: Forwarded as ``temperature`` to the chat-completion call.

    Returns:
        The ``message.content`` of the first choice in the response. On any
        failure (including an invalid prompt) a string of the form
        ``"Error: <details>"`` is returned instead of raising, so callers can
        display the result directly.
    """
    # Reject obviously unusable prompts up front rather than spending a
    # remote request on them. Non-string prompts are passed through as before.
    if prompt is None or (isinstance(prompt, str) and not prompt.strip()):
        return "Error: prompt must be a non-empty string"

    try:
        hf_token = os.getenv("HF_TOKEN")
        # The provider is selected at the client level; "auto" leaves the
        # choice of inference provider to the library.
        client = InferenceClient(api_key=hf_token, provider="auto")
        response = client.chat.completions.create(
            model=model,
            messages=[
                {"role": "system", "content": system_prompt},
                {"role": "user", "content": prompt},
            ],
            max_tokens=max_tokens,
            temperature=temperature,
        )
        return response.choices[0].message.content
    except Exception as e:
        # Deliberate catch-all: this function reports every failure as an
        # "Error: ..." string instead of propagating the exception.
        return f"Error: {e}"