Spaces:

Sarupa
/

AI_Confidence_Layer

Sleeping

Upload 17 files

a66815f verified about 2 months ago

1.41 kB

	import os
	import requests
	from dotenv import load_dotenv, find_dotenv

	# Search upward from this file so it works whether you run from backend/ or root
	load_dotenv(find_dotenv(usecwd=False))

	HF_TOKEN = os.getenv("HF_TOKEN")
	# API_URL = "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.3"
	API_URL = "https://router.huggingface.co/v1/chat/completions"

	# Debug: confirm token is loading
	print(f"[DEBUG] HF_TOKEN loaded: {'YES ('+HF_TOKEN[:8]+'...)' if HF_TOKEN else 'NO - TOKEN IS NONE'}")

	headers = {
	"Authorization": f"Bearer {HF_TOKEN}",
	"Content-Type": "application/json",
	}

	def call_llm(prompt: str, temperature: float = 0.7, top_p: float = 0.9) -> str:
	payload = {
	"model": "Qwen/Qwen2.5-72B-Instruct",
	"messages": [{"role": "user", "content": prompt}],
	"temperature": temperature,
	"top_p": top_p,
	"max_tokens": 400,
	}
	try:
	response = requests.post(API_URL, headers=headers, json=payload, timeout=90)
	print(f"[DEBUG] HF API status: {response.status_code}")
	if response.status_code != 200:
	print(f"[DEBUG] HF API error response: {response.text[:300]}")
	response.raise_for_status()
	return response.json()["choices"][0]["message"]["content"]
	except Exception as e:
	print(f"[DEBUG] Error on temp={temperature}: {str(e)}")
	return f"Error: {str(e)}"