Update model_api.py
model_api.py  CHANGED  (+146, -68)
@@ -1,92 +1,170 @@
 from huggingface_hub import InferenceClient
 import os
+import requests
+import json
+
+LLAMA_MODEL = "meta-llama/Llama-3.2-3B-Instruct"  # Default model
+USE_LOCAL_OLLAMA = False  # Set to True if using local Ollama
 
 def query_model(prompt):
     """
-    Query the
+    Query the Llama model with the given prompt
+    Supports both Hugging Face Inference API and local Ollama
     """
     try:
-        return
-        # Initialize the client
-        client = InferenceClient(
-            model="mistralai/Mistral-7B-Instruct-v0.2",
-            token=HF_TOKEN
-        )
+        if USE_LOCAL_OLLAMA:
+            return query_ollama(prompt)
+        else:
+            return query_huggingface(prompt)
 
+    except Exception as e:
+        return f"Error generating workout plan: {str(e)}"
+
+def query_huggingface(prompt):
+    """
+    Query Llama via Hugging Face Inference API
+    """
+    HF_TOKEN = os.getenv("HF_TOKEN")
+
+    if not HF_TOKEN:
+        return "Error: HF_TOKEN not found. Please set your Hugging Face token in environment variables."
+
+    # Initialize the client with Llama model
+    client = InferenceClient(
+        model=LLAMA_MODEL,
+        token=HF_TOKEN
+    )
+
+    # Enhanced system prompt for better responses
+    system_prompt = """You are a certified professional fitness trainer with expertise in creating personalized workout plans.
+Always provide complete, detailed workout plans with:
+- Clear day-by-day structure
+- Specific exercises with sets, reps, and rest periods
+- Warm-up and cool-down recommendations
+- Safety considerations based on user's profile
+When asked for a 5-day plan, ensure ALL 5 days are included with clear day headers."""
+
+    # Make the API call
+    response = client.chat_completion(
+        messages=[
+            {"role": "system", "content": system_prompt},
+            {"role": "user", "content": prompt}
+        ],
+        max_tokens=3000,
+        temperature=0.7,
+        top_p=0.95
+    )
+
+    # Extract and return the response
+    workout_plan = response.choices[0].message.content
+
+    # Verify if the response contains all 5 days
+    days_found = sum([f"Day {i}" in workout_plan for i in range(1, 6)])
+
+    if days_found < 5:
+        # If incomplete, try one more time with more explicit instruction
+        retry_prompt = prompt + "\n\nIMPORTANT: The previous response was incomplete. Please ensure ALL 5 days (Day 1 through Day 5) are included in the plan. Each day should be clearly marked with 'Day X' header and include 4-6 exercises."
 
-        response = client.chat_completion(
+        retry_response = client.chat_completion(
             messages=[
                 {"role": "system", "content": system_prompt},
-                {"role": "user", "content":
+                {"role": "user", "content": retry_prompt}
             ],
-            max_tokens=3000,
-            temperature=0.7
+            max_tokens=3000,
+            temperature=0.7
+        )
+        workout_plan = retry_response.choices[0].message.content
+
+    return workout_plan
+
+def query_ollama(prompt):
+    """
+    Query Llama via local Ollama (completely free, no API key needed)
+    """
+    try:
+        response = requests.post(
+            "http://localhost:11434/api/generate",
+            json={
+                "model": "llama3.2:3b",  # or "llama3.2:1b" for lighter model
+                "prompt": f"""You are a certified professional fitness trainer. Create a comprehensive 5-day workout plan.
+
+{prompt}
+
+Provide a complete, detailed 5-day workout plan with clear day headers, exercises, sets, reps, and rest periods.""",
+                "stream": False,
+                "max_tokens": 3000,
+                "temperature": 0.7
+            }
         )
 
-        days_found = sum([f"Day {i}" in workout_plan for i in range(1, 6)])
-        if days_found < 5:
-            # If incomplete, try one more time with more explicit instruction
-            retry_prompt = prompt + "\n\nIMPORTANT: The previous response was incomplete. Please ensure ALL 5 days (Day 1 through Day 5) are included in the plan. Each day should be clearly marked with 'Day X' header and include 4-6 exercises."
+        if response.status_code == 200:
+            return response.json()["response"]
+        else:
+            return f"Error: Ollama returned status code {response.status_code}"
 
-                    {"role": "system", "content": system_prompt},
-                    {"role": "user", "content": retry_prompt}
-                ],
-                max_tokens=2500,
-                temperature=0.7
-            )
-            workout_plan = retry_response.choices[0].message.content
-        return workout_plan
+    except requests.exceptions.ConnectionError:
+        return "Error: Cannot connect to Ollama. Make sure Ollama is running locally (run 'ollama serve' in terminal)"
     except Exception as e:
-        return f"Error
+        return f"Error with Ollama: {str(e)}"
 
 def test_api_connection():
     """
     Test function to verify API connection
     """
     try:
+        if USE_LOCAL_OLLAMA:
+            # Test Ollama connection
+            response = requests.post(
+                "http://localhost:11434/api/generate",
+                json={
+                    "model": "llama3.2:3b",
+                    "prompt": "Say 'API connection successful' if you can read this.",
+                    "stream": False,
+                    "max_tokens": 50
+                }
+            )
+            if response.status_code == 200:
+                return True, "Ollama connection successful"
+            else:
+                return False, f"Ollama connection failed: {response.status_code}"
+        else:
+            # Test Hugging Face connection
+            HF_TOKEN = os.getenv("HF_TOKEN")
+            if not HF_TOKEN:
+                return False, "HF_TOKEN not found"
+
+            client = InferenceClient(
+                model=LLAMA_MODEL,
+                token=HF_TOKEN
+            )
+
+            response = client.chat_completion(
+                messages=[
+                    {"role": "system", "content": "You are a helpful assistant."},
+                    {"role": "user", "content": "Say 'API connection successful' if you can read this."}
+                ],
+                max_tokens=50,
+                temperature=0.1
+            )
+
+            return True, f"API connection successful (using {LLAMA_MODEL})"
 
     except Exception as e:
-        return False, f"API connection failed: {str(e)}"
+        return False, f"API connection failed: {str(e)}"
+
+def switch_model(model_name):
+    """
+    Switch to a different Llama model
+    """
+    global LLAMA_MODEL
+    LLAMA_MODEL = model_name
+    return f"Switched to {model_name}"
+
+def set_ollama_mode(use_ollama):
+    """
+    Switch between Hugging Face API and local Ollama
+    """
+    global USE_LOCAL_OLLAMA
+    USE_LOCAL_OLLAMA = use_ollama
+    mode = "local Ollama" if use_ollama else "Hugging Face API"
+    return f"Switched to {mode} mode"