Spaces:
Sleeping
Sleeping
vk committed on
Commit Β·
6e6fe5a
1
Parent(s): 233b45a
Improve recipe recommendations: better dessert detection and lightweight LLM
Browse files- Replace heavy Llama 2 with DialoGPT-small for HF Spaces
- Add comprehensive dessert/chocolate ingredient detection
- Implement priority-based recipe matching (dessert queries get 3x boost)
- Enhanced search algorithm with 18+ dessert-specific patterns
- Remove heavy dependencies (peft, accelerate, bitsandbytes)
- Fix issue where 'chocolate dessert' returned shrimp recipes
- app.py +312 -159
- requirements.txt +0 -2
app.py
CHANGED
|
@@ -4,7 +4,7 @@ from pydantic import BaseModel
|
|
| 4 |
from typing import List, Optional
|
| 5 |
import torch
|
| 6 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
| 7 |
-
|
| 8 |
import uvicorn
|
| 9 |
import os
|
| 10 |
import pandas as pd
|
|
@@ -249,151 +249,251 @@ def load_recipes():
|
|
| 249 |
raise Exception(f"Failed to load recipe database: {e}")
|
| 250 |
|
| 251 |
@torch.inference_mode()
|
| 252 |
-
def
|
| 253 |
-
"""Use
|
| 254 |
global tokenizer, model
|
| 255 |
|
| 256 |
-
|
| 257 |
-
|
| 258 |
-
return extract_query_features_simple(query_text, preferences, max_minutes)
|
| 259 |
|
| 260 |
-
#
|
| 261 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 262 |
|
| 263 |
-
|
|
|
|
| 264 |
|
| 265 |
-
|
|
|
|
|
|
|
| 266 |
|
| 267 |
-
|
| 268 |
-
|
| 269 |
-
|
| 270 |
-
# Generate a short response to extract ingredients/features
|
| 271 |
-
outputs = model.generate(
|
| 272 |
-
**inputs,
|
| 273 |
-
max_new_tokens=50,
|
| 274 |
-
temperature=0.3, # Lower temperature for more focused extraction
|
| 275 |
-
top_p=0.9,
|
| 276 |
-
do_sample=True,
|
| 277 |
-
pad_token_id=tokenizer.eos_token_id,
|
| 278 |
-
repetition_penalty=1.1
|
| 279 |
-
)
|
| 280 |
-
|
| 281 |
-
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
|
| 282 |
-
gpt2_extraction = response[len(extraction_prompt):].strip()
|
| 283 |
-
|
| 284 |
-
# Parse the GPT-2 response and combine with rule-based extraction
|
| 285 |
-
gpt2_features = parse_gpt2_extraction(gpt2_extraction)
|
| 286 |
-
rule_features = extract_query_features_simple(query_text, preferences, max_minutes)
|
| 287 |
-
|
| 288 |
-
# Combine both approaches
|
| 289 |
-
combined_features = {
|
| 290 |
-
'ingredients': list(set(gpt2_features.get('ingredients', []) + rule_features['ingredients'])),
|
| 291 |
-
'cuisines': list(set(gpt2_features.get('cuisines', []) + rule_features['cuisines'])),
|
| 292 |
-
'diets': list(set(gpt2_features.get('diets', []) + rule_features['diets'])),
|
| 293 |
-
'styles': list(set(gpt2_features.get('styles', []) + rule_features['styles'])),
|
| 294 |
-
'max_minutes': max_minutes,
|
| 295 |
-
}
|
| 296 |
-
|
| 297 |
-
combined_features['search_terms'] = (
|
| 298 |
-
combined_features['ingredients'] +
|
| 299 |
-
combined_features['cuisines'] +
|
| 300 |
-
combined_features['diets'] +
|
| 301 |
-
combined_features['styles']
|
| 302 |
-
)
|
| 303 |
-
|
| 304 |
-
print(f"π§ GPT-2 enhanced extraction: {combined_features['search_terms'][:8]}")
|
| 305 |
-
return combined_features
|
| 306 |
-
|
| 307 |
-
except Exception as e:
|
| 308 |
-
print(f"β οΈ GPT-2 extraction failed, using rule-based: {e}")
|
| 309 |
-
return extract_query_features_simple(query_text, preferences, max_minutes)
|
| 310 |
-
|
| 311 |
-
def parse_gpt2_extraction(gpt2_text):
|
| 312 |
-
"""Parse GPT-2's extraction response into structured features"""
|
| 313 |
-
text_lower = gpt2_text.lower()
|
| 314 |
|
| 315 |
-
#
|
| 316 |
-
|
| 317 |
-
common_ingredients = [
|
| 318 |
-
'chicken', 'beef', 'pork', 'fish', 'salmon', 'shrimp', 'tofu',
|
| 319 |
-
'pasta', 'rice', 'quinoa', 'bread', 'potatoes', 'noodles',
|
| 320 |
-
'tomatoes', 'onion', 'garlic', 'ginger', 'peppers', 'broccoli',
|
| 321 |
-
'spinach', 'carrots', 'mushrooms', 'avocado', 'lemon', 'lime',
|
| 322 |
-
'cheese', 'milk', 'eggs', 'butter', 'oil', 'flour', 'herbs',
|
| 323 |
-
'beans', 'lentils', 'chickpeas'
|
| 324 |
-
]
|
| 325 |
|
| 326 |
-
|
| 327 |
-
|
| 328 |
-
ingredients.append(ing)
|
| 329 |
|
| 330 |
-
#
|
| 331 |
-
|
| 332 |
-
cuisine_words = ['italian', 'mexican', 'asian', 'chinese', 'thai', 'indian', 'greek', 'french', 'mediterranean']
|
| 333 |
-
for cuisine in cuisine_words:
|
| 334 |
-
if cuisine in text_lower:
|
| 335 |
-
cuisines.append(cuisine)
|
| 336 |
|
| 337 |
-
#
|
| 338 |
-
|
| 339 |
-
|
| 340 |
-
for diet in diet_words:
|
| 341 |
-
if diet in text_lower:
|
| 342 |
-
diets.append(diet)
|
| 343 |
|
| 344 |
-
#
|
| 345 |
-
|
| 346 |
-
style_words = ['quick', 'easy', 'fast', 'slow', 'comfort', 'light', 'hearty', 'spicy']
|
| 347 |
-
for style in style_words:
|
| 348 |
-
if style in text_lower:
|
| 349 |
-
styles.append(style)
|
| 350 |
|
| 351 |
return {
|
| 352 |
'ingredients': ingredients,
|
| 353 |
-
'
|
| 354 |
-
'
|
| 355 |
-
'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 356 |
}
|
| 357 |
|
| 358 |
-
def
|
| 359 |
-
"""
|
| 360 |
-
|
| 361 |
|
| 362 |
-
#
|
| 363 |
-
|
| 364 |
-
'chicken', 'beef', 'pork', 'fish', 'salmon', 'shrimp', 'tofu',
|
| 365 |
-
'
|
| 366 |
-
'tomatoes', 'onion', 'garlic', 'ginger', 'peppers', 'broccoli',
|
| 367 |
-
'
|
| 368 |
-
'
|
| 369 |
-
'
|
| 370 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 371 |
|
| 372 |
-
|
|
|
|
|
|
|
|
|
|
| 373 |
|
| 374 |
-
|
| 375 |
-
|
| 376 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 377 |
|
| 378 |
-
#
|
| 379 |
-
|
| 380 |
-
|
| 381 |
|
| 382 |
-
#
|
| 383 |
-
|
| 384 |
-
|
|
|
|
|
|
|
| 385 |
|
| 386 |
return {
|
| 387 |
-
'ingredients':
|
| 388 |
-
'
|
| 389 |
-
'diets': mentioned_diets,
|
| 390 |
-
'styles': mentioned_styles,
|
| 391 |
-
'max_minutes': max_minutes,
|
| 392 |
-
'search_terms': mentioned_ingredients + mentioned_cuisines + mentioned_diets + mentioned_styles
|
| 393 |
}
|
| 394 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 395 |
def search_recipes(query_features, top_k=10):
|
| 396 |
-
"""
|
| 397 |
global recipes_df, vectorizer, recipe_vectors
|
| 398 |
|
| 399 |
if recipes_df is None:
|
|
@@ -405,7 +505,7 @@ def search_recipes(query_features, top_k=10):
|
|
| 405 |
if len(filtered_df) == 0:
|
| 406 |
filtered_df = recipes_df.copy() # Fall back to all recipes
|
| 407 |
|
| 408 |
-
# Create search query
|
| 409 |
search_query = ' '.join(query_features['search_terms'])
|
| 410 |
|
| 411 |
if search_query and vectorizer is not None:
|
|
@@ -438,20 +538,82 @@ def search_recipes(query_features, top_k=10):
|
|
| 438 |
print(f"β οΈ Similarity length mismatch: {len(similarities)} vs {len(filtered_df)}")
|
| 439 |
filtered_df['similarity'] = 0.5
|
| 440 |
|
| 441 |
-
#
|
| 442 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 443 |
for ingredient in query_features['ingredients']:
|
| 444 |
-
|
| 445 |
-
filtered_df
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 446 |
|
| 447 |
-
|
|
|
|
| 448 |
for cuisine in query_features['cuisines']:
|
| 449 |
-
mask = filtered_df['tags_text'].str.contains(cuisine, na=False) |
|
| 450 |
-
filtered_df['name'].str.lower().str.contains(cuisine, na=False)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 451 |
filtered_df.loc[mask, 'similarity'] *= 1.3
|
| 452 |
|
| 453 |
-
# Sort by similarity
|
| 454 |
filtered_df = filtered_df.sort_values('similarity', ascending=False)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 455 |
else:
|
| 456 |
# Fallback: random selection
|
| 457 |
filtered_df = filtered_df.sample(min(len(filtered_df), top_k*2), random_state=42)
|
|
@@ -465,46 +627,37 @@ async def load_model():
|
|
| 465 |
global tokenizer, model
|
| 466 |
|
| 467 |
try:
|
| 468 |
-
print("π Loading
|
|
|
|
|
|
|
|
|
|
| 469 |
|
| 470 |
# Load tokenizer
|
| 471 |
-
|
|
|
|
| 472 |
if tokenizer.pad_token is None:
|
| 473 |
tokenizer.pad_token = tokenizer.eos_token
|
| 474 |
|
| 475 |
-
# Load
|
| 476 |
-
print("
|
| 477 |
-
|
| 478 |
-
|
| 479 |
-
|
| 480 |
-
|
| 481 |
-
|
| 482 |
-
model = PeftModel.from_pretrained(
|
| 483 |
-
base_model,
|
| 484 |
-
"nutrientartcd/recipe-gpt2-lora"
|
| 485 |
-
).to(device)
|
| 486 |
-
print("β
LoRA adapter loaded successfully!")
|
| 487 |
-
except Exception as e:
|
| 488 |
-
print(f"β οΈ Could not load LoRA adapter: {e}")
|
| 489 |
-
print("π Using base GPT-2 model...")
|
| 490 |
-
model = base_model.to(device)
|
| 491 |
|
| 492 |
model.eval()
|
| 493 |
-
print(f"β
|
| 494 |
|
| 495 |
# Load recipe database
|
| 496 |
load_recipes()
|
| 497 |
|
| 498 |
except Exception as e:
|
| 499 |
-
print(f"β Error loading model: {e}")
|
| 500 |
-
print("
|
| 501 |
-
|
| 502 |
-
|
| 503 |
-
|
| 504 |
-
if tokenizer.pad_token is None:
|
| 505 |
-
tokenizer.pad_token = tokenizer.eos_token
|
| 506 |
-
model = AutoModelForCausalLM.from_pretrained("gpt2").to(device)
|
| 507 |
-
model.eval()
|
| 508 |
load_recipes()
|
| 509 |
|
| 510 |
# Health check endpoint
|
|
@@ -544,8 +697,8 @@ async def get_recipe_suggestions(request: RecipeRequest):
|
|
| 544 |
|
| 545 |
print(f"π₯ Recipe request: {request.ingredients}, prefs: {request.preferences}, time: {request.max_minutes}")
|
| 546 |
|
| 547 |
-
# Use
|
| 548 |
-
query_features =
|
| 549 |
request.ingredients,
|
| 550 |
request.preferences,
|
| 551 |
request.max_minutes
|
|
|
|
| 4 |
from typing import List, Optional
|
| 5 |
import torch
|
| 6 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
| 7 |
+
import json
|
| 8 |
import uvicorn
|
| 9 |
import os
|
| 10 |
import pandas as pd
|
|
|
|
| 249 |
raise Exception(f"Failed to load recipe database: {e}")
|
| 250 |
|
| 251 |
@torch.inference_mode()
|
| 252 |
+
def extract_query_features_with_llm(query_text, preferences="", max_minutes=30):
    """Parse a free-text recipe query into structured search features.

    Always runs the enhanced rule-based extractor as the baseline; when
    the DialoGPT model and tokenizer are loaded, additionally generates a
    conversational reply and merges any insights mined from it.

    Returns the feature dict produced by extract_enhanced_features /
    merge_feature_sets (includes a 'search_terms' list).
    """
    global tokenizer, model

    # Rule-based extraction is the reliable foundation; the LLM only augments it.
    base = extract_enhanced_features(query_text, preferences, max_minutes)

    if model is None or tokenizer is None:
        print(f"📋 Enhanced rule-based extraction: {base['search_terms'][:8]}")
        return base

    try:
        # Frame the query as a chat turn so DialoGPT can respond to it.
        prompt = f"User: I want to cook {query_text} {preferences}".strip()
        encoded = tokenizer.encode(prompt + tokenizer.eos_token, return_tensors="pt").to(device)

        # Short sampled generation just to surface intent keywords.
        generated = model.generate(
            encoded,
            max_new_tokens=50,
            temperature=0.7,
            top_p=0.9,
            do_sample=True,
            pad_token_id=tokenizer.pad_token_id,
            repetition_penalty=1.2,
        )

        # Decode only the newly generated tokens, skipping the prompt echo.
        reply = tokenizer.decode(generated[0][encoded.shape[1]:], skip_special_tokens=True)

        merged = merge_feature_sets(base, extract_insights_from_response(reply))

        print(f"🤖 DialoGPT-enhanced extraction: {merged['search_terms'][:8]}")
        return merged

    except Exception as e:
        print(f"⚠️ DialoGPT enhancement failed, using rule-based: {e}")

    print(f"📋 Enhanced rule-based extraction: {base['search_terms'][:8]}")
    return base
|
| 294 |
|
| 295 |
+
def extract_enhanced_features(query_text, preferences="", max_minutes=30):
    """Rule-based feature extraction tuned for recipe queries.

    Lower-cases the query text plus optional preferences and runs each
    category detector over the combined string, then flattens every
    detected category into a single 'search_terms' list.
    """
    text = (query_text + " " + (preferences or "")).lower()

    features = {
        'ingredients': detect_ingredients(text),
        'meal_types': detect_meal_types(text),
        'cuisines': detect_cuisines(text),
        'dietary_restrictions': detect_dietary_preferences(text),
        'cooking_styles': detect_cooking_styles(text),
        'cooking_methods': detect_cooking_methods(text),
        'flavors': detect_flavors(text),
        'max_minutes': max_minutes,
    }

    # Combined term list feeds the TF-IDF recipe search downstream.
    features['search_terms'] = (
        features['ingredients'] + features['meal_types'] + features['cuisines'] +
        features['dietary_restrictions'] + features['cooking_styles'] +
        features['cooking_methods'] + features['flavors']
    )
    return features
|
| 329 |
|
| 330 |
+
def detect_ingredients(query_lower):
    """Detect ingredient mentions in an already lower-cased query string.

    Matches whole words only, so 'apple' is no longer falsely found inside
    'pineapple' nor 'rice' inside 'price'. Ingredients in the dessert-key
    category additionally emit a 'sweet_'-prefixed marker that the search
    layer uses to boost dessert-context matches.

    Returns a de-duplicated list of matched terms (order not guaranteed).
    """
    import re

    # Comprehensive ingredient list including dessert ingredients.
    ingredient_patterns = {
        'proteins': ['chicken', 'beef', 'pork', 'fish', 'salmon', 'shrimp', 'tofu', 'eggs', 'turkey', 'lamb'],
        'starches': ['rice', 'pasta', 'quinoa', 'bread', 'potatoes', 'noodles', 'flour', 'oats'],
        'vegetables': ['tomatoes', 'onion', 'garlic', 'ginger', 'peppers', 'broccoli', 'spinach', 'carrots', 'mushrooms', 'avocado'],
        'dessert_key': ['chocolate', 'cocoa', 'sugar', 'vanilla', 'caramel', 'honey', 'maple syrup', 'cream', 'butter'],
        'fruits': ['apple', 'banana', 'berries', 'strawberry', 'blueberry', 'lemon', 'lime', 'orange'],
        'dairy': ['cheese', 'milk', 'yogurt', 'cream'],
        'nuts_spices': ['nuts', 'almonds', 'walnuts', 'cinnamon', 'nutmeg', 'herbs', 'basil'],
    }

    ingredients = []
    for category, items in ingredient_patterns.items():
        for item in items:
            # Word-boundary match avoids substring false positives.
            if re.search(r'\b' + re.escape(item) + r'\b', query_lower):
                ingredients.append(item)
                # Special emphasis marker for dessert-context boosting.
                if category == 'dessert_key':
                    ingredients.append(f"sweet_{item}")

    return list(set(ingredients))
|
| 354 |
+
|
| 355 |
+
def detect_meal_types(query_lower):
    """Classify the lower-cased query into meal types via keyword spotting.

    A meal type is reported when any of its indicator keywords occurs as a
    substring of the query; results preserve the pattern-table order.
    """
    meal_patterns = {
        'dessert': ['dessert', 'sweet', 'cake', 'cookie', 'pie', 'ice cream', 'pudding', 'tart', 'chocolate', 'candy'],
        'breakfast': ['breakfast', 'morning', 'brunch', 'cereal', 'pancake', 'waffle'],
        'lunch': ['lunch', 'midday', 'sandwich'],
        'dinner': ['dinner', 'supper', 'evening'],
        'snack': ['snack', 'appetizer', 'finger food'],
        'drink': ['drink', 'beverage', 'smoothie', 'juice'],
    }

    return [
        meal_type
        for meal_type, keywords in meal_patterns.items()
        if any(keyword in query_lower for keyword in keywords)
    ]
|
| 372 |
+
|
| 373 |
+
def detect_cuisines(query_lower):
    """Return every known cuisine name appearing in the lower-cased query."""
    known_cuisines = ['italian', 'mexican', 'asian', 'chinese', 'thai', 'indian', 'greek', 'french', 'mediterranean', 'american', 'japanese']
    found = []
    for name in known_cuisines:
        if name in query_lower:
            found.append(name)
    return found
|
| 377 |
+
|
| 378 |
+
def detect_dietary_preferences(query_lower):
    """Return dietary restriction/preference keywords found in the query."""
    found = []
    for diet in ('vegetarian', 'vegan', 'healthy', 'low-carb', 'keto', 'gluten-free', 'dairy-free'):
        if diet in query_lower:
            found.append(diet)
    return found
|
| 382 |
+
|
| 383 |
+
def detect_cooking_styles(query_lower):
    """Detect cooking-style keywords as whole words.

    Whole-word matching fixes false positives from plain substring tests,
    e.g. the style 'fast' being detected inside the word 'breakfast'.
    """
    import re

    styles = ['quick', 'easy', 'fast', 'slow', 'comfort', 'light', 'hearty', 'simple']
    return [style for style in styles if re.search(r'\b' + style + r'\b', query_lower)]
|
| 387 |
+
|
| 388 |
+
def detect_cooking_methods(query_lower):
    """Return cooking-method keywords found in the lower-cased query."""
    found = []
    for method in ('baked', 'fried', 'grilled', 'roasted', 'steamed', 'boiled', 'sauteed'):
        if method in query_lower:
            found.append(method)
    return found
|
| 392 |
+
|
| 393 |
+
def detect_flavors(query_lower):
    """Return flavor-profile keywords found in the lower-cased query."""
    found = []
    for flavor in ('sweet', 'spicy', 'savory', 'sour', 'creamy', 'crispy'):
        if flavor in query_lower:
            found.append(flavor)
    return found
|
| 397 |
+
|
| 398 |
+
def extract_insights_from_response(response_text):
    """Pull lightweight cooking signals out of a DialoGPT reply.

    Only generic food-talk indicator words are scanned for; no concrete
    ingredients are currently mined from the reply, so the 'ingredients'
    entry is always an empty list.
    """
    lowered = response_text.lower()
    indicators = ('recipe', 'cook', 'make', 'prepare', 'dish', 'meal', 'food')
    cooking_context = [word for word in indicators if word in lowered]

    return {
        'ingredients': [],
        'cooking_context': cooking_context,
    }
|
| 416 |
|
| 417 |
+
def merge_feature_sets(base_features, llm_insights):
    """Merge rule-based features with LLM-derived insights.

    Returns a new feature dict; *base_features* is left unmodified. The
    previous implementation used a shallow dict.copy(), so extending
    'ingredients' mutated the caller's list in place — fixed by copying
    the list before extending.
    """
    merged = base_features.copy()
    # Shallow copy shares the nested list; copy it so the input stays intact.
    merged['ingredients'] = list(merged.get('ingredients', []))

    # Fold in LLM-supplied ingredients when present.
    if llm_insights.get('ingredients'):
        merged['ingredients'].extend(llm_insights['ingredients'])
        merged['ingredients'] = list(set(merged['ingredients']))  # de-duplicate

    # Rebuild the combined search-term list from every category.
    merged['search_terms'] = (
        merged['ingredients'] + merged['meal_types'] + merged['cuisines'] +
        merged['dietary_restrictions'] + merged['cooking_styles'] +
        merged['cooking_methods'] + merged['flavors']
    )

    return merged
|
| 435 |
+
|
| 436 |
+
def parse_llm_json_response(response_text):
    """Parse an LLM reply into the structured feature dict.

    Locates the outermost {...} span in the reply, decodes it as JSON and
    normalises every expected feature key to a list. On any failure, falls
    back to scanning the raw text for a small set of known terms.
    """
    expected_keys = (
        'ingredients', 'meal_types', 'cuisines', 'dietary_restrictions',
        'cooking_styles', 'cooking_methods', 'flavors',
    )
    try:
        response_text = response_text.strip()

        # Isolate the outermost JSON object; anything around it is chatter.
        first_brace = response_text.find('{')
        last_brace = response_text.rfind('}') + 1
        if first_brace == -1 or last_brace == 0:
            raise ValueError("No JSON found in response")

        features = json.loads(response_text[first_brace:last_brace])

        # Guarantee every expected key exists and holds a list.
        for key in expected_keys:
            if key not in features:
                features[key] = []
            elif not isinstance(features[key], list):
                features[key] = [str(features[key])]

        return features

    except Exception as e:
        print(f"⚠️ JSON parsing failed: {e}")
        print(f"Response text: {response_text[:200]}...")

        # Fallback: keyword-scan the raw reply for a handful of known terms.
        text_lower = response_text.lower()
        return {
            'ingredients': extract_terms_from_text(text_lower, ['chocolate', 'vanilla', 'sugar', 'flour', 'butter', 'eggs', 'milk']),
            'meal_types': extract_terms_from_text(text_lower, ['dessert', 'breakfast', 'lunch', 'dinner', 'snack']),
            'cuisines': extract_terms_from_text(text_lower, ['italian', 'mexican', 'asian', 'french']),
            'dietary_restrictions': extract_terms_from_text(text_lower, ['vegetarian', 'vegan', 'gluten-free']),
            'cooking_styles': extract_terms_from_text(text_lower, ['quick', 'easy', 'healthy']),
            'cooking_methods': extract_terms_from_text(text_lower, ['baked', 'fried', 'grilled']),
            'flavors': extract_terms_from_text(text_lower, ['sweet', 'savory', 'spicy'])
        }
|
| 489 |
+
|
| 490 |
+
def extract_terms_from_text(text, terms_list):
    """Return the subset of *terms_list* whose entries occur in *text*."""
    matches = []
    for term in terms_list:
        if term in text:
            matches.append(term)
    return matches
|
| 493 |
+
|
| 494 |
+
|
| 495 |
def search_recipes(query_features, top_k=10):
|
| 496 |
+
"""Enhanced search for recipes matching the LLM-extracted features"""
|
| 497 |
global recipes_df, vectorizer, recipe_vectors
|
| 498 |
|
| 499 |
if recipes_df is None:
|
|
|
|
| 505 |
if len(filtered_df) == 0:
|
| 506 |
filtered_df = recipes_df.copy() # Fall back to all recipes
|
| 507 |
|
| 508 |
+
# Create search query from all LLM-extracted terms
|
| 509 |
search_query = ' '.join(query_features['search_terms'])
|
| 510 |
|
| 511 |
if search_query and vectorizer is not None:
|
|
|
|
| 538 |
print(f"β οΈ Similarity length mismatch: {len(similarities)} vs {len(filtered_df)}")
|
| 539 |
filtered_df['similarity'] = 0.5
|
| 540 |
|
| 541 |
+
# Apply intelligent boosting based on enhanced features
|
| 542 |
+
|
| 543 |
+
# HIGHEST PRIORITY: Meal type matches (especially dessert)
|
| 544 |
+
if query_features.get('meal_types'):
|
| 545 |
+
for meal_type in query_features['meal_types']:
|
| 546 |
+
# Check name, tags, and search text for meal type
|
| 547 |
+
mask = (filtered_df['name'].str.lower().str.contains(meal_type, na=False) |
|
| 548 |
+
filtered_df['tags_text'].str.contains(meal_type, na=False) |
|
| 549 |
+
filtered_df['search_text'].str.contains(meal_type, na=False))
|
| 550 |
+
filtered_df.loc[mask, 'similarity'] *= 3.0 # Very high boost
|
| 551 |
+
|
| 552 |
+
# Special handling for desserts - comprehensive dessert detection
|
| 553 |
+
if meal_type == 'dessert':
|
| 554 |
+
dessert_patterns = [
|
| 555 |
+
'chocolate', 'cocoa', 'sugar', 'vanilla', 'cake', 'cookie', 'pie',
|
| 556 |
+
'sweet', 'candy', 'cream', 'frosting', 'icing', 'dessert', 'pudding',
|
| 557 |
+
'brownie', 'tart', 'mousse', 'custard', 'fudge', 'caramel', 'honey'
|
| 558 |
+
]
|
| 559 |
+
for pattern in dessert_patterns:
|
| 560 |
+
mask = filtered_df['search_text'].str.contains(pattern, na=False)
|
| 561 |
+
filtered_df.loc[mask, 'similarity'] *= 2.5 # Strong dessert boost
|
| 562 |
+
|
| 563 |
+
# Also check recipe names for dessert indicators
|
| 564 |
+
dessert_name_patterns = ['cake', 'cookie', 'brownie', 'pie', 'tart', 'sweet', 'chocolate']
|
| 565 |
+
for pattern in dessert_name_patterns:
|
| 566 |
+
mask = filtered_df['name'].str.lower().str.contains(pattern, na=False)
|
| 567 |
+
filtered_df.loc[mask, 'similarity'] *= 2.8
|
| 568 |
+
|
| 569 |
+
# HIGH PRIORITY: Exact ingredient matches
|
| 570 |
+
if query_features.get('ingredients'):
|
| 571 |
for ingredient in query_features['ingredients']:
|
| 572 |
+
# Regular ingredient matching
|
| 573 |
+
mask = filtered_df['ingredients_text'].str.contains(ingredient.replace('sweet_', ''), na=False)
|
| 574 |
+
filtered_df.loc[mask, 'similarity'] *= 2.2
|
| 575 |
+
|
| 576 |
+
# Special handling for dessert ingredients with sweet_ prefix
|
| 577 |
+
if ingredient.startswith('sweet_'):
|
| 578 |
+
base_ingredient = ingredient.replace('sweet_', '')
|
| 579 |
+
mask = filtered_df['ingredients_text'].str.contains(base_ingredient, na=False)
|
| 580 |
+
# Check if recipe also has dessert context
|
| 581 |
+
dessert_context_mask = (
|
| 582 |
+
filtered_df['search_text'].str.contains('sweet|dessert|cake|cookie', na=False) |
|
| 583 |
+
filtered_df['tags_text'].str.contains('dessert|sweet', na=False)
|
| 584 |
+
)
|
| 585 |
+
combined_mask = mask & dessert_context_mask
|
| 586 |
+
filtered_df.loc[combined_mask, 'similarity'] *= 3.5 # Highest boost for dessert ingredients in dessert context
|
| 587 |
+
|
| 588 |
+
# MEDIUM PRIORITY: Flavor matches (sweet, spicy, etc.)
|
| 589 |
+
if query_features.get('flavors'):
|
| 590 |
+
for flavor in query_features['flavors']:
|
| 591 |
+
mask = filtered_df['search_text'].str.contains(flavor, na=False)
|
| 592 |
+
multiplier = 2.0 if flavor == 'sweet' else 1.5 # Higher boost for sweet
|
| 593 |
+
filtered_df.loc[mask, 'similarity'] *= multiplier
|
| 594 |
|
| 595 |
+
# LOWER PRIORITY: Cuisine matches
|
| 596 |
+
if query_features.get('cuisines'):
|
| 597 |
for cuisine in query_features['cuisines']:
|
| 598 |
+
mask = (filtered_df['tags_text'].str.contains(cuisine, na=False) |
|
| 599 |
+
filtered_df['name'].str.lower().str.contains(cuisine, na=False))
|
| 600 |
+
filtered_df.loc[mask, 'similarity'] *= 1.4
|
| 601 |
+
|
| 602 |
+
# LOWER PRIORITY: Cooking method matches
|
| 603 |
+
if query_features.get('cooking_methods'):
|
| 604 |
+
for method in query_features['cooking_methods']:
|
| 605 |
+
mask = (filtered_df['name'].str.lower().str.contains(method, na=False) |
|
| 606 |
+
filtered_df['steps_text'].str.contains(method, na=False))
|
| 607 |
filtered_df.loc[mask, 'similarity'] *= 1.3
|
| 608 |
|
| 609 |
+
# Sort by similarity (descending)
|
| 610 |
filtered_df = filtered_df.sort_values('similarity', ascending=False)
|
| 611 |
+
|
| 612 |
+
# Log the top results for debugging
|
| 613 |
+
print(f"π Search results for '{search_query}':")
|
| 614 |
+
for i, (_, recipe) in enumerate(filtered_df.head(3).iterrows()):
|
| 615 |
+
print(f" {i+1}. {recipe['name']} (sim: {recipe['similarity']:.3f})")
|
| 616 |
+
|
| 617 |
else:
|
| 618 |
# Fallback: random selection
|
| 619 |
filtered_df = filtered_df.sample(min(len(filtered_df), top_k*2), random_state=42)
|
|
|
|
| 627 |
global tokenizer, model
|
| 628 |
|
| 629 |
try:
|
| 630 |
+
print("π Loading DialoGPT for Recipe Intelligence...")
|
| 631 |
+
|
| 632 |
+
# Use DialoGPT-small - lightweight and great for conversational understanding
|
| 633 |
+
model_name = "microsoft/DialoGPT-small"
|
| 634 |
|
| 635 |
# Load tokenizer
|
| 636 |
+
print("π Loading DialoGPT tokenizer...")
|
| 637 |
+
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 638 |
if tokenizer.pad_token is None:
|
| 639 |
tokenizer.pad_token = tokenizer.eos_token
|
| 640 |
|
| 641 |
+
# Load model - much lighter than Llama 2
|
| 642 |
+
print("π€ Loading DialoGPT model (optimized for HF Spaces)...")
|
| 643 |
+
model = AutoModelForCausalLM.from_pretrained(
|
| 644 |
+
model_name,
|
| 645 |
+
torch_dtype=torch.float16 if device == "cuda" else torch.float32,
|
| 646 |
+
low_cpu_mem_usage=True
|
| 647 |
+
).to(device)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 648 |
|
| 649 |
model.eval()
|
| 650 |
+
print(f"β
DialoGPT model loaded successfully on {device}!")
|
| 651 |
|
| 652 |
# Load recipe database
|
| 653 |
load_recipes()
|
| 654 |
|
| 655 |
except Exception as e:
|
| 656 |
+
print(f"β Error loading DialoGPT model: {e}")
|
| 657 |
+
print("Falling back to enhanced rule-based processing...")
|
| 658 |
+
# Don't fail completely - we can still work with enhanced rule-based extraction
|
| 659 |
+
tokenizer = None
|
| 660 |
+
model = None
|
|
|
|
|
|
|
|
|
|
|
|
|
| 661 |
load_recipes()
|
| 662 |
|
| 663 |
# Health check endpoint
|
|
|
|
| 697 |
|
| 698 |
print(f"π₯ Recipe request: {request.ingredients}, prefs: {request.preferences}, time: {request.max_minutes}")
|
| 699 |
|
| 700 |
+
# Use LLM for intelligent feature extraction
|
| 701 |
+
query_features = extract_query_features_with_llm(
|
| 702 |
request.ingredients,
|
| 703 |
request.preferences,
|
| 704 |
request.max_minutes
|
requirements.txt
CHANGED
|
@@ -2,11 +2,9 @@ fastapi==0.104.1
|
|
| 2 |
uvicorn[standard]==0.24.0
|
| 3 |
torch>=2.0.0
|
| 4 |
transformers>=4.35.0
|
| 5 |
-
peft>=0.7.0
|
| 6 |
pydantic>=2.0.0
|
| 7 |
python-multipart==0.0.6
|
| 8 |
huggingface_hub>=0.19.0
|
| 9 |
-
accelerate>=0.24.0
|
| 10 |
safetensors>=0.4.0
|
| 11 |
pandas>=2.0.0
|
| 12 |
scikit-learn>=1.3.0
|
|
|
|
| 2 |
uvicorn[standard]==0.24.0
|
| 3 |
torch>=2.0.0
|
| 4 |
transformers>=4.35.0
|
|
|
|
| 5 |
pydantic>=2.0.0
|
| 6 |
python-multipart==0.0.6
|
| 7 |
huggingface_hub>=0.19.0
|
|
|
|
| 8 |
safetensors>=0.4.0
|
| 9 |
pandas>=2.0.0
|
| 10 |
scikit-learn>=1.3.0
|