Spaces:

TheHuriShow
/

RecipeWizard

Runtime error

App Files Files Community

TheHuriShow committed on Aug 8, 2025

Commit

68d4109

verified ·

1 Parent(s): dd88dab

Update app.py

Browse files

Files changed (1) hide show

app.py +107 -112

app.py CHANGED Viewed

@@ -1,136 +1,131 @@
-# app.py
 import gradio as gr
 import faiss
 import numpy as np
-from datasets import load_dataset
-from sentence_transformers import SentenceTransformer, util
 from transformers import pipeline
 import time
-# --- 1. LOAD MODELS AND DATA (GLOBAL SCOPE) ---
-# This section runs only once when the app starts.
-print("Loading dataset and embedding model...")
 start_time = time.time()
-# Load the dataset
 dataset = load_dataset("corbt/all-recipes", split="train[:20000]")
-# Extract title and ingredients for embedding
 def extract_title_and_ingredients(sample):
-    """
-    Extract the title and ingredients of a recipe from a sample.
-    """
     extraction = sample['input'][:sample['input'].find("Directions")]
-    return {
-        "text_for_embedding": extraction
-    }
-dataset = dataset.map(extract_title_and_ingredients)
-# Extract all features
 def extract_each_feature(sample):
-    """
-    Extract each feature of a recipe from a sample.
-    """
-    title = sample['input'][:sample['input'].find("\n")]
-    ingredients = sample['input'][sample['input'].find("Ingredients")+len("Ingredients:\n"):sample['input'].find("Directions")].strip()
-    directions = sample['input'][sample['input'].find("Directions")+len("Directions:\n"):].strip()
-    return {
-        "title": title,
-        "ingredients": ingredients,
-        "directions": directions,
-    }
 dataset = dataset.map(extract_each_feature)
-# Load the embedding model
-embedding_model = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
-# Load the pre-built FAISS index
-try:
-    index = faiss.read_index("recipe_index.faiss")
-except Exception as e:
-    print(f"Could not load FAISS index. Error: {e}. Please ensure 'recipe_index.faiss' is in the same directory.")
-    # Handle error gracefully, maybe by disabling the search feature
-    index = None
-# Load the text generation model
-generator = pipeline('text-generation', model='distilgpt2')
 end_time = time.time()
 print(f"Models and data loaded in {end_time - start_time:.2f} seconds.")
-# --- 2. DEFINE THE CORE LOGIC FUNCTION ---
-def find_and_generate(user_ingredients):
-    """
-    This function takes user ingredients, finds similar recipes,
-    and generates a new one.
-    """
-    if not user_ingredients:
-        return "<p>Please enter some ingredients.</p>", "<p></p>"
-    # --- Recommendation Logic ---
-    if index:
-        query_vector = embedding_model.encode([user_ingredients])
-        # We search for 3 results.
-        distances, indices = index.search(np.array(query_vector, dtype=np.float32), 3)
-        recs_html = "<h2>Top 3 Similar Recipes:</h2>"
-        for i, idx in enumerate(indices[0]):
-            title = dataset[int(idx)].get('title', 'No Title')
-            ingredients_list = dataset[int(idx)].get('ingredients', [])
-            # Use a simple join for cleaner HTML
-            ingredients = ", ".join(ingredients_list)
-            recs_html += f"<h3>{i+1}. {title}</h3>"
-            recs_html += f"<p><b>Ingredients:</b> {ingredients}</p><hr>"
-    else:
-        recs_html = "<h2>Recommendation engine not available.</h2> <p>Could not load the FAISS index file.</p>"
-    # --- Generation Logic ---
-    prompt = f"A creative and delicious recipe that features {user_ingredients}.\n\nRecipe Title:"
-    # Let's limit the new tokens to a reasonable amount to prevent overly long responses
-    generated_outputs = generator(prompt, max_new_tokens=100, num_return_sequences=1)
-    generated_text = generated_outputs[0]['generated_text']
-    # --- FIX: Clean up the generated text ---
-    # We remove the original prompt from the start of the generated text.
-    # This prevents sending unnecessary data and fixes the error.
-    if prompt in generated_text:
-        cleaned_generated_text = generated_text[len(prompt):].strip()
-    else:
-        cleaned_generated_text = generated_text.strip()
-    gen_html = "<h2>AI-Generated Idea:</h2>"
-    # Also, replace newline characters with HTML line breaks for better formatting
-    gen_html += cleaned_generated_text.replace("\n", "<br>")
-    return recs_html, gen_html
-# --- 3. CREATE AND LAUNCH THE GRADIO INTERFACE ---
-examples = [
-    ["chicken, potatoes, carrots, onions"],
-    ["beef, soy sauce, ginger, rice"],
-    ["tomatoes, basil, mozzarella, olive oil"],
-]
-demo = gr.Interface(
-    fn=find_and_generate,
-    inputs=gr.Textbox(lines=3, label="Enter Your Ingredients (comma-separated)"),
-    outputs=[
-        gr.HTML(label="Similar Recipes"),
-        gr.HTML(label="AI Generated Recipe")
-    ],
-    title="🍳 Recipe Genius",
-    description="Your personal AI chef! Enter the ingredients you have, and get 3 real recipe recommendations plus 1 new AI-generated idea.",
-    examples=examples,
-    theme=gr.themes.Soft()
-)
-# Launch the app!
-demo.launch(share=True)

 import gradio as gr
+from datasets import load_dataset
+from sentence_transformers import SentenceTransformer
 import faiss
 import numpy as np
+import os
 from transformers import pipeline
 import time
+# --- 1. DATA LOADING AND PREPROCESSING ---
+print("===== Application Startup =====")
 start_time = time.time()
+# Load dataset
 dataset = load_dataset("corbt/all-recipes", split="train[:20000]")
+# Preprocessing functions
 def extract_title_and_ingredients(sample):
+    """Return the title-and-ingredients part of a recipe as embedding text.
+
+    Everything in ``sample['input']`` before the first "Directions" marker is
+    kept. When the marker is absent the whole text is kept; slicing with the
+    ``-1`` that ``str.find`` returns would silently drop the last character.
+
+    Args:
+        sample: Mapping with an ``'input'`` string holding the raw recipe.
+
+    Returns:
+        A dict with the single key ``"text_for_embedding"``.
+    """
+    extraction, _, _ = sample['input'].partition("Directions")
+    return {"text_for_embedding": extraction}
 def extract_each_feature(sample):
+    """Split a raw recipe string into title, ingredients and directions.
+
+    The text in ``sample['input']`` is read as: a title on the first line, an
+    "Ingredients:" section, then a "Directions:" section. A missing section
+    yields an empty string for that field.
+
+    Args:
+        sample: Mapping with an ``'input'`` string holding the raw recipe.
+
+    Returns:
+        A dict with the keys ``"title"``, ``"ingredients"`` and ``"directions"``.
+    """
+    text = sample['input']
+    # Split on a real newline. The escaped form (backslash followed by "n")
+    # never occurs in the text, so searching for it returned -1 and made the
+    # title nearly the whole recipe.
+    title = text.partition("\n")[0]
+    before_directions, _, after_directions = text.partition("Directions")
+    # partition() leaves the ":" that follows each section name; drop it
+    # together with the surrounding whitespace.
+    ingredients = before_directions.partition("Ingredients")[2].lstrip(":").strip()
+    directions = after_directions.lstrip(":").strip()
+    return {"title": title, "ingredients": ingredients, "directions": directions}
+# Apply preprocessing
+dataset = dataset.map(extract_title_and_ingredients)
 dataset = dataset.map(extract_each_feature)
+# --- 2. EMBEDDING AND RECOMMENDATION ENGINE ---
+model_name = "all-MiniLM-L6-v2"
+embedding_model = SentenceTransformer(f"sentence-transformers/{model_name}")
+# Compute embeddings
+print("Loading dataset and embedding model...")
+embeddings = embedding_model.encode(dataset['text_for_embedding'], show_progress_bar=True)
+embeddings = np.array(embeddings, dtype=np.float32)
+# Build FAISS index
+dimension = embeddings.shape[1]
+index = faiss.IndexFlatL2(dimension)
+index.add(embeddings)
+print(f"Index is ready. Total vectors in index: {index.ntotal}")
+# --- 3. SYNTHETIC GENERATION ---
+generator = pipeline('text-generation', model='gpt2')
+def get_recommendations_and_generate(query_ingredients, k=3):
+    """Find the nearest recipes for a query and generate one new recipe idea.
+
+    Args:
+        query_ingredients: Free-text ingredient list typed by the user.
+        k: Number of neighbours requested from the FAISS index.
+
+    Returns:
+        A 4-tuple ``(rec1, rec2, rec3, generated_recipe)``. Each item is a dict
+        with "title", "ingredients" and "directions" keys. A recommendation
+        slot is ``None`` when fewer than three hits are available, and all four
+        items are ``None`` when the query is empty or whitespace.
+    """
+    if not query_ingredients or not query_ingredients.strip():
+        return None, None, None, None
+    # 1. Get Recommendations
+    query_vector = np.array(embedding_model.encode([query_ingredients]), dtype=np.float32)
+    _, indices = index.search(query_vector, k)
+    results = []
+    for idx_numpy in indices[0]:
+        idx = int(idx_numpy)  # numpy.int64 -> plain int for dataset indexing
+        if idx < 0:
+            # FAISS pads the result with -1 when it has fewer than k vectors.
+            continue
+        row = dataset[idx]
+        results.append({
+            "title": row['title'],
+            "ingredients": row['ingredients'],
+            "directions": row['directions']
+        })
+    # The return value always carries exactly three recommendation slots, so
+    # trim or pad to three instead of indexing blindly (IndexError for k < 3).
+    results = (results + [None] * 3)[:3]
+    # 2. Generate a new recipe idea
+    prompt = f"Create a short, simple recipe title and a list of ingredients using: {query_ingredients}."
+    # max_new_tokens bounds only the continuation; max_length also counts the
+    # prompt tokens, so a long ingredient list left no room to generate.
+    generated_text = generator(prompt, max_new_tokens=100, num_return_sequences=1)[0]['generated_text']
+    # The pipeline echoes the prompt; drop it so it does not end up in the title.
+    if generated_text.startswith(prompt):
+        generated_text = generated_text[len(prompt):]
+    title_part, marker, ingredients_part = generated_text.partition("Ingredients:")
+    generated_recipe = {
+        # Fall back to a placeholder so an empty title does not hide the rest.
+        "title": title_part.strip() or "Untitled recipe idea",
+        "ingredients": ingredients_part.strip() if marker else "Could not determine ingredients.",
+        "directions": "This is an AI-generated idea. Directions are not provided."
+    }
+    return results[0], results[1], results[2], generated_recipe
+# --- 4. GRADIO USER INTERFACE ---
+def format_recipe(recipe):
+    """Render a recipe dict as a Markdown snippet.
+
+    Returns the "No recipe found." heading when ``recipe`` is falsy or its
+    title is empty; otherwise a heading with the title followed by the
+    ingredients and directions sections.
+    """
+    has_title = bool(recipe) and bool(recipe['title'])
+    if not has_title:
+        return "### No recipe found."
+    heading = f"### {recipe['title']}"
+    ingredients_section = f"**Ingredients:**\n{recipe['ingredients']}"
+    directions_section = f"**Directions:**\n{recipe['directions']}"
+    return f"{heading}\n{ingredients_section}\n\n{directions_section}"
+def recipe_wizard(ingredients):
+    """Gradio callback: return four Markdown strings for the output panels.
+
+    Args:
+        ingredients: Text from the ingredient textbox (may be empty or None).
+
+    Returns:
+        A 4-tuple of Markdown strings: three recommended recipes followed by
+        the AI-generated idea. For blank input the first slot carries a prompt
+        to enter ingredients and the remaining slots are empty.
+    """
+    # Skip the embedding model and the generator entirely for a blank textbox.
+    if not ingredients or not ingredients.strip():
+        return "Please enter some ingredients.", "", "", ""
+    recipes = get_recommendations_and_generate(ingredients)
+    return tuple(format_recipe(recipe) for recipe in recipes)
 end_time = time.time()
 print(f"Models and data loaded in {end_time - start_time:.2f} seconds.")
+# Gradio Interface
+with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🍳 RecipeWizard AI")
+    gr.Markdown("Enter the ingredients you have, and get recipe recommendations plus a new AI-generated idea!")
+    with gr.Row():
+        ingredient_input = gr.Textbox(label="Your Ingredients", placeholder="e.g., chicken, rice, tomatoes, garlic")
+        submit_btn = gr.Button("Get Recipes")
+    with gr.Row():
+        with gr.Column():
+            gr.Markdown("### Recommended Recipes")
+            output_rec1 = gr.Markdown()
+            output_rec2 = gr.Markdown()
+            output_rec3 = gr.Markdown()
+        with gr.Column():
+            gr.Markdown("### ✨ AI-Generated Idea")
+            output_gen = gr.Markdown()
+    submit_btn.click(
+        fn=recipe_wizard,
+        inputs=ingredient_input,
+        outputs=[output_rec1, output_rec2, output_rec3, output_gen]
+    )
+    gr.Examples(
+        examples=[
+            ["chicken, broccoli, cheese"],
+            ["ground beef, potatoes, onions"],
+            ["flour, sugar, eggs, butter"]
+        ],
+        inputs=ingredient_input
+    )
+demo.launch()