Spaces:

IPTS-PRODDEV
/

AskNature_BioChat

Build error

App Files Community

Mohamed284 committed on Feb 8, 2025

Commit

ab710db

1 Parent(s): d90d3ca

Update API keys and enhance chatbot functionality with Groq integration

Browse files

Files changed (3) hide show

.env +1 -2
app.py +74 -21
main.ipynb +412 -65

.env CHANGED Viewed

@@ -1,8 +1,7 @@
 # API Configuration
 OPENAI_API_KEY="d1c9ed1ca70b9721dee1087d93f9662a"
 GEMINI_API_KEY="AIzaSyDDWHYpQKQ5glnQn5Q-kMTjliwpNfYBpeY"
-# GCP_PROJECT_ID="1008673779731"
-# GCP_API_KEY="AIzaSyDDWHYpQKQ5glnQn5Q-kMTjliwpNfYBpeY"
 GEMINI_API_KEY_1= "AIzaSyDDWHYpQKQ5glnQn5Q-kMTjliwpNfYBpeY"
 GEMINI_API_KEY_2= "AIzaSyDzQSzM9vA6Le36V65I2meN5URclq4JSx0"

 # API Configuration
 OPENAI_API_KEY="d1c9ed1ca70b9721dee1087d93f9662a"
 GEMINI_API_KEY="AIzaSyDDWHYpQKQ5glnQn5Q-kMTjliwpNfYBpeY"
+GROQ_API_KEY="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"
 GEMINI_API_KEY_1= "AIzaSyDDWHYpQKQ5glnQn5Q-kMTjliwpNfYBpeY"
 GEMINI_API_KEY_2= "AIzaSyDzQSzM9vA6Le36V65I2meN5URclq4JSx0"

app.py CHANGED Viewed

@@ -1,13 +1,16 @@
-# Combined Llama 3 and Gemini Flash Chatbot
 import json
 import logging
 import re
-import os
-import pickle
-from typing import List, Tuple, Optional
 import gradio as gr
 from openai import OpenAI
 import google.generativeai as genai
 from functools import lru_cache
 from tenacity import retry, stop_after_attempt, wait_exponential
 from langchain_community.retrievers import BM25Retriever
@@ -204,30 +207,37 @@ class EnhancedRetriever:
         context = []
         for doc in docs:
             context_str = f"""**Source**: [{doc.metadata['source']}]({doc.metadata['hyperlink']})
-    **Application**: {doc.metadata['application']}
-    **Key Concepts**: {', '.join(doc.metadata['technical_concepts'])}
-    **Strategy Excerpt**:\n{doc.page_content.split('Strategy Excerpt:')[-1].strip()}"""
             context.append(context_str)
         return "\n\n---\n\n".join(context)
 # --- Generation System ---
-SYSTEM_PROMPT = """**Biomimicry Expert Guidelines**
-1. Firstly Base answers strictly on context and if there is not context answer by your own.
-2. Cite sources as [Source] witht the hyperlink
-3. **Bold** technical terms
-4. Include reference links at the end of the response
-Context: {context}"""
 @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=20))
 def get_ai_response(query: str, context: str, model: str) -> str:
     try:
         if model == "gemini-2.0-flash":
             gemini_model = genai.GenerativeModel(model)
             response = gemini_model.generate_content(
                 f"{SYSTEM_PROMPT.format(context=context)}\nQuestion: {query}\nProvide a detailed technical answer:"
             )
-            return _postprocess_response(response.text)
         elif model == "meta-llama-3-70b-instruct":
             response = client.chat.completions.create(
                 model=model,
@@ -238,7 +248,20 @@ def get_ai_response(query: str, context: str, model: str) -> str:
                 temperature=0.4,
                 max_tokens=2000
             )
-            return _postprocess_response(response.choices[0].message.content)
     except Exception as e:
         logger.error(f"Generation Error: {str(e)}")
         return "I'm unable to generate a response right now. Please try again later."
@@ -248,6 +271,36 @@ def _postprocess_response(response: str) -> str:
     response = re.sub(r"\*\*([\w-]+)\*\*", r"**\1**", response)
     return response
 # --- Pipeline ---
 documents = load_and_chunk_data(data_file_name)
 retriever = EnhancedRetriever(documents)
@@ -266,22 +319,22 @@ def chat_interface(question: str, history: List[Tuple[str, str]], model: str):
     return "", history + [(question, response)]
 with gr.Blocks(title="AskNature BioRAG Expert", theme=gr.themes.Soft()) as demo:
-    gr.Markdown("# 🌿 AskNature RAG-based Chatbot ")
     with gr.Row():
         chatbot = gr.Chatbot(label="Dialogue History", height=500)
     with gr.Row():
-        question = gr.Textbox(placeholder="Ask about biomimicry (e.g. 'How does Werewool use coral proteins to make fibers?')",
-                            label="Inquiry", scale=4)
-        model_selector = gr.Dropdown(choices=["gemini-2.0-flash", "meta-llama-3-70b-instruct"], label="Generation Model", value="gemini-2.0-flash")
         clear_btn = gr.Button("Clear History", variant="secondary")
     gr.Markdown("""
         <div style="text-align: center; color: #4a7c59;">
             <small>Powered by AskNature's Database |
             Explore nature's blueprints at <a href="https://asknature.org">asknature.org</a></small>
         </div>""")
     question.submit(chat_interface, [question, chatbot, model_selector], [question, chatbot])
     clear_btn.click(lambda: [], None, chatbot)
 if __name__ == "__main__":
-    demo.launch(show_error=True)

+# Combined chatbot: Gemini Flash, Meta Llama 3 (GWDG), and Llama 3 (Groq)
+# Gemini Flash rate limit: 15 requests per minute
+# Groq rate limits: 30 requests/min (RPM), 14,400 requests/day (RPD), 6K tokens/min (TPM), 500K tokens/day (TPD)
+import os
 import json
 import logging
 import re
+from typing import List, Tuple
 import gradio as gr
 from openai import OpenAI
 import google.generativeai as genai
+import requests
 from functools import lru_cache
 from tenacity import retry, stop_after_attempt, wait_exponential
 from langchain_community.retrievers import BM25Retriever
         context = []
         for doc in docs:
             context_str = f"""**Source**: [{doc.metadata['source']}]({doc.metadata['hyperlink']})
+**Application**: {doc.metadata['application']}
+**Key Concepts**: {', '.join(doc.metadata['technical_concepts'])}
+**Strategy Excerpt**:
+{doc.page_content.split('Strategy Excerpt:')[-1].strip()}"""
             context.append(context_str)
         return "\n\n---\n\n".join(context)
 # --- Generation System ---
+SYSTEM_PROMPT = """
+**Biomimicry Expert Guidelines**
+- Use only the provided AskNature context (e.g., Source, Application, Strategy, technical_concepts). If no context is given, note that you're using your own expertise.
+- When referencing facts, use numeric citations in square brackets (e.g., [1]). Do not include full URLs inline.
+- Bold all technical terms (e.g., **protein-based pigmentation**, **DNA-level fiber design**).
+- Provide a concise, expert answer that explains the innovation and its sustainability benefits.
+- End your response with a "References" section listing each URL with its citation number.
+Context: {context}
+"""
 @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=20))
 def get_ai_response(query: str, context: str, model: str) -> str:
+    result = ""  # Initialize the result variable
     try:
         if model == "gemini-2.0-flash":
             gemini_model = genai.GenerativeModel(model)
             response = gemini_model.generate_content(
                 f"{SYSTEM_PROMPT.format(context=context)}\nQuestion: {query}\nProvide a detailed technical answer:"
             )
+            logger.info(f"Response from gemini-2.0-flash: {response.text}")
+            result = _postprocess_response(response.text)
         elif model == "meta-llama-3-70b-instruct":
             response = client.chat.completions.create(
                 model=model,
                 temperature=0.4,
                 max_tokens=2000
             )
+            logger.info(f"Response from meta-llama-3-70b-instruct: {response}")
+            try:
+                result = response.choices[0].message.content
+            except Exception as e:
+                logger.error(f"Error processing meta-llama-3-70b-instruct response: {str(e)}")
+                result = "Failed to process response from meta-llama-3-70b-instruct"
+        elif model == "llama3-70b-8192":
+            result = get_groq_llama3_response(query)
+            logger.info(f"Response from llama3-70b-8192: {result}")
+            if result is None:
+                result = "Failed to get response from llama3-70b-8192"
+        # Append the model name to the response for clarity
+        result += f"\n\n**Model:** {model}"
+        return result
     except Exception as e:
         logger.error(f"Generation Error: {str(e)}")
         return "I'm unable to generate a response right now. Please try again later."
     response = re.sub(r"\*\*([\w-]+)\*\*", r"**\1**", response)
     return response
+def get_groq_llama3_response(query: str) -> str:
+    """Get response from Llama 3 on Groq Cloud."""
+    api_key = os.getenv("GROQ_API_KEY")
+    url = "https://api.groq.com/openai/v1/chat/completions"
+    headers = {
+        "Content-Type": "application/json",
+        "Authorization": f"Bearer {api_key}"
+    }
+    payload = {
+        "model": "llama3-70b-8192",
+        "messages": [
+            {
+                "role": "user",
+                "content": query
+            }
+        ]
+    }
+    try:
+        response = requests.post(url, headers=headers, json=payload)
+        response.raise_for_status()
+        result = response.json()
+        logger.info(f"Groq API Response: {result}")
+        return result["choices"][0]["message"]["content"]
+    except requests.exceptions.RequestException as e:
+        logger.error(f"Groq API Error: {str(e)}")
+        return "An error occurred while contacting Groq's Llama 3 model."
 # --- Pipeline ---
 documents = load_and_chunk_data(data_file_name)
 retriever = EnhancedRetriever(documents)
     return "", history + [(question, response)]
 with gr.Blocks(title="AskNature BioRAG Expert", theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🌿 AskNature RAG-based Chatbot")
     with gr.Row():
         chatbot = gr.Chatbot(label="Dialogue History", height=500)
     with gr.Row():
+        question = gr.Textbox(placeholder="Ask about biomimicry (e.g. 'How does Werewool use coral proteins to make fibers?')", label="Inquiry", scale=4)
+        model_selector = gr.Dropdown(choices=["gemini-2.0-flash", "meta-llama-3-70b-instruct(GWDG)", "llama3-70b-8192(Groq)"], label="Generation Model", value="gemini-2.0-flash")
         clear_btn = gr.Button("Clear History", variant="secondary")
     gr.Markdown("""
         <div style="text-align: center; color: #4a7c59;">
             <small>Powered by AskNature's Database |
             Explore nature's blueprints at <a href="https://asknature.org">asknature.org</a></small>
         </div>""")
     question.submit(chat_interface, [question, chatbot, model_selector], [question, chatbot])
     clear_btn.click(lambda: [], None, chatbot)
 if __name__ == "__main__":
+    demo.launch(show_error=True)

main.ipynb CHANGED Viewed

@@ -873,6 +873,315 @@
    "outputs": [],
    "source": []
   },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -885,8 +1194,6 @@
       "INFO:__main__:Loading cached documents\n",
       "INFO:__main__:Loading cached BM25 index\n",
       "INFO:__main__:Loading cached FAISS index\n",
-      "INFO:faiss.loader:Loading faiss with AVX2 support.\n",
-      "INFO:faiss.loader:Successfully loaded faiss with AVX2 support.\n",
       "c:\\Users\\Mohamed Elsafty\\.conda\\envs\\rag\\Lib\\site-packages\\gradio\\components\\chatbot.py:273: UserWarning: You have not specified a value for the `type` parameter. Defaulting to the 'tuples' format for chatbot messages, but this is deprecated and will be removed in a future version of Gradio. Please set type='messages' instead, which uses openai-style dictionaries with 'role' and 'content' keys.\n",
       "  warnings.warn(\n"
      ]
@@ -895,16 +1202,15 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "* Running on local URL:  http://127.0.0.1:7860\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "INFO:httpx:HTTP Request: GET https://api.gradio.app/pkg-version \"HTTP/1.1 200 OK\"\n",
-      "INFO:httpx:HTTP Request: GET http://127.0.0.1:7860/gradio_api/startup-events \"HTTP/1.1 200 OK\"\n",
-      "INFO:httpx:HTTP Request: HEAD http://127.0.0.1:7860/ \"HTTP/1.1 200 OK\"\n"
      ]
     },
     {
@@ -918,7 +1224,7 @@
     {
      "data": {
       "text/html": [
-       "<div><iframe src=\"http://127.0.0.1:7860/\" width=\"100%\" height=\"500\" allow=\"autoplay; camera; microphone; clipboard-read; clipboard-write;\" frameborder=\"0\" allowfullscreen></iframe></div>"
       ],
       "text/plain": [
        "<IPython.core.display.HTML object>"
@@ -931,24 +1237,50 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
       "INFO:httpx:HTTP Request: POST https://chat-ai.academiccloud.de/v1/chat/completions \"HTTP/1.1 200 OK\"\n",
       "Embedding Progress:   0%|          | 0/1 [00:00<?, ?it/s]INFO:httpx:HTTP Request: POST https://chat-ai.academiccloud.de/v1/embeddings \"HTTP/1.1 200 OK\"\n",
-      "Embedding Progress: 100%|██████████| 1/1 [00:00<00:00,  4.64it/s]\n",
-      "INFO:httpx:HTTP Request: POST https://chat-ai.academiccloud.de/v1/chat/completions \"HTTP/1.1 200 OK\"\n"
      ]
     }
    ],
    "source": [
-    "# Combined Llama 3 and Gemini Flash Chatbot\n",
     "import json\n",
     "import logging\n",
     "import re\n",
-    "import os\n",
-    "import pickle\n",
-    "from typing import List, Tuple, Optional\n",
     "import gradio as gr\n",
     "from openai import OpenAI\n",
     "import google.generativeai as genai\n",
     "from functools import lru_cache\n",
     "from tenacity import retry, stop_after_attempt, wait_exponential\n",
     "from langchain_community.retrievers import BM25Retriever\n",
@@ -1145,30 +1477,37 @@
     "        context = []\n",
     "        for doc in docs:\n",
     "            context_str = f\"\"\"**Source**: [{doc.metadata['source']}]({doc.metadata['hyperlink']})\n",
-    "    **Application**: {doc.metadata['application']}\n",
-    "    **Key Concepts**: {', '.join(doc.metadata['technical_concepts'])}\n",
-    "    **Strategy Excerpt**:\\n{doc.page_content.split('Strategy Excerpt:')[-1].strip()}\"\"\"\n",
     "            context.append(context_str)\n",
     "        return \"\\n\\n---\\n\\n\".join(context)\n",
     "\n",
     "# --- Generation System ---\n",
-    "SYSTEM_PROMPT = \"\"\"**Biomimicry Expert Guidelines**\n",
-    "1. Base answers strictly on context\n",
-    "2. Cite sources as [Source]\n",
-    "3. **Bold** technical terms\n",
-    "4. Include reference links\n",
     "\n",
-    "Context: {context}\"\"\"\n",
     "\n",
     "@retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=20))\n",
     "def get_ai_response(query: str, context: str, model: str) -> str:\n",
     "    try:\n",
     "        if model == \"gemini-2.0-flash\":\n",
     "            gemini_model = genai.GenerativeModel(model)\n",
     "            response = gemini_model.generate_content(\n",
     "                f\"{SYSTEM_PROMPT.format(context=context)}\\nQuestion: {query}\\nProvide a detailed technical answer:\"\n",
     "            )\n",
-    "            return _postprocess_response(response.text)\n",
     "        elif model == \"meta-llama-3-70b-instruct\":\n",
     "            response = client.chat.completions.create(\n",
     "                model=model,\n",
@@ -1179,7 +1518,20 @@
     "                temperature=0.4,\n",
     "                max_tokens=2000\n",
     "            )\n",
-    "            return _postprocess_response(response.choices[0].message.content)\n",
     "    except Exception as e:\n",
     "        logger.error(f\"Generation Error: {str(e)}\")\n",
     "        return \"I'm unable to generate a response right now. Please try again later.\"\n",
@@ -1189,6 +1541,36 @@
     "    response = re.sub(r\"\\*\\*([\\w-]+)\\*\\*\", r\"**\\1**\", response)\n",
     "    return response\n",
     "\n",
     "# --- Pipeline ---\n",
     "documents = load_and_chunk_data(data_file_name)\n",
     "retriever = EnhancedRetriever(documents)\n",
@@ -1207,62 +1589,27 @@
     "    return \"\", history + [(question, response)]\n",
     "\n",
     "with gr.Blocks(title=\"AskNature BioRAG Expert\", theme=gr.themes.Soft()) as demo:\n",
-    "    gr.Markdown(\"# 🌿 AskNature RAG-based Chatbot \")\n",
     "    with gr.Row():\n",
     "        chatbot = gr.Chatbot(label=\"Dialogue History\", height=500)\n",
     "    with gr.Row():\n",
-    "        question = gr.Textbox(placeholder=\"Ask about biomimicry (e.g. 'How does Werewool use coral proteins to make fibers?')\",\n",
-    "                            label=\"Inquiry\", scale=4)\n",
-    "        model_selector = gr.Dropdown(choices=[\"gemini-2.0-flash\", \"meta-llama-3-70b-instruct\"], label=\"Generation Model\", value=\"gemini-2.0-flash\")\n",
     "        clear_btn = gr.Button(\"Clear History\", variant=\"secondary\")\n",
-    "    \n",
     "    gr.Markdown(\"\"\"\n",
     "        <div style=\"text-align: center; color: #4a7c59;\">\n",
     "            <small>Powered by AskNature's Database | \n",
     "            Explore nature's blueprints at <a href=\"https://asknature.org\">asknature.org</a></small>\n",
     "        </div>\"\"\")\n",
     "    question.submit(chat_interface, [question, chatbot, model_selector], [question, chatbot])\n",
     "    clear_btn.click(lambda: [], None, chatbot)\n",
     "\n",
     "if __name__ == \"__main__\":\n",
-    "    demo.launch(show_error=True)"
    ]
   },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
   {
    "cell_type": "code",
    "execution_count": null,

    "outputs": [],
    "source": []
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Combined Llama 3 and Gemini Flash Chatbot\n",
+    "import json\n",
+    "import logging\n",
+    "import re\n",
+    "import os\n",
+    "import pickle\n",
+    "from typing import List, Tuple, Optional\n",
+    "import gradio as gr\n",
+    "from openai import OpenAI\n",
+    "import google.generativeai as genai\n",
+    "from functools import lru_cache\n",
+    "from tenacity import retry, stop_after_attempt, wait_exponential\n",
+    "from langchain_community.retrievers import BM25Retriever\n",
+    "from langchain_community.vectorstores import FAISS\n",
+    "from langchain_core.embeddings import Embeddings\n",
+    "from langchain_core.documents import Document\n",
+    "from collections import defaultdict\n",
+    "import hashlib\n",
+    "from tqdm import tqdm\n",
+    "from dotenv import load_dotenv\n",
+    "\n",
+    "load_dotenv()\n",
+    "\n",
+    "# --- Configuration ---\n",
+    "FAISS_INDEX_PATH = \"faiss_index\"\n",
+    "BM25_INDEX_PATH = \"bm25_index.pkl\"\n",
+    "CACHE_VERSION = \"v1\"\n",
+    "embedding_model = \"e5-mistral-7b-instruct\"\n",
+    "data_file_name = \"AskNatureNet_data_enhanced.json\"\n",
+    "CHUNK_SIZE = 800\n",
+    "OVERLAP = 200\n",
+    "EMBEDDING_BATCH_SIZE = 32\n",
+    "\n",
+    "# Initialize clients\n",
+    "OPENAI_API_CONFIG = {\n",
+    "    \"api_key\": os.getenv(\"OPENAI_API_KEY\"),\n",
+    "    \"base_url\": \"https://chat-ai.academiccloud.de/v1\"\n",
+    "}\n",
+    "client = OpenAI(**OPENAI_API_CONFIG)\n",
+    "genai.configure(api_key=os.getenv(\"GEMINI_API_KEY\"))\n",
+    "\n",
+    "logging.basicConfig(level=logging.INFO)\n",
+    "logger = logging.getLogger(__name__)\n",
+    "\n",
+    "# --- Helper Functions ---\n",
+    "def get_data_hash(file_path: str) -> str:\n",
+    "    \"\"\"Generate hash of data file for cache validation\"\"\"\n",
+    "    with open(file_path, \"rb\") as f:\n",
+    "        return hashlib.md5(f.read()).hexdigest()\n",
+    "\n",
+    "# --- Custom Embedding Handler ---\n",
+    "class MistralEmbeddings(Embeddings):\n",
+    "    \"\"\"E5-Mistral-7B embedding adapter\"\"\"\n",
+    "    def embed_documents(self, texts: List[str]) -> List[List[float]]:\n",
+    "        embeddings = []\n",
+    "        try:\n",
+    "            for i in tqdm(range(0, len(texts), EMBEDDING_BATCH_SIZE), desc=\"Embedding Progress\"):\n",
+    "                batch = texts[i:i + EMBEDDING_BATCH_SIZE]\n",
+    "                response = client.embeddings.create(\n",
+    "                    input=batch,\n",
+    "                    model=embedding_model,\n",
+    "                    encoding_format=\"float\"\n",
+    "                )\n",
+    "                embeddings.extend([e.embedding for e in response.data])\n",
+    "            return embeddings\n",
+    "        except Exception as e:\n",
+    "            logger.error(f\"Embedding Error: {str(e)}\")\n",
+    "            return [[] for _ in texts]\n",
+    "        \n",
+    "    def embed_query(self, text: str) -> List[float]:\n",
+    "        return self.embed_documents([text])[0]\n",
+    "\n",
+    "# --- Data Processing ---\n",
+    "def load_and_chunk_data(file_path: str) -> List[Document]:\n",
+    "    \"\"\"Enhanced chunking with metadata preservation\"\"\"\n",
+    "    current_hash = get_data_hash(file_path)\n",
+    "    cache_file = f\"documents_{CACHE_VERSION}_{current_hash}.pkl\"\n",
+    "    \n",
+    "    if os.path.exists(cache_file):\n",
+    "        logger.info(\"Loading cached documents\")\n",
+    "        with open(cache_file, \"rb\") as f:\n",
+    "            return pickle.load(f)\n",
+    "    \n",
+    "    with open(file_path, 'r', encoding='utf-8') as f:\n",
+    "        data = json.load(f)\n",
+    "    \n",
+    "    documents = []\n",
+    "    for item in tqdm(data, desc=\"Chunking Progress\"):\n",
+    "        base_content = f\"\"\"Source: {item['Source']}\n",
+    "Application: {item['Application']}\n",
+    "Functions: {', '.join(filter(None, [item.get('Function1'), item.get('Function2')]))}\n",
+    "Technical Concepts: {', '.join(item['technical_concepts'])}\n",
+    "Biological Mechanisms: {', '.join(item['biological_mechanisms'])}\"\"\"\n",
+    "        \n",
+    "        strategy = item['Strategy']\n",
+    "        for i in range(0, len(strategy), CHUNK_SIZE - OVERLAP):\n",
+    "            chunk = strategy[i:i + CHUNK_SIZE]\n",
+    "            documents.append(Document(\n",
+    "                page_content=f\"{base_content}\\nStrategy Excerpt:\\n{chunk}\",\n",
+    "                metadata={\n",
+    "                    \"source\": item[\"Source\"],\n",
+    "                    \"application\": item[\"Application\"],\n",
+    "                    \"technical_concepts\": item[\"technical_concepts\"],\n",
+    "                    \"sustainability_impacts\": item[\"sustainability_impacts\"],\n",
+    "                    \"hyperlink\": item[\"Hyperlink\"],\n",
+    "                    \"chunk_id\": f\"{item['Source']}-{len(documents)+1}\"\n",
+    "                }\n",
+    "            ))\n",
+    "    \n",
+    "    with open(cache_file, \"wb\") as f:\n",
+    "        pickle.dump(documents, f)\n",
+    "    return documents\n",
+    "\n",
+    "# --- Optimized Retrieval System ---\n",
+    "class EnhancedRetriever:\n",
+    "    \"\"\"Hybrid retriever with persistent caching\"\"\"\n",
+    "    def __init__(self, documents: List[Document]):\n",
+    "        self.documents = documents\n",
+    "        self.bm25 = self._init_bm25()\n",
+    "        self.vector_store = self._init_faiss()\n",
+    "        self.vector_retriever = self.vector_store.as_retriever(search_kwargs={\"k\": 3})\n",
+    "\n",
+    "    def _init_bm25(self) -> BM25Retriever:\n",
+    "        cache_key = f\"{BM25_INDEX_PATH}_{get_data_hash(data_file_name)}\"\n",
+    "        if os.path.exists(cache_key):\n",
+    "            logger.info(\"Loading cached BM25 index\")\n",
+    "            with open(cache_key, \"rb\") as f:\n",
+    "                return pickle.load(f)\n",
+    "        \n",
+    "        logger.info(\"Building new BM25 index\")\n",
+    "        retriever = BM25Retriever.from_documents(self.documents)\n",
+    "        retriever.k = 5\n",
+    "        with open(cache_key, \"wb\") as f:\n",
+    "            pickle.dump(retriever, f)\n",
+    "        return retriever\n",
+    "\n",
+    "    def _init_faiss(self) -> FAISS:\n",
+    "        cache_key = f\"{FAISS_INDEX_PATH}_{get_data_hash(data_file_name)}\"\n",
+    "        if os.path.exists(cache_key):\n",
+    "            logger.info(\"Loading cached FAISS index\")\n",
+    "            return FAISS.load_local(\n",
+    "                cache_key,\n",
+    "                MistralEmbeddings(),\n",
+    "                allow_dangerous_deserialization=True\n",
+    "            )\n",
+    "        \n",
+    "        logger.info(\"Building new FAISS index\")\n",
+    "        vector_store = FAISS.from_documents(self.documents, MistralEmbeddings())\n",
+    "        vector_store.save_local(cache_key)\n",
+    "        return vector_store\n",
+    "\n",
+    "    @lru_cache(maxsize=500)\n",
+    "    def retrieve(self, query: str) -> str:\n",
+    "        try:\n",
+    "            processed_query = self._preprocess_query(query)\n",
+    "            expanded_query = self._hyde_expansion(processed_query)\n",
+    "            \n",
+    "            bm25_results = self.bm25.invoke(processed_query)\n",
+    "            vector_results = self.vector_retriever.invoke(processed_query)\n",
+    "            expanded_results = self.bm25.invoke(expanded_query)\n",
+    "            \n",
+    "            fused_results = self._fuse_results([bm25_results, vector_results, expanded_results])\n",
+    "            return self._format_context(fused_results[:5])\n",
+    "        except Exception as e:\n",
+    "            logger.error(f\"Retrieval Error: {str(e)}\")\n",
+    "            return \"\"\n",
+    "\n",
+    "    def _preprocess_query(self, query: str) -> str:\n",
+    "        return query.lower().strip()\n",
+    "\n",
+    "    @lru_cache(maxsize=500)\n",
+    "    def _hyde_expansion(self, query: str) -> str:\n",
+    "        try:\n",
+    "            response = client.chat.completions.create(\n",
+    "                model=\"meta-llama-3-70b-instruct\",\n",
+    "                messages=[{\n",
+    "                    \"role\": \"user\",\n",
+    "                    \"content\": f\"Generate a technical draft about biomimicry for: {query}\\nInclude domain-specific terms.\"\n",
+    "                }],\n",
+    "                temperature=0.5,\n",
+    "                max_tokens=200\n",
+    "            )\n",
+    "            return response.choices[0].message.content\n",
+    "        except Exception as e:\n",
+    "            logger.error(f\"HyDE Error: {str(e)}\")\n",
+    "            return query\n",
+    "\n",
+    "    def _fuse_results(self, result_sets: List[List[Document]]) -> List[Document]:\n",
+    "        fused_scores = defaultdict(float)\n",
+    "        for docs in result_sets:\n",
+    "            for rank, doc in enumerate(docs, 1):\n",
+    "                fused_scores[doc.metadata[\"chunk_id\"]] += 1 / (rank + 60)\n",
+    "        \n",
+    "        seen = set()\n",
+    "        return [\n",
+    "            doc for doc in sorted(\n",
+    "                (doc for docs in result_sets for doc in docs),\n",
+    "                key=lambda x: fused_scores[x.metadata[\"chunk_id\"]],\n",
+    "                reverse=True\n",
+    "            ) if not (doc.metadata[\"chunk_id\"] in seen or seen.add(doc.metadata[\"chunk_id\"]))\n",
+    "        ]\n",
+    "\n",
+    "    def _format_context(self, docs: List[Document]) -> str:\n",
+    "        context = []\n",
+    "        for doc in docs:\n",
+    "            context_str = f\"\"\"**Source**: [{doc.metadata['source']}]({doc.metadata['hyperlink']})\n",
+    "    **Application**: {doc.metadata['application']}\n",
+    "    **Key Concepts**: {', '.join(doc.metadata['technical_concepts'])}\n",
+    "    **Strategy Excerpt**:\\n{doc.page_content.split('Strategy Excerpt:')[-1].strip()}\"\"\"\n",
+    "            context.append(context_str)\n",
+    "        return \"\\n\\n---\\n\\n\".join(context)\n",
+    "\n",
+    "# --- Generation System ---\n",
+    "SYSTEM_PROMPT = \"\"\"**Biomimicry Expert Guidelines**\n",
+    "1. Firstly Base answers strictly on context and if there is not context answer by your own.\n",
+    "2. Cite sources as [Source] witht the hyperlink\n",
+    "3. **Bold** technical terms\n",
+    "4. Include reference links at the end of the response\n",
+    "\n",
+    "Context: {context}\"\"\"\n",
+    "\n",
+    "@retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=20))\n",
+    "def get_ai_response(query: str, context: str, model: str) -> str:\n",
+    "    try:\n",
+    "        if model == \"gemini-2.0-flash\":\n",
+    "            gemini_model = genai.GenerativeModel(model)\n",
+    "            response = gemini_model.generate_content(\n",
+    "                f\"{SYSTEM_PROMPT.format(context=context)}\\nQuestion: {query}\\nProvide a detailed technical answer:\"\n",
+    "            )\n",
+    "            return _postprocess_response(response.text)\n",
+    "        elif model == \"meta-llama-3-70b-instruct\":\n",
+    "            response = client.chat.completions.create(\n",
+    "                model=model,\n",
+    "                messages=[\n",
+    "                    {\"role\": \"system\", \"content\": SYSTEM_PROMPT.format(context=context)},\n",
+    "                    {\"role\": \"user\", \"content\": f\"Question: {query}\\nProvide a detailed technical answer:\"}\n",
+    "                ],\n",
+    "                temperature=0.4,\n",
+    "                max_tokens=2000\n",
+    "            )\n",
+    "            return _postprocess_response(response.choices[0].message.content)\n",
+    "    except Exception as e:\n",
+    "        logger.error(f\"Generation Error: {str(e)}\")\n",
+    "        return \"I'm unable to generate a response right now. Please try again later.\"\n",
+    "\n",
+    "def _postprocess_response(response: str) -> str:\n",
+    "    response = re.sub(r\"\\[(.*?)\\]\", r\"[\\1](#)\", response)\n",
+    "    response = re.sub(r\"\\*\\*([\\w-]+)\\*\\*\", r\"**\\1**\", response)\n",
+    "    return response\n",
+    "\n",
+    "# --- Pipeline ---\n",
+    "documents = load_and_chunk_data(data_file_name)\n",
+    "retriever = EnhancedRetriever(documents)\n",
+    "\n",
+    "def generate_response(question: str, model: str) -> str:\n",
+    "    try:\n",
+    "        context = retriever.retrieve(question)\n",
+    "        return get_ai_response(question, context, model) if context else \"No relevant information found.\"\n",
+    "    except Exception as e:\n",
+    "        logger.error(f\"Pipeline Error: {str(e)}\")\n",
+    "        return \"An error occurred processing your request.\"\n",
+    "\n",
+    "# --- Gradio Interface ---\n",
+    "def chat_interface(question: str, history: List[Tuple[str, str]], model: str):\n",
+    "    response = generate_response(question, model)\n",
+    "    return \"\", history + [(question, response)]\n",
+    "\n",
+    "with gr.Blocks(title=\"AskNature BioRAG Expert\", theme=gr.themes.Soft()) as demo:\n",
+    "    gr.Markdown(\"# 🌿 AskNature RAG-based Chatbot \")\n",
+    "    with gr.Row():\n",
+    "        chatbot = gr.Chatbot(label=\"Dialogue History\", height=500)\n",
+    "    with gr.Row():\n",
+    "        question = gr.Textbox(placeholder=\"Ask about biomimicry (e.g. 'How does Werewool use coral proteins to make fibers?')\",\n",
+    "                            label=\"Inquiry\", scale=4)\n",
+    "        model_selector = gr.Dropdown(choices=[\"gemini-2.0-flash\", \"meta-llama-3-70b-instruct\"], label=\"Generation Model\", value=\"gemini-2.0-flash\")\n",
+    "        clear_btn = gr.Button(\"Clear History\", variant=\"secondary\")\n",
+    "    \n",
+    "    gr.Markdown(\"\"\"\n",
+    "        <div style=\"text-align: center; color: #4a7c59;\">\n",
+    "            <small>Powered by AskNature's Database | \n",
+    "            Explore nature's blueprints at <a href=\"https://asknature.org\">asknature.org</a></small>\n",
+    "        </div>\"\"\")\n",
+    "    question.submit(chat_interface, [question, chatbot, model_selector], [question, chatbot])\n",
+    "    clear_btn.click(lambda: [], None, chatbot)\n",
+    "\n",
+    "if __name__ == \"__main__\":\n",
+    "    demo.launch(show_error=True)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
   {
    "cell_type": "code",
    "execution_count": null,
       "INFO:__main__:Loading cached documents\n",
       "INFO:__main__:Loading cached BM25 index\n",
       "INFO:__main__:Loading cached FAISS index\n",
       "c:\\Users\\Mohamed Elsafty\\.conda\\envs\\rag\\Lib\\site-packages\\gradio\\components\\chatbot.py:273: UserWarning: You have not specified a value for the `type` parameter. Defaulting to the 'tuples' format for chatbot messages, but this is deprecated and will be removed in a future version of Gradio. Please set type='messages' instead, which uses openai-style dictionaries with 'role' and 'content' keys.\n",
       "  warnings.warn(\n"
      ]
      "name": "stdout",
      "output_type": "stream",
      "text": [
+      "* Running on local URL:  http://127.0.0.1:7861\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
+      "INFO:httpx:HTTP Request: GET http://127.0.0.1:7861/gradio_api/startup-events \"HTTP/1.1 200 OK\"\n",
+      "INFO:httpx:HTTP Request: HEAD http://127.0.0.1:7861/ \"HTTP/1.1 200 OK\"\n"
      ]
     },
     {
     {
      "data": {
       "text/html": [
+       "<div><iframe src=\"http://127.0.0.1:7861/\" width=\"100%\" height=\"500\" allow=\"autoplay; camera; microphone; clipboard-read; clipboard-write;\" frameborder=\"0\" allowfullscreen></iframe></div>"
       ],
       "text/plain": [
        "<IPython.core.display.HTML object>"
      "name": "stderr",
      "output_type": "stream",
      "text": [
+      "INFO:httpx:HTTP Request: GET https://api.gradio.app/pkg-version \"HTTP/1.1 200 OK\"\n",
       "INFO:httpx:HTTP Request: POST https://chat-ai.academiccloud.de/v1/chat/completions \"HTTP/1.1 200 OK\"\n",
       "Embedding Progress:   0%|          | 0/1 [00:00<?, ?it/s]INFO:httpx:HTTP Request: POST https://chat-ai.academiccloud.de/v1/embeddings \"HTTP/1.1 200 OK\"\n",
+      "Embedding Progress: 100%|██████████| 1/1 [00:00<00:00,  6.02it/s]\n",
+      "INFO:__main__:Response from gemini-2.0-flash: Inspired by the **protein-based pigmentation** found in *Discosoma* coral, Werewool is developing biodegradable fibers for the textile industry [1]. This innovation utilizes **DNA-level fiber design** and **biotechnology** to create sustainable textiles with inherent color and other properties, eliminating the need for toxic dyes and petroleum-based synthetics [1]. The *Discosoma* coral's **red fluorescent protein (RFP)** serves as a model for creating color within the fiber itself [1].\n",
+      "\n",
+      "Furthermore, corals utilize **coral acid-rich proteins (CARP)** to build their rock-hard reefs [2]. These proteins interact with minerals like calcium carbonate, shaping them into **aragonite** crystals [2]. The corals then combine these crystals with other organic molecules, acting as cement to form the strong coral skeletons [2]. This **protein-mineral interaction**, along with the **molecular scaffolding** provided by proteins such as **collagen-based structure**, inspires the creation of durable materials [2].\n",
+      "\n",
+      "These approaches reduce the textile industry's reliance on harmful chemicals and unsustainable materials [1]. The global textile market produces 1.2 billion tons of CO2 equivalent per year and uses dyes that are responsible for 20% of global wastewater. The industry also depends on petroleum based synthetic fibers that account for 35% of global microplastic pollution [1].\n",
+      "\n",
+      "References:\n",
+      "[1] https://asknature.org/innovation/colorful-fibers-inspired-by-proteins-found-in-discosoma-coral/\n",
+      "[2] https://asknature.org/strategy/how-proteins-help-corals-build-rock-hard-reefs/\n",
+      "\n",
+      "INFO:httpx:HTTP Request: POST https://chat-ai.academiccloud.de/v1/chat/completions \"HTTP/1.1 200 OK\"\n",
+      "INFO:__main__:Response from meta-llama-3-70b-instruct: ChatCompletion(id='chat-2b0d6684e9744a0ba5c48bad6bcdd4d7', choices=[Choice(finish_reason='stop', index=0, logprobs=None, message=ChatCompletionMessage(content=\"**Coral Proteins: A Sustainable Solution for Eco-Friendly Fabrics**\\n\\nThe Discosoma coral's protein, specifically the red fluorescent protein (RFP), has inspired a revolutionary approach to creating eco-friendly fabrics without the need for toxic dyes. This innovation leverages the principles of **protein-based pigmentation** and **DNA-level fiber design** to produce biodegradable fibers with inherent color properties.\\n\\n**The Science Behind Coral Proteins**\\n\\nThe RFP found in Discosoma coral is a naturally occurring protein that provides the coral with its vibrant color. This protein is capable of absorbing light and emitting it at a longer wavelength, resulting in a red fluorescent color. By harnessing the properties of this protein, researchers can create fibers that exhibit similar color characteristics without the need for synthetic dyes.\\n\\n**How Coral Proteins Are Used in Fabric Production**\\n\\nTo create eco-friendly fabrics, researchers use biotechnology to design fibers at the DNA level. This involves identifying the protein structures found in nature, such as the RFP, and incorporating them into the fiber production process. The resulting fibers are reliant on these proteins for their color properties, eliminating the need for toxic dyes and finishes.\\n\\n**The Benefits of Coral Protein-Based Fabrics**\\n\\nThe use of coral proteins in fabric production offers several sustainability benefits, including:\\n\\n1. **Reduced environmental impact**: By eliminating the need for synthetic dyes and finishes, coral protein-based fabrics reduce the amount of toxic chemicals released into the environment.\\n2. 
**Biodegradable**: The fibers produced using coral proteins are biodegradable, reducing the amount of microplastic pollution in the environment.\\n3. **Sustainable production**: The use of biotechnology and natural proteins reduces the reliance on non-renewable resources and minimizes the carbon footprint of fabric production.\\n\\n**Conclusion**\\n\\nThe use of coral proteins in fabric production represents a significant step towards creating eco-friendly and sustainable textiles. By harnessing the power of nature and leveraging the principles of protein-based pigmentation and DNA-level fiber design, researchers can create biodegradable fibers with inherent color properties, reducing the environmental impact of the textile industry.\\n\\nReferences:\\n[1] https://asknature.org/innovation/colorful-fibers-inspired-by-proteins-found-in-discosoma-coral/\", refusal=None, role='assistant', audio=None, function_call=None, tool_calls=[]), stop_reason=None)], created=1739018886, model='meta-llama-3.1-70b-instruct', object='chat.completion', service_tier=None, system_fingerprint=None, usage=CompletionUsage(completion_tokens=459, prompt_tokens=1341, total_tokens=1800, completion_tokens_details=None, prompt_tokens_details=None), prompt_logprobs=None)\n",
+      "INFO:__main__:Groq API Response: {'id': 'chatcmpl-55dc0b3b-1528-416e-bd30-93b4a851484e', 'object': 'chat.completion', 'created': 1739018907, 'model': 'llama3-70b-8192', 'choices': [{'index': 0, 'message': {'role': 'assistant', 'content': \"Coral proteins are not directly involved in the production of eco-friendly fabrics without dyes. However, coral-inspired technologies have led to the development of innovative textile production methods that reduce the need for synthetic dyes.\\n\\nHere's how it works:\\n\\n1. **Biomimicry**: Scientists have taken inspiration from the vibrant colors and unique properties of coral reefs to develop sustainable textile production methods. Coral reefs are known for their incredible ability to display a range of colors without using pigments, instead relying on the structure of their skeletons to refract and scatter light.\\n2. **Structural coloration**: Researchers have replicated this natural phenomenon by developing fibers with nanostructured surfaces that create color through the manipulation of light. This approach, known as structural coloration, eliminates the need for synthetic dyes and pigments.\\n3. **Protein-based fibers**: Some companies are using protein-based fibers, such as those derived from silk, soy, or milk, to create sustainable textiles. These fibers can be engineered to have specific properties, such as structural coloration, that reduce the need for dyes.\\n4. **Natural coloration**: Other innovations involve using natural colorants, such as plant-based dyes, to create a more sustainable textile production process. These natural colorants can be derived from various sources, including fruits, vegetables, and spices.\\n\\nWhile coral proteins are not directly involved in this process, the biomimicry approach inspired by coral reefs has led to the development of innovative, eco-friendly textile production methods that reduce the need for synthetic dyes. 
These sustainable textiles have the potential to minimize environmental impacts, such as water pollution and energy consumption, associated with traditional dyeing processes.\"}, 'logprobs': None, 'finish_reason': 'stop'}], 'usage': {'queue_time': 0.016959538, 'prompt_tokens': 23, 'prompt_time': 0.004020428, 'completion_tokens': 339, 'completion_time': 1.021682599, 'total_tokens': 362, 'total_time': 1.025703027}, 'system_fingerprint': 'fp_753a4aecf6', 'x_groq': {'id': 'req_01jkjsnbgpf5n9ybppv09d1rb5'}}\n",
+      "INFO:__main__:Response from llama3-70b-8192: Coral proteins are not directly involved in the production of eco-friendly fabrics without dyes. However, coral-inspired technologies have led to the development of innovative textile production methods that reduce the need for synthetic dyes.\n",
+      "\n",
+      "Here's how it works:\n",
+      "\n",
+      "1. **Biomimicry**: Scientists have taken inspiration from the vibrant colors and unique properties of coral reefs to develop sustainable textile production methods. Coral reefs are known for their incredible ability to display a range of colors without using pigments, instead relying on the structure of their skeletons to refract and scatter light.\n",
+      "2. **Structural coloration**: Researchers have replicated this natural phenomenon by developing fibers with nanostructured surfaces that create color through the manipulation of light. This approach, known as structural coloration, eliminates the need for synthetic dyes and pigments.\n",
+      "3. **Protein-based fibers**: Some companies are using protein-based fibers, such as those derived from silk, soy, or milk, to create sustainable textiles. These fibers can be engineered to have specific properties, such as structural coloration, that reduce the need for dyes.\n",
+      "4. **Natural coloration**: Other innovations involve using natural colorants, such as plant-based dyes, to create a more sustainable textile production process. These natural colorants can be derived from various sources, including fruits, vegetables, and spices.\n",
+      "\n",
+      "While coral proteins are not directly involved in this process, the biomimicry approach inspired by coral reefs has led to the development of innovative, eco-friendly textile production methods that reduce the need for synthetic dyes. These sustainable textiles have the potential to minimize environmental impacts, such as water pollution and energy consumption, associated with traditional dyeing processes.\n"
      ]
     }
    ],
    "source": [
+    "# Combined chatbot: Gemini Flash, Meta Llama 3 (GWDG), and Llama 3 (Groq)\n",
+    "# Gemini Flash rate limit: 15 requests per minute\n",
+    "# Groq rate limits: 30 RPM, 14,400 RPD, 6K TPM, and 500K TPD\n",
+    "\n",
+    "import os\n",
     "import json\n",
     "import logging\n",
     "import re\n",
+    "from typing import List, Tuple\n",
     "import gradio as gr\n",
     "from openai import OpenAI\n",
     "import google.generativeai as genai\n",
+    "import requests\n",
     "from functools import lru_cache\n",
     "from tenacity import retry, stop_after_attempt, wait_exponential\n",
     "from langchain_community.retrievers import BM25Retriever\n",
     "        context = []\n",
     "        for doc in docs:\n",
     "            context_str = f\"\"\"**Source**: [{doc.metadata['source']}]({doc.metadata['hyperlink']})\n",
+    "**Application**: {doc.metadata['application']}\n",
+    "**Key Concepts**: {', '.join(doc.metadata['technical_concepts'])}\n",
+    "**Strategy Excerpt**:\n",
+    "{doc.page_content.split('Strategy Excerpt:')[-1].strip()}\"\"\"\n",
     "            context.append(context_str)\n",
     "        return \"\\n\\n---\\n\\n\".join(context)\n",
     "\n",
     "# --- Generation System ---\n",
+    "SYSTEM_PROMPT = \"\"\"\n",
+    "**Biomimicry Expert Guidelines**\n",
     "\n",
+    "- Use only the provided AskNature context (e.g., Source, Application, Strategy, technical_concepts). If no context is given, note that you're using your own expertise.\n",
+    "- When referencing facts, use numeric citations in square brackets (e.g., [1]). Do not include full URLs inline.\n",
+    "- Bold all technical terms (e.g., **protein-based pigmentation**, **DNA-level fiber design**).\n",
+    "- Provide a concise, expert answer that explains the innovation and its sustainability benefits.\n",
+    "- End your response with a \"References\" section listing each URL with its citation number.\n",
+    "\n",
+    "Context: {context}\n",
+    "\"\"\"\n",
     "\n",
     "@retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=20))\n",
     "def get_ai_response(query: str, context: str, model: str) -> str:\n",
+    "    result = \"\"  # Initialize the result variable\n",
     "    try:\n",
     "        if model == \"gemini-2.0-flash\":\n",
     "            gemini_model = genai.GenerativeModel(model)\n",
     "            response = gemini_model.generate_content(\n",
     "                f\"{SYSTEM_PROMPT.format(context=context)}\\nQuestion: {query}\\nProvide a detailed technical answer:\"\n",
     "            )\n",
+    "            logger.info(f\"Response from gemini-2.0-flash: {response.text}\")\n",
+    "            result = _postprocess_response(response.text)\n",
     "        elif model == \"meta-llama-3-70b-instruct\":\n",
     "            response = client.chat.completions.create(\n",
     "                model=model,\n",
     "                temperature=0.4,\n",
     "                max_tokens=2000\n",
     "            )\n",
+    "            logger.info(f\"Response from meta-llama-3-70b-instruct: {response}\")\n",
+    "            try:\n",
+    "                result = response.choices[0].message.content\n",
+    "            except Exception as e:\n",
+    "                logger.error(f\"Error processing meta-llama-3-70b-instruct response: {str(e)}\")\n",
+    "                result = \"Failed to process response from meta-llama-3-70b-instruct\"\n",
+    "        elif model == \"llama3-70b-8192\":\n",
+    "            result = get_groq_llama3_response(query)\n",
+    "            logger.info(f\"Response from llama3-70b-8192: {result}\")\n",
+    "            if result is None:\n",
+    "                result = \"Failed to get response from llama3-70b-8192\"\n",
+    "        # Append the model name to the response for clarity\n",
+    "        result += f\"\\n\\n**Model:** {model}\"\n",
+    "        return result\n",
     "    except Exception as e:\n",
     "        logger.error(f\"Generation Error: {str(e)}\")\n",
     "        return \"I'm unable to generate a response right now. Please try again later.\"\n",
     "    response = re.sub(r\"\\*\\*([\\w-]+)\\*\\*\", r\"**\\1**\", response)\n",
     "    return response\n",
     "\n",
+    "def get_groq_llama3_response(query: str) -> str:\n",
+    "    \"\"\"Get response from Llama 3 on Groq Cloud.\"\"\"\n",
+    "    api_key = os.getenv(\"GROQ_API_KEY\")\n",
+    "    url = \"https://api.groq.com/openai/v1/chat/completions\"\n",
+    "    \n",
+    "    headers = {\n",
+    "        \"Content-Type\": \"application/json\",\n",
+    "        \"Authorization\": f\"Bearer {api_key}\"\n",
+    "    }\n",
+    "    \n",
+    "    payload = {\n",
+    "        \"model\": \"llama3-70b-8192\",\n",
+    "        \"messages\": [\n",
+    "            {\n",
+    "                \"role\": \"user\",\n",
+    "                \"content\": query\n",
+    "            }\n",
+    "        ]\n",
+    "    }\n",
+    "    \n",
+    "    try:\n",
+    "        response = requests.post(url, headers=headers, json=payload)\n",
+    "        response.raise_for_status()\n",
+    "        result = response.json()\n",
+    "        logger.info(f\"Groq API Response: {result}\")\n",
+    "        return result[\"choices\"][0][\"message\"][\"content\"]\n",
+    "    except requests.exceptions.RequestException as e:\n",
+    "        logger.error(f\"Groq API Error: {str(e)}\")\n",
+    "        return \"An error occurred while contacting Groq's Llama 3 model.\"\n",
+    "\n",
     "# --- Pipeline ---\n",
     "documents = load_and_chunk_data(data_file_name)\n",
     "retriever = EnhancedRetriever(documents)\n",
     "    return \"\", history + [(question, response)]\n",
     "\n",
     "with gr.Blocks(title=\"AskNature BioRAG Expert\", theme=gr.themes.Soft()) as demo:\n",
+    "    gr.Markdown(\"# 🌿 AskNature RAG-based Chatbot\")\n",
     "    with gr.Row():\n",
     "        chatbot = gr.Chatbot(label=\"Dialogue History\", height=500)\n",
     "    with gr.Row():\n",
+    "        question = gr.Textbox(placeholder=\"Ask about biomimicry (e.g. 'How does Werewool use coral proteins to make fibers?')\", label=\"Inquiry\", scale=4)\n",
+    "        model_selector = gr.Dropdown(choices=[\"gemini-2.0-flash\", \"meta-llama-3-70b-instruct(GWDG)\", \"llama3-70b-8192(Groq)\"], label=\"Generation Model\", value=\"gemini-2.0-flash\")\n",
     "        clear_btn = gr.Button(\"Clear History\", variant=\"secondary\")\n",
+    "\n",
     "    gr.Markdown(\"\"\"\n",
     "        <div style=\"text-align: center; color: #4a7c59;\">\n",
     "            <small>Powered by AskNature's Database | \n",
     "            Explore nature's blueprints at <a href=\"https://asknature.org\">asknature.org</a></small>\n",
     "        </div>\"\"\")\n",
+    "    \n",
     "    question.submit(chat_interface, [question, chatbot, model_selector], [question, chatbot])\n",
     "    clear_btn.click(lambda: [], None, chatbot)\n",
     "\n",
     "if __name__ == \"__main__\":\n",
+    "    demo.launch(show_error=True)\n"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,