ckharche committed
Commit 2063825 · verified · 1 Parent(s): 118610a

Upload 13 files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
  *.zip filter=lfs diff=lfs merge=lfs -text
  *.zst filter=lfs diff=lfs merge=lfs -text
  *tfevents* filter=lfs diff=lfs merge=lfs -text
+ static/android-chrome-512x512.png filter=lfs diff=lfs merge=lfs -text
MetaAIAPI_app.py ADDED
@@ -0,0 +1,137 @@
+ from flask import Flask, render_template, request, jsonify
+ from transformers import pipeline
+ from meta_ai_api import MetaAI
+ import os
+ import re  # For text processing
+
+ # Initialize Meta AI client
+ client = MetaAI()
+
+ # Category list (unchanged)
+ categories = [
+     "Banking", "Books", "Clothes", "College Admissions", "Cooking",
+     "Elementary Education", "Middle School Education", "High School Education", "University Education",
+     "Employment", "Finance", "Food", "Gardening", "Homelessness", "Housing", "Jobs", "Investing",
+     "Matrimonial", "Brain Medical", "Depression Medical", "Eye Medical", "Hand Medical",
+     "Head Medical", "Leg Medical", "Rental", "School", "Shopping",
+     "Baseball Sports", "Basketball Sports", "Cricket Sports", "Handball Sports",
+     "Jogging Sports", "Hockey Sports", "Running Sports", "Tennis Sports",
+     "Stocks", "Travel", "Tourism"
+ ]
+
+ # Zero-shot classification pipeline (unchanged)
+ classifier = pipeline("zero-shot-classification", model="facebook/bart-large-mnli")
+
+ app = Flask(__name__)
+
+ @app.route('/')
+ def home():
+     return render_template('index.html', categories=categories)
+
+ @app.route('/predict_categories', methods=['POST'])
+ def predict_categories():
+     data = request.get_json()
+     subject = data.get("subject")
+     description = data.get("description")
+     if not subject or not description:
+         return jsonify({"error": "Subject and description required"}), 400
+     prompt = f"{subject}. {description}"
+     try:
+         result = classifier(prompt, categories)
+         return jsonify({"predicted_categories": result['labels'][:3]})
+     except Exception as e:
+         return jsonify({"error": str(e)}), 500
+
+ @app.route('/generate_answer', methods=['POST'])
+ def generate_answer():
+     data = request.get_json()
+     category = data.get("category")
+     question = data.get("question")
+     if not category or not question:
+         return jsonify({"error": "Category and question required"}), 400
+
+     # Create a more specific prompt with formatting instructions
+     prompt = (
+         f"Category: {category}\n"
+         f"Question: {question}\n\n"
+         "Please provide a detailed and well-structured answer. Format your response as follows:\n"
+         "- For any list of items (e.g., websites, tips, steps, examples, or recommendations), use bullet points starting with '-' (e.g., - Item).\n"
+         "- Use bold text (e.g., **text**) for headings or key terms, such as section titles or important concepts.\n"
+         "- Use line breaks to separate paragraphs or sections for clarity.\n"
+         "- Ensure the response is clear, concise, and easy to read.\n"
+         "- If the question asks for recommendations, resources, or a list, always present them as bullet points.\n"
+         "For example, if asked for websites, format the response like this:\n"
+         "**Websites**\n"
+         "- Website 1: Description.\n"
+         "- Website 2: Description.\n"
+     )
+
+     try:
+         # Get the response from Meta AI
+         response = client.prompt(prompt)
+         raw_answer = response['message'].strip()
+
+         # Format the response to ensure consistency
+         formatted_answer = format_response(raw_answer)
+
+         return jsonify({"answer": formatted_answer})
+     except Exception as e:
+         return jsonify({"error": str(e)}), 500
+
+ def format_response(text):
+     """
+     Format the raw AI response to ensure bullet points and structure, even if the AI doesn't follow instructions.
+     """
+     # Split the text into lines
+     lines = text.split('\n')
+     formatted_lines = []
+     in_list = False
+
+     # Patterns to detect list-like content
+     list_indicators = [
+         r'^(General|Niche|International|Country-Specific|Additional)\b',  # Section headings
+         r'^(Indeed|LinkedIn|Glassdoor|H1BGrader|H1B Visa Jobs|ImmIhelp)\b',  # Website names
+         r'^(Network|Check|Stay)\b'  # Tips starting with verbs
+     ]
+
+     for line in lines:
+         line = line.strip()
+         if not line:
+             if in_list:
+                 in_list = False
+                 formatted_lines.append('')  # Add a line break after a list
+             continue
+
+         # Check if the line starts a new section (e.g., "General Job Search Websites")
+         if any(re.match(pattern, line, re.IGNORECASE) for pattern in list_indicators):
+             if in_list:
+                 in_list = False
+                 formatted_lines.append('')  # Add a line break before a new section
+             # Add the section as a bold heading
+             formatted_lines.append(f"**{line}**")
+             in_list = True
+             continue
+
+         # If we're in a list, format the line as a bullet point
+         if in_list and not line.startswith('-'):
+             # Split the line into website/tip and description (e.g., "Indeed (link unavailable): Description")
+             if ': ' in line:
+                 parts = line.split(': ', 1)
+                 item = parts[0].strip()
+                 description = parts[1].strip() if len(parts) > 1 else ""
+                 formatted_lines.append(f"- **{item}**: {description}")
+             else:
+                 formatted_lines.append(f"- {line}")
+         else:
+             # If not in a list, add the line as a paragraph
+             if in_list:
+                 in_list = False
+                 formatted_lines.append('')  # Add a line break after a list
+             formatted_lines.append(line)
+
+     # Join the lines with proper spacing
+     formatted_text = '\n'.join(formatted_lines)
+     return formatted_text
+
+ if __name__ == '__main__':
+     app.run(debug=True)
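
For reference, a tiny demo of what `format_response` does to a plain model reply (the sample text is made up; note that importing the module also initializes the Meta AI client and the classification pipeline, so this is illustrative rather than a fast unit test):

```python
from MetaAIAPI_app import format_response

sample = (
    "General Job Search Websites\n"
    "Monster: A global job board.\n"
    "ZipRecruiter: Aggregates postings from many sources."
)
print(format_response(sample))
# **General Job Search Websites**
# - **Monster**: A global job board.
# - **ZipRecruiter**: Aggregates postings from many sources.
```
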
README.md CHANGED
@@ -1,12 +1,217 @@
- ---
- title: Saayam STT
- emoji: 🐨
- colorFrom: red
- colorTo: green
- sdk: docker
- pinned: false
- license: mit
- short_description: Testing Speech-to-Text Feature for Saayam Web UI
- ---
-
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+
+ # 🔍 Saayam AI Assistant 🤖
+
+ Saayam AI Assistant is a web-based application built with Flask that lets users query several AI models (Meta AI, Gemini, ChatGPT, and Groq) for answers across multiple categories (e.g., Jobs, Education, Finance). The application uses zero-shot classification to predict relevant categories for user queries and returns detailed, well-formatted responses. It also collects performance metrics (latency, speed, temperature, token counts) to compare the efficiency of each model.
+
+ ## 🧠 Features
+ - **Multi-Model Support**: Query Meta AI, Gemini, ChatGPT, or Groq via a command-line argument.
+ - **Category Prediction**: Uses zero-shot classification (`facebook/bart-large-mnli`) to predict relevant categories for user queries; see the sketch after this list.
+ - **Formatted Responses**: Responses are structured with bullet points, bold headings, and clear sections for readability.
+ - **Performance Metrics**: Measures latency (TTFT/TTLT), speed (tokens/second), temperature, and token counts for each model.
+ - **Web Interface**: A user-friendly interface built with Flask, HTML, and JavaScript, with Markdown rendering for responses.
+
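+ The category prediction step can be tried in isolation. A minimal sketch (the query and candidate labels below are made up; the pipeline and model are the ones the app uses):
+
+ ```python
+ from transformers import pipeline
+
+ # The same zero-shot pipeline app.py builds at startup
+ classifier = pipeline("zero-shot-classification", model="facebook/bart-large-mnli")
+
+ result = classifier(
+     "How do I budget my monthly expenses?",
+     candidate_labels=["Finance", "Cooking", "Travel"],
+ )
+ print(result["labels"][:3])  # labels sorted by score, best first
+ ```
+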
+ ## 🔧 Setup Instructions
+
+ ### 1. Create & Activate Conda Environment
+ Create a Conda environment with Python 3.10 and activate it:
+
+ ```bash
+ conda create -n saayam-env python=3.10
+ conda activate saayam-env
+ ```
+
+ ### 2. Clone the Repository
+ Clone the project repository to your local machine:
+
+ ```bash
+ git clone https://github.com/RobuRishabh/Saayam_ai.git
+ cd Saayam_ai
+ ```
+
+ ### 3. Install Requirements
+ Install the required Python packages listed in `requirements.txt`:
+
+ ```bash
+ pip install -r requirements.txt
+ ```
+
+ Note: Ensure you have the following packages in your `requirements.txt`:
+
+ ```
+ flask
+ transformers
+ meta-ai-api
+ google-generativeai
+ openai
+ groq
+ python-dotenv
+ tiktoken
+ ```
+
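+ `tiktoken` is only needed for the token counts in the performance metrics. A quick sketch of what the app does with it (the sample string is arbitrary):
+
+ ```python
+ import tiktoken
+
+ # The same encoder app.py initializes for gpt-3.5-turbo token counting
+ enc = tiktoken.encoding_for_model("gpt-3.5-turbo")
+ print(len(enc.encode("Suggest good job search websites.")))  # token count
+ ```
+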
+ ### 4. Set Up Environment Variables
+ Create a `.env` file in the project root directory and add your API keys for Gemini, ChatGPT, and Groq:
+
+ ```
+ GEMINI_API_KEY=your_gemini_api_key
+ OPENAI_API_KEY=your_openai_api_key
+ GROQ_API_KEY=your_groq_api_key
+ ```
+
+ Note: Meta AI doesn't require an API key in this setup; it uses the `meta-ai-api` library.
+
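+ The app reads these keys at startup via `python-dotenv`. A minimal sketch of that pattern:
+
+ ```python
+ from dotenv import load_dotenv
+ import os
+
+ load_dotenv()  # reads .env from the current working directory
+ groq_api_key = os.getenv("GROQ_API_KEY")  # None if the variable is unset
+ ```
+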
+ ### 5. Run the Application
+ Run the application with a specific AI model using the `--model` argument. The available models are `meta_ai`, `gemini`, `openai`, and `groq`.
+
+ Meta AI:
+ ```bash
+ python app.py --model meta_ai
+ ```
+
+ Gemini:
+ ```bash
+ python app.py --model gemini
+ ```
+
+ ChatGPT (OpenAI):
+ ```bash
+ python app.py --model openai
+ ```
+
+ Groq:
+ ```bash
+ python app.py --model groq
+ ```
+
+ After running the application, open your browser and navigate to http://127.0.0.1:5000 to access the Saayam AI Assistant interface.
+
+ ## 📁 Project Structure
+
+ ```
+ Saayam_ai/
+ ├── app.py                 # Main application with multi-model support and metrics
+ ├── MetaAIAPI_app.py       # Meta AI-only version (simpler implementation)
+ ├── test_app.py            # Basic pytest suite for the Flask routes
+ ├── templates/
+ │   └── index.html         # Frontend HTML template
+ ├── static/
+ │   ├── android-chrome-192x192.png
+ │   ├── android-chrome-512x512.png
+ │   ├── apple-touch-icon.png
+ │   ├── favicon-16x16.png
+ │   ├── favicon-32x32.png
+ │   ├── favicon.ico
+ │   └── site.webmanifest   # Web manifest for favicon and icons
+ ├── requirements.txt       # Python dependencies
+ ├── .env                   # Environment variables (API keys)
+ ├── model_metrics.log      # Log file for performance metrics
+ └── .gitignore             # Git ignore file
+ ```
+
+ ## 📊 API Performance Evaluation
+ The application collects performance metrics for each AI model, including latency, speed, temperature, and token counts. The figures below were gathered with the query "Suggest me good job searching websites for international students" in the "Jobs" category.
+
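+ None of the calls stream tokens, so TTFT and TTLT are captured at the same instant. A sketch of the bookkeeping `generate_answer` performs around each API call (the answer string here is a placeholder):
+
+ ```python
+ import time
+
+ start_time = time.time()
+ raw_answer = "...model output..."        # stand-in for the blocking API call
+ first_token_time = time.time()           # non-streaming: first token == last token
+ end_time = time.time()
+
+ ttft = first_token_time - start_time
+ ttlt = end_time - start_time
+ output_tokens = len(raw_answer.split())  # tiktoken is used when available
+ speed = output_tokens / ttlt if ttlt > 0 else 0
+ ```
+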
+ ### Performance Metrics
+
+ **Meta AI**:
+ - Model: meta_ai
+ - Temperature: N/A (not configurable through meta-ai-api)
+ - Time to First Token (TTFT): 15.185 seconds
+ - Total Response Time (TTLT): 15.185 seconds
+ - Speed: 20.81 tokens/second
+ - Input Tokens: 127
+ - Output Tokens: 316
+
+ **Gemini**:
+ - Model: gemini
+ - Temperature: 0.7
+ - Time to First Token (TTFT): 4.515 seconds
+ - Total Response Time (TTLT): 4.515 seconds
+ - Speed: 100.32 tokens/second
+ - Input Tokens: 127
+ - Output Tokens: 453
+
+ **ChatGPT (OpenAI)**:
+ - Model: openai
+ - Temperature: 0.7
+ - Time to First Token (TTFT): 4.619 seconds
+ - Total Response Time (TTLT): 4.619 seconds
+ - Speed: 81.83 tokens/second
+ - Input Tokens: 176
+ - Output Tokens: 378
+
+ **Groq**:
+ - Model: groq
+ - Temperature: 0.7
+ - Time to First Token (TTFT): 0.856 seconds
+ - Total Response Time (TTLT): 0.856 seconds
+ - Speed: 630.66 tokens/second
+ - Input Tokens: 127
+ - Output Tokens: 540
+
+ ### Cost Analysis
+
+ - **Meta AI**: Free (unofficial API), but may have rate limits or reliability issues.
+ - **Gemini**: Free tier available, with paid plans for higher usage.
+ - **ChatGPT**: Pay-per-use (roughly $0.002 per 1K tokens for gpt-3.5-turbo).
+ - **Groq**: Free tier available, with paid plans for higher usage.
+
+ ### Limitations
+
+ - **Meta AI**: Slowest of the four, low throughput, and no temperature control.
+ - **Gemini**: Moderate performance; token counts are approximated with the OpenAI tokenizer, so they may differ from Gemini's own accounting.
+ - **ChatGPT**: Reliable, though slightly slower than Groq.
+ - **Groq**: Fastest, but produces the highest output token counts (verbose responses).
+
+ ## ⚖️ Comparison with Alternative Solutions
+
+ | Model   | Speed (tokens/s) | TTLT (s) | Cost        | Quality              |
+ |---------|------------------|----------|-------------|----------------------|
+ | Meta AI | 20.81            | 15.185   | Free        | Least consistent     |
+ | Gemini  | 100.32           | 4.515    | Free tier   | Moderate consistency |
+ | ChatGPT | 81.83            | 4.619    | Pay-per-use | Highly consistent    |
+ | Groq    | 630.66           | 0.856    | Free tier   | Practical, fast      |
+
+ ## 🛠️ Proof-of-Concept Implementation
+
+ ### Overview
+ A Flask-based web app that queries four models, classifies query categories, formats answers, and logs metrics.
+
+ ### Backend (`app.py`)
+ - Flask app exposing the routes `/predict_categories` and `/generate_answer`; see the client sketch after this list
+ - Model selected with the `--model` CLI argument
+ - Collects and logs metrics (TTFT, TTLT, token counts, temperature)
+
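+ Both routes accept JSON over POST. A hypothetical client call (assumes the dev server is running on port 5000 and that `requests` is installed; it is not in `requirements.txt`):
+
+ ```python
+ import requests
+
+ resp = requests.post(
+     "http://127.0.0.1:5000/generate_answer",
+     json={"category": "Jobs", "question": "Good job boards for new graduates?"},
+ )
+ data = resp.json()
+ print(data["answer"])   # Markdown-formatted answer
+ print(data["metrics"])  # TTFT, TTLT, speed, token counts
+ ```
+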
+ ### Frontend (`index.html`)
+ - HTML + JavaScript interface
+ - Markdown rendering using marked.js
+ - Submits subject, description, and category
+ - Displays the response plus metrics
+
+ ### Example
+ ```bash
+ python app.py --model groq
+ ```
+ Visit [http://127.0.0.1:5000](http://127.0.0.1:5000)
+
+ ## 📈 Analysis and Recommendations
+
+ - **Fastest**: Groq (0.856 s TTLT, 630.66 tokens/s)
+ - **Most Consistent**: ChatGPT
+ - **Cost-Effective**: Gemini & Groq
+ - **Slowest**: Meta AI
+
+ ### Recommendations
+
+ - Use **Groq** when real-time speed matters most
+ - Use **ChatGPT** for reliability and consistency
+ - Use **Gemini** for cost-conscious performance
+ - Avoid **Meta AI** in production
+
+ ## 🚀 Future Improvements
+
+ - Enable streaming responses so TTFT is meaningful on its own
+ - Add cosine similarity between responses to measure sensitivity to prompt changes
+ - Load testing (e.g., with Locust)
+ - Cache frequent queries to save cost
+
+ ## 🙌 Acknowledgments
+
+ Built with ❤️ using Flask, Transformers, and AI APIs.
+ Special thanks to the open-source contributors of `meta-ai-api`.
app.py ADDED
@@ -0,0 +1,336 @@
+ from flask import Flask, render_template, request, jsonify
+ from transformers import pipeline
+ from meta_ai_api import MetaAI
+ import google.generativeai as genai  # Gemini API
+ from openai import OpenAI  # OpenAI API
+ from groq import Groq  # Groq API
+ from huggingface_hub import InferenceClient  # Hugging Face API
+ from dotenv import load_dotenv
+ import os
+ import re
+ import argparse
+ import time
+ import tiktoken
+ import logging
+ import transformers
+
+ # Suppress transformers logging to reduce clutter
+ transformers.logging.set_verbosity_error()
+
+ # Load environment variables from .env
+ load_dotenv()
+
+ # Set up logging to a file for metrics
+ logging.basicConfig(
+     filename='model_metrics.log',
+     level=logging.INFO,
+     format='%(asctime)s - %(message)s'
+ )
+
+ # Ensure Flask's logger outputs to the console
+ console_handler = logging.StreamHandler()
+ console_handler.setLevel(logging.INFO)
+ werkzeug_logger = logging.getLogger('werkzeug')
+ werkzeug_logger.addHandler(console_handler)
+
+ # Parse command-line arguments
+ parser = argparse.ArgumentParser(description="Run Saayam AI Assistant with a specific AI model.")
+ parser.add_argument(
+     "--model",
+     type=str,
+     choices=["meta_ai", "gemini", "openai", "groq"],
+     default="meta_ai",
+     help="Choose the AI model to use: meta_ai, gemini, openai, or groq"
+ )
+ args = parser.parse_args()
+ selected_model = args.model
+
+ # Default temperature for models that support it
+ DEFAULT_TEMPERATURE = 0.7
+
+ # Initialize the chosen AI client
+ if selected_model == "meta_ai":
+     ai_client = MetaAI()
+ elif selected_model == "gemini":
+     gemini_api_key = os.getenv("GEMINI_API_KEY")
+     genai.configure(api_key=gemini_api_key)
+     ai_client = genai.GenerativeModel('gemini-1.5-flash')
+ elif selected_model == "openai":
+     ai_client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
+ elif selected_model == "groq":
+     groq_api_key = os.getenv("GROQ_API_KEY")
+     ai_client = Groq(api_key=groq_api_key)
+
+ # Initialize Hugging Face client for Speech-to-Text
+ hf_client = InferenceClient(token=os.getenv("HF_API_KEY"))
+
+ # Category list (unchanged)
+ categories = [
+     "Banking", "Books", "Clothes", "College Admissions", "Cooking",
+     "Elementary Education", "Middle School Education", "High School Education", "University Education",
+     "Employment", "Finance", "Food", "Gardening", "Homelessness", "Housing", "Jobs", "Investing",
+     "Matrimonial", "Brain Medical", "Depression Medical", "Eye Medical", "Hand Medical",
+     "Head Medical", "Leg Medical", "Rental", "School", "Shopping",
+     "Baseball Sports", "Basketball Sports", "Cricket Sports", "Handball Sports",
+     "Jogging Sports", "Hockey Sports", "Running Sports", "Tennis Sports",
+     "Stocks", "Travel", "Tourism"
+ ]
+
+ # Zero-shot classification pipeline (unchanged)
+ classifier = pipeline("zero-shot-classification", model="facebook/bart-large-mnli")
+
+ # Initialize tokenizer for token counting (for OpenAI models)
+ try:
+     openai_tokenizer = tiktoken.encoding_for_model("gpt-3.5-turbo")
+ except Exception:
+     openai_tokenizer = None  # Fallback if tiktoken fails
+
+ app = Flask(__name__)
+
+ @app.route('/')
+ def home():
+     return render_template('index.html', categories=categories)
+
+ @app.route('/transcribe', methods=['POST'])
+ def transcribe_audio():
+     """
+     Transcribe audio using Whisper Large V3 Turbo via the Hugging Face Inference API.
+     """
+     if 'audio' not in request.files:
+         return jsonify({"error": "No audio file provided"}), 400
+
+     audio_file = request.files['audio']
+     temp_file_path = None
+
+     try:
+         # Read the audio bytes
+         audio_bytes = audio_file.read()
+
+         # Pick a file suffix from the content type; webm recordings are saved
+         # with a .ogg extension to avoid a video/webm interpretation
+         content_type = audio_file.content_type or 'audio/webm'
+         if 'webm' in content_type:
+             suffix = '.ogg'
+         elif 'wav' in content_type:
+             suffix = '.wav'
+         elif 'ogg' in content_type:
+             suffix = '.ogg'
+         else:
+             suffix = '.webm'
+
+         # Save to a temporary file
+         temp_dir = "/tmp/audio"
+         if not os.path.exists(temp_dir):
+             os.makedirs(temp_dir)
+
+         # Use os.path.join for explicit path control in the container
+         temp_file_path = os.path.join(temp_dir, f"recording_{int(time.time())}{suffix}")
+
+         with open(temp_file_path, "wb") as f:
+             f.write(audio_bytes)
+
+         # Pass the file path to the Hugging Face client
+         result = hf_client.automatic_speech_recognition(
+             temp_file_path,
+             model="openai/whisper-large-v3-turbo"
+         )
+
+         # Clean up the temporary file
+         if temp_file_path and os.path.exists(temp_file_path):
+             os.unlink(temp_file_path)
+
+         # Extract transcribed text
+         transcribed_text = ""
+         if isinstance(result, dict) and 'text' in result:
+             transcribed_text = result['text']
+         elif hasattr(result, 'text'):
+             transcribed_text = result.text
+         elif isinstance(result, str):
+             transcribed_text = result
+         else:
+             transcribed_text = str(result)
+
+         return jsonify({
+             "text": transcribed_text.strip()
+         })
+
+     except Exception as e:
+         # Clean up temp file if it exists
+         if temp_file_path and os.path.exists(temp_file_path):
+             os.unlink(temp_file_path)
+
+         import traceback
+         traceback.print_exc()
+         return jsonify({"error": f"Transcription failed: {str(e)}"}), 500
+
+
+ @app.route('/predict_categories', methods=['POST'])
+ def predict_categories():
+     data = request.get_json()
+     subject = data.get("subject")
+     description = data.get("description")
+     if not subject or not description:
+         return jsonify({"error": "Subject and description required"}), 400
+     prompt = f"{subject}. {description}"
+     try:
+         result = classifier(prompt, categories)
+         return jsonify({"predicted_categories": result['labels'][:3]})
+     except Exception as e:
+         return jsonify({"error": str(e)}), 500
+
+ @app.route('/generate_answer', methods=['POST'])
+ def generate_answer():
+     data = request.get_json()
+     category = data.get("category")
+     question = data.get("question")
+
+     if not category or not question:
+         return jsonify({"error": "Category and question required"}), 400
+
+     # Create a prompt with formatting instructions
+     prompt = (
+         f"Category: {category}\n"
+         f"Question: {question}\n\n"
+         "Please provide a detailed and well-structured answer. Format your response as follows:\n"
+         "- For any list of items (e.g., websites, tips, steps, examples, or recommendations), use bullet points starting with '-' (e.g., - Item).\n"
+         "- Use bold text (e.g., **text**) for headings or key terms, such as section titles or important concepts.\n"
+         "- Use line breaks to separate paragraphs or sections for clarity.\n"
+         "- Ensure the response is clear, concise, and easy to read.\n"
+         "- If the question asks for recommendations, resources, or a list, always present them as bullet points.\n"
+         "For example, if asked for websites, format the response like this:\n"
+         "**Websites**\n"
+         "- Website 1: Description.\n"
+         "- Website 2: Description.\n"
+     )
+
+     # Count input tokens (approximation for non-OpenAI models)
+     if openai_tokenizer:
+         input_tokens = len(openai_tokenizer.encode(prompt))
+     else:
+         input_tokens = len(prompt.split())
+
+     # Measure latency and generate response
+     try:
+         start_time = time.time()
+         first_token_time = None
+         raw_answer = None
+
+         if selected_model == "meta_ai":
+             response = ai_client.prompt(prompt)
+             raw_answer = response['message'].strip()
+             first_token_time = time.time()
+         elif selected_model == "gemini":
+             response = ai_client.generate_content(prompt, generation_config={"temperature": DEFAULT_TEMPERATURE})
+             raw_answer = response.text.strip()
+             first_token_time = time.time()
+         elif selected_model == "openai":
+             response = ai_client.chat.completions.create(
+                 model="gpt-3.5-turbo",
+                 messages=[
+                     {"role": "system", "content": "You are a helpful assistant."},
+                     {"role": "user", "content": prompt}
+                 ],
+                 temperature=DEFAULT_TEMPERATURE
+             )
+             raw_answer = response.choices[0].message.content.strip()
+             first_token_time = time.time()
+         elif selected_model == "groq":
+             response = ai_client.chat.completions.create(
+                 model="llama-3.1-8b-instant",
+                 messages=[
+                     {"role": "system", "content": "You are a helpful assistant."},
+                     {"role": "user", "content": prompt}
+                 ],
+                 temperature=DEFAULT_TEMPERATURE
+             )
+             raw_answer = response.choices[0].message.content.strip()
+             first_token_time = time.time()
+
+         end_time = time.time()
+
+         # Calculate latency
+         ttft = first_token_time - start_time
+         ttlt = end_time - start_time
+
+         # Format the response
+         formatted_answer = format_response(raw_answer)
+
+         # Count output tokens
+         if openai_tokenizer:
+             output_tokens = len(openai_tokenizer.encode(raw_answer))
+         else:
+             output_tokens = len(raw_answer.split())
+
+         # Calculate speed (tokens per second)
+         speed = output_tokens / ttlt if ttlt > 0 else 0
+
+         # Log metrics
+         metrics = {
+             "model": selected_model,
+             "temperature": DEFAULT_TEMPERATURE if selected_model in ["gemini", "openai", "groq"] else "N/A",
+             "ttft_seconds": round(ttft, 3),
+             "ttlt_seconds": round(ttlt, 3),
+             "speed_tokens_per_second": round(speed, 2),
+             "input_tokens": input_tokens,
+             "output_tokens": output_tokens
+         }
+         logging.info(f"Metrics: {metrics}")
+
+         # Return the answer and metrics
+         return jsonify({
+             "answer": formatted_answer,
+             "metrics": metrics
+         })
+     except Exception as e:
+         return jsonify({"error": str(e)}), 500
+
+ def format_response(text):
+     lines = text.split('\n')
+     formatted_lines = []
+     in_list = False
+
+     list_indicators = [
+         r'^(General|Niche|International|Country-Specific|Additional)\b',
+         r'^(Indeed|LinkedIn|Glassdoor|H1BGrader|H1B Visa Jobs|ImmIhelp)\b',
+         r'^(Network|Check|Stay)\b'
+     ]
+
+     for line in lines:
+         line = line.strip()
+         if not line:
+             if in_list:
+                 in_list = False
+                 formatted_lines.append('')
+             continue
+
+         if any(re.match(pattern, line, re.IGNORECASE) for pattern in list_indicators):
+             if in_list:
+                 in_list = False
+                 formatted_lines.append('')
+             formatted_lines.append(f"**{line}**")
+             in_list = True
+             continue
+
+         if in_list and not line.startswith('-'):
+             if ': ' in line:
+                 parts = line.split(': ', 1)
+                 item = parts[0].strip()
+                 description = parts[1].strip() if len(parts) > 1 else ""
+                 formatted_lines.append(f"- **{item}**: {description}")
+             else:
+                 formatted_lines.append(f"- {line}")
+         else:
+             if in_list:
+                 in_list = False
+                 formatted_lines.append('')
+             formatted_lines.append(line)
+
+     formatted_text = '\n'.join(formatted_lines)
+     return formatted_text
+
+ if __name__ == '__main__':
+     print(f"Starting Saayam AI Assistant with model: {selected_model}")
+     app.run(debug=True, host='127.0.0.1', port=5000)
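
A quick way to exercise the `/transcribe` route from Python (a hypothetical smoke test: it assumes a local `recording.ogg`, the dev server on port 5000, and `requests` installed):

```python
import requests

with open("recording.ogg", "rb") as f:
    resp = requests.post(
        "http://127.0.0.1:5000/transcribe",
        files={"audio": ("recording.ogg", f, "audio/ogg")},
    )
print(resp.json())  # {"text": "..."} on success, {"error": "..."} otherwise
```
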
model_metrics.log ADDED
@@ -0,0 +1,141 @@
+ 2025-11-20 15:13:05,032 - Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`
+ 2025-11-20 15:18:21,164 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-20 15:18:21,164 - Press CTRL+C to quit
+ 2025-11-20 15:18:21,167 - * Restarting with stat
+ 2025-11-20 15:18:35,608 - * Debugger is active!
+ 2025-11-20 15:18:35,612 - * Debugger PIN: 465-628-698
+ 2025-11-20 15:18:35,710 - 127.0.0.1 - - [20/Nov/2025 15:18:35] "GET / HTTP/1.1" 200 -
+ 2025-11-20 15:18:35,965 - 127.0.0.1 - - [20/Nov/2025 15:18:35] "GET /static/favicon.ico HTTP/1.1" 200 -
+ 2025-11-20 15:18:35,968 - 127.0.0.1 - - [20/Nov/2025 15:18:35] "GET /static/site.webmanifest HTTP/1.1" 200 -
+ 2025-11-20 15:19:05,508 - Metrics: {'model': 'meta_ai', 'temperature': 'N/A', 'ttft_seconds': 10.035, 'ttlt_seconds': 10.035, 'speed_tokens_per_second': 3.29, 'input_tokens': 115, 'output_tokens': 33}
+ 2025-11-20 15:19:05,510 - 127.0.0.1 - - [20/Nov/2025 15:19:05] "POST /generate_answer HTTP/1.1" 200 -
+ 2025-11-20 15:19:08,871 - Metrics: {'model': 'meta_ai', 'temperature': 'N/A', 'ttft_seconds': 3.13, 'ttlt_seconds': 3.13, 'speed_tokens_per_second': 14.7, 'input_tokens': 115, 'output_tokens': 46}
+ 2025-11-20 15:19:08,872 - 127.0.0.1 - - [20/Nov/2025 15:19:08] "POST /generate_answer HTTP/1.1" 200 -
+ 2025-11-20 15:19:59,788 - Metrics: {'model': 'meta_ai', 'temperature': 'N/A', 'ttft_seconds': 7.48, 'ttlt_seconds': 7.48, 'speed_tokens_per_second': 26.07, 'input_tokens': 126, 'output_tokens': 195}
+ 2025-11-20 15:19:59,788 - 127.0.0.1 - - [20/Nov/2025 15:19:59] "POST /generate_answer HTTP/1.1" 200 -
+ 2025-11-20 15:20:48,377 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-20 15:20:48,377 - Press CTRL+C to quit
+ 2025-11-20 15:20:48,379 - * Restarting with stat
+ 2025-11-20 15:21:03,705 - * Debugger is active!
+ 2025-11-20 15:21:03,712 - * Debugger PIN: 465-628-698
+ 2025-11-20 15:21:03,747 - 127.0.0.1 - - [20/Nov/2025 15:21:03] "GET / HTTP/1.1" 200 -
+ 2025-11-20 15:21:04,891 - 127.0.0.1 - - [20/Nov/2025 15:21:04] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-20 15:23:15,016 - HTTP Request: POST https://api.groq.com/openai/v1/chat/completions "HTTP/1.1 400 Bad Request"
+ 2025-11-20 15:23:15,017 - 127.0.0.1 - - [20/Nov/2025 15:23:15] "POST /generate_answer HTTP/1.1" 500 -
+ 2025-11-20 15:24:09,660 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-20 15:24:10,236 - * Restarting with stat
+ 2025-11-20 15:24:17,104 - * Debugger is active!
+ 2025-11-20 15:24:17,106 - * Debugger PIN: 465-628-698
+ 2025-11-20 15:24:29,466 - HTTP Request: POST https://api.groq.com/openai/v1/chat/completions "HTTP/1.1 404 Not Found"
+ 2025-11-20 15:24:29,468 - 127.0.0.1 - - [20/Nov/2025 15:24:29] "POST /generate_answer HTTP/1.1" 500 -
+ 2025-11-20 15:25:10,940 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-20 15:25:11,864 - * Restarting with stat
+ 2025-11-20 15:25:20,254 - * Debugger is active!
+ 2025-11-20 15:25:20,257 - * Debugger PIN: 465-628-698
+ 2025-11-20 15:26:01,027 - HTTP Request: POST https://api.groq.com/openai/v1/chat/completions "HTTP/1.1 200 OK"
+ 2025-11-20 15:26:01,071 - Metrics: {'model': 'grok', 'temperature': 0.7, 'ttft_seconds': 1.227, 'ttlt_seconds': 1.227, 'speed_tokens_per_second': 301.62, 'input_tokens': 126, 'output_tokens': 370}
+ 2025-11-20 15:26:01,075 - 127.0.0.1 - - [20/Nov/2025 15:26:01] "POST /generate_answer HTTP/1.1" 200 -
+ 2025-11-21 15:12:43,192 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-21 15:12:43,192 - Press CTRL+C to quit
+ 2025-11-21 15:12:43,194 - * Restarting with stat
+ 2025-11-21 15:12:49,726 - * Debugger is active!
+ 2025-11-21 15:12:49,734 - * Debugger PIN: 465-628-698
+ 2025-11-21 15:12:49,781 - 127.0.0.1 - - [21/Nov/2025 15:12:49] "GET / HTTP/1.1" 200 -
+ 2025-11-21 15:12:49,996 - 127.0.0.1 - - [21/Nov/2025 15:12:49] "GET /static/site.webmanifest HTTP/1.1" 200 -
+ 2025-11-21 15:13:30,295 - HTTP Request: POST https://api.groq.com/openai/v1/chat/completions "HTTP/1.1 200 OK"
+ 2025-11-21 15:13:30,341 - Metrics: {'model': 'groq', 'temperature': 0.7, 'ttft_seconds': 1.451, 'ttlt_seconds': 1.451, 'speed_tokens_per_second': 298.44, 'input_tokens': 134, 'output_tokens': 433}
+ 2025-11-21 15:13:30,342 - 127.0.0.1 - - [21/Nov/2025 15:13:30] "POST /generate_answer HTTP/1.1" 200 -
+ 2025-11-21 16:41:31,251 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-21 16:41:31,252 - Press CTRL+C to quit
+ 2025-11-21 16:41:31,256 - * Restarting with stat
+ 2025-11-21 16:41:57,973 - * Debugger is active!
+ 2025-11-21 16:41:57,983 - * Debugger PIN: 465-628-698
+ 2025-11-21 16:41:58,031 - 127.0.0.1 - - [21/Nov/2025 16:41:58] "GET / HTTP/1.1" 200 -
+ 2025-11-21 16:41:58,408 - 127.0.0.1 - - [21/Nov/2025 16:41:58] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 16:48:14,113 - 127.0.0.1 - - [21/Nov/2025 16:48:14] "GET / HTTP/1.1" 200 -
+ 2025-11-21 16:48:14,330 - 127.0.0.1 - - [21/Nov/2025 16:48:14] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 16:48:14,333 - 127.0.0.1 - - [21/Nov/2025 16:48:14] "GET /static/favicon.ico HTTP/1.1" 200 -
+ 2025-11-21 16:48:23,602 - 127.0.0.1 - - [21/Nov/2025 16:48:23] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 16:48:51,478 - 127.0.0.1 - - [21/Nov/2025 16:48:51] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 16:48:51,483 - 127.0.0.1 - - [21/Nov/2025 16:48:51] "GET /.well-known/appspecific/com.chrome.devtools.json HTTP/1.1" 404 -
+ 2025-11-21 16:48:57,299 - 127.0.0.1 - - [21/Nov/2025 16:48:57] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:00:33,452 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-21 17:00:34,779 - * Restarting with stat
+ 2025-11-21 17:05:05,788 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-21 17:05:05,789 - Press CTRL+C to quit
+ 2025-11-21 17:05:05,793 - * Restarting with stat
+ 2025-11-21 17:05:24,987 - * Debugger is active!
+ 2025-11-21 17:05:24,993 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:05:31,454 - 127.0.0.1 - - [21/Nov/2025 17:05:31] "GET / HTTP/1.1" 200 -
+ 2025-11-21 17:05:31,511 - 127.0.0.1 - - [21/Nov/2025 17:05:31] "GET /.well-known/appspecific/com.chrome.devtools.json HTTP/1.1" 404 -
+ 2025-11-21 17:05:31,753 - 127.0.0.1 - - [21/Nov/2025 17:05:31] "GET /static/favicon.ico HTTP/1.1" 200 -
+ 2025-11-21 17:05:31,755 - 127.0.0.1 - - [21/Nov/2025 17:05:31] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:05:43,532 - 127.0.0.1 - - [21/Nov/2025 17:05:43] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:05:50,954 - 127.0.0.1 - - [21/Nov/2025 17:05:50] "GET / HTTP/1.1" 200 -
+ 2025-11-21 17:05:51,252 - 127.0.0.1 - - [21/Nov/2025 17:05:51] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:05:53,650 - 127.0.0.1 - - [21/Nov/2025 17:05:53] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:05:53,669 - 127.0.0.1 - - [21/Nov/2025 17:05:53] "GET /.well-known/appspecific/com.chrome.devtools.json HTTP/1.1" 404 -
+ 2025-11-21 17:06:07,126 - 127.0.0.1 - - [21/Nov/2025 17:06:07] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:06:20,044 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-21 17:06:21,979 - * Restarting with stat
+ 2025-11-21 17:06:53,632 - * Debugger is active!
+ 2025-11-21 17:06:53,642 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:06:53,698 - 127.0.0.1 - - [21/Nov/2025 17:06:53] "GET / HTTP/1.1" 200 -
+ 2025-11-21 17:06:53,756 - 127.0.0.1 - - [21/Nov/2025 17:06:53] "GET /.well-known/appspecific/com.chrome.devtools.json HTTP/1.1" 404 -
+ 2025-11-21 17:06:54,076 - 127.0.0.1 - - [21/Nov/2025 17:06:54] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:06:54,078 - 127.0.0.1 - - [21/Nov/2025 17:06:54] "GET /static/favicon.ico HTTP/1.1" 200 -
+ 2025-11-21 17:09:47,214 - 127.0.0.1 - - [21/Nov/2025 17:09:47] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:24:06,935 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-21 17:24:08,306 - * Restarting with stat
+ 2025-11-21 17:24:30,142 - * Debugger is active!
+ 2025-11-21 17:24:30,144 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:24:40,736 - 127.0.0.1 - - [21/Nov/2025 17:24:40] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:26:37,091 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-21 17:26:38,450 - * Restarting with stat
+ 2025-11-21 17:26:52,990 - * Debugger is active!
+ 2025-11-21 17:26:52,997 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:27:10,347 - 127.0.0.1 - - [21/Nov/2025 17:27:10] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:27:25,067 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-21 17:27:25,067 - Press CTRL+C to quit
+ 2025-11-21 17:27:25,069 - * Restarting with stat
+ 2025-11-21 17:27:35,951 - * Debugger is active!
+ 2025-11-21 17:27:35,956 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:27:35,985 - 127.0.0.1 - - [21/Nov/2025 17:27:35] "GET / HTTP/1.1" 200 -
+ 2025-11-21 17:27:36,140 - 127.0.0.1 - - [21/Nov/2025 17:27:36] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:28:38,222 - 127.0.0.1 - - [21/Nov/2025 17:28:38] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:28:38,232 - 127.0.0.1 - - [21/Nov/2025 17:28:38] "GET /.well-known/appspecific/com.chrome.devtools.json HTTP/1.1" 404 -
+ 2025-11-21 17:28:56,242 - 127.0.0.1 - - [21/Nov/2025 17:28:56] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:34:01,152 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-21 17:34:01,153 - Press CTRL+C to quit
+ 2025-11-21 17:34:01,155 - * Restarting with stat
+ 2025-11-21 17:34:14,790 - * Debugger is active!
+ 2025-11-21 17:34:14,795 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:34:36,971 - 127.0.0.1 - - [21/Nov/2025 17:34:36] "GET / HTTP/1.1" 200 -
+ 2025-11-21 17:34:37,154 - 127.0.0.1 - - [21/Nov/2025 17:34:37] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:34:51,570 - 127.0.0.1 - - [21/Nov/2025 17:34:51] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:34:54,847 - 127.0.0.1 - - [21/Nov/2025 17:34:54] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:35:02,069 - 127.0.0.1 - - [21/Nov/2025 17:35:02] "POST /transcribe HTTP/1.1" 500 -
+ 2025-11-21 17:35:16,704 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-21 17:35:17,645 - * Restarting with stat
+ 2025-11-21 17:35:31,749 - * Debugger is active!
+ 2025-11-21 17:35:31,753 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:36:46,964 - * Detected change in 'C:\\Users\\chaitanyakharche\\OneDrive\\Desktop\\saayam\\ai\\app.py', reloading
+ 2025-11-21 17:36:47,930 - * Restarting with stat
+ 2025-11-21 17:37:02,683 - WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
+ * Running on http://127.0.0.1:5000
+ 2025-11-21 17:37:02,683 - Press CTRL+C to quit
+ 2025-11-21 17:37:02,687 - * Restarting with stat
+ 2025-11-21 17:37:15,615 - * Debugger is active!
+ 2025-11-21 17:37:15,617 - * Debugger PIN: 465-628-698
+ 2025-11-21 17:37:15,714 - 127.0.0.1 - - [21/Nov/2025 17:37:15] "GET / HTTP/1.1" 200 -
+ 2025-11-21 17:37:15,841 - 127.0.0.1 - - [21/Nov/2025 17:37:15] "GET /static/site.webmanifest HTTP/1.1" 304 -
+ 2025-11-21 17:37:30,830 - 127.0.0.1 - - [21/Nov/2025 17:37:30] "POST /transcribe HTTP/1.1" 200 -
+ 2025-11-21 17:37:44,136 - 127.0.0.1 - - [21/Nov/2025 17:37:44] "POST /transcribe HTTP/1.1" 200 -
+ 2025-11-21 17:38:01,648 - 127.0.0.1 - - [21/Nov/2025 17:38:01] "POST /transcribe HTTP/1.1" 200 -
static/android-chrome-192x192.png ADDED
static/android-chrome-512x512.png ADDED

Git LFS Details

  • SHA256: b171ec2611e5755bf1fc228568dcc8568d93879a874f0fc9c3c5fdec692db697
  • Pointer size: 131 Bytes
  • Size of remote file: 222 kB
static/apple-touch-icon.png ADDED
static/favicon-16x16.png ADDED
static/favicon-32x32.png ADDED
static/favicon.ico ADDED
static/site.webmanifest ADDED
@@ -0,0 +1 @@
+ {"name":"","short_name":"","icons":[{"src":"/android-chrome-192x192.png","sizes":"192x192","type":"image/png"},{"src":"/android-chrome-512x512.png","sizes":"512x512","type":"image/png"}],"theme_color":"#ffffff","background_color":"#ffffff","display":"standalone"}
templates/index.html ADDED
@@ -0,0 +1,405 @@
+ <!DOCTYPE html>
+ <html lang="en">
+ <head>
+     <meta charset="UTF-8">
+     <title>Saayam AI Assistant</title>
+
+     <!-- Favicon & Icons -->
+     <link rel="apple-touch-icon" sizes="180x180" href="{{ url_for('static', filename='apple-touch-icon.png') }}">
+     <link rel="icon" type="image/png" sizes="32x32" href="{{ url_for('static', filename='favicon-32x32.png') }}">
+     <link rel="icon" type="image/png" sizes="16x16" href="{{ url_for('static', filename='favicon-16x16.png') }}">
+     <link rel="manifest" href="{{ url_for('static', filename='site.webmanifest') }}">
+     <link rel="icon" type="image/x-icon" href="{{ url_for('static', filename='favicon.ico') }}">
+
+     <!-- Add marked.js for Markdown rendering -->
+     <script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
+
+     <style>
+         body {
+             font-family: Arial, sans-serif;
+             margin: 20px;
+             background-color: #f9f9f9;
+         }
+         .container {
+             max-width: 600px;
+             margin: auto;
+             background: #fff;
+             padding: 20px;
+             border-radius: 8px;
+             box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);
+         }
+         h1 {
+             text-align: center;
+             color: #4CAF50;
+         }
+         label {
+             font-weight: bold;
+             margin-top: 10px;
+             display: block;
+         }
+         textarea, select, input, button {
+             margin-top: 10px;
+             width: 100%;
+             padding: 10px;
+             border: 1px solid #ccc;
+             border-radius: 5px;
+             box-sizing: border-box; /* Ensures padding doesn't affect width */
+         }
+         button {
+             background-color: #4CAF50;
+             color: white;
+             border: none;
+             cursor: pointer;
+             font-size: 16px;
+         }
+         button:hover {
+             background-color: #45a049;
+         }
+
+         /* STT Toolbar Styles */
+         .stt-toolbar {
+             display: flex;
+             gap: 10px;
+             margin-top: 5px;
+             margin-bottom: 5px;
+             align-items: center;
+         }
+         .stt-select {
+             flex-grow: 1;
+             margin-top: 0;
+             padding: 8px;
+         }
+         .mic-button {
+             width: auto;
+             margin-top: 0;
+             background-color: #f0f0f0;
+             color: #333;
+             border: 1px solid #ccc;
+             padding: 8px 15px;
+             display: flex;
+             align-items: center;
+             gap: 5px;
+             transition: all 0.3s ease;
+         }
+         .mic-button:hover {
+             background-color: #e0e0e0;
+         }
+         .mic-button.recording {
+             background-color: #ffebee;
+             color: #d32f2f;
+             border-color: #d32f2f;
+             animation: pulse 1.5s infinite;
+         }
+         .mic-icon {
+             width: 16px;
+             height: 16px;
+             fill: currentColor;
+         }
+         @keyframes pulse {
+             0% { box-shadow: 0 0 0 0 rgba(211, 47, 47, 0.4); }
+             70% { box-shadow: 0 0 0 10px rgba(211, 47, 47, 0); }
+             100% { box-shadow: 0 0 0 0 rgba(211, 47, 47, 0); }
+         }
+
+         .predicted-categories {
+             margin-top: 10px;
+             display: flex;
+             gap: 10px;
+             flex-wrap: wrap;
+         }
+         .category-option {
+             padding: 10px;
+             border: 1px solid #ccc;
+             border-radius: 5px;
+             background-color: #e7f5e7;
+             cursor: pointer;
+         }
+         .category-option.selected {
+             background-color: #4CAF50;
+             color: white;
+             border: 1px solid #4CAF50;
+         }
+         .loading-message {
+             text-align: center;
+             margin-top: 10px;
+             font-style: italic;
+             color: #888;
+         }
+         .response {
+             margin-top: 20px;
+             display: none;
+         }
+         .response p {
+             background: #e7f5e7;
+             padding: 10px;
+             border: 1px solid #4CAF50;
+             border-radius: 5px;
+             font-family: Arial, sans-serif;
+         }
+         .metrics {
+             margin-top: 10px;
+             padding: 10px;
+             background: #f0f0f0;
+             border-radius: 5px;
+         }
+         .metrics p {
+             margin: 5px 0;
+         }
+     </style>
+ </head>
+ <body>
+     <div class="container">
+         <h1>Saayam AI Assistant</h1>
+         <p><strong>Homepage:</strong><br>Enter a subject and description for your query.<br>
+         Optionally, select a category from the dropdown menu.</p>
+
+         <form id="qa-form">
+             <label for="subject">Subject:</label>
+             <input id="subject" name="subject" type="text" required />
+
+             <label for="category">Category (Optional):</label>
+             <select id="category" name="category">
+                 <option value="" disabled selected>Select a category</option>
+             </select>
+
+             <label for="description">Description:</label>
+
+             <!-- STT Toolbar -->
+             <div class="stt-toolbar">
+                 <select id="stt-language" class="stt-select">
+                     <option value="auto">Auto-Detect Language</option>
+                     <option value="en">English</option>
+                     <option value="zh">Mandarin Chinese</option>
+                     <option value="hi">Hindi</option>
+                     <option value="es">Spanish</option>
+                     <option value="fr">French</option>
+                     <option value="ar">Arabic</option>
+                     <option value="bn">Bengali</option>
+                     <option value="pt">Portuguese</option>
+                     <option value="ru">Russian</option>
+                     <option value="ur">Urdu</option>
+                     <option value="id">Indonesian</option>
+                     <option value="de">German</option>
+                     <option value="ja">Japanese</option>
+                 </select>
+                 <button type="button" id="mic-btn" class="mic-button" onclick="toggleRecording()">
+                     <svg class="mic-icon" viewBox="0 0 24 24">
+                         <path d="M12 14c1.66 0 3-1.34 3-3V5c0-1.66-1.34-3-3-3S9 3.34 9 5v6c0 1.66 1.34 3 3 3z"/>
+                         <path d="M17 11c0 2.76-2.24 5-5 5s-5-2.24-5-5H5c0 3.53 2.61 6.43 6 6.92V21h2v-3.08c3.39-.49 6-3.39 6-6.92h-2z"/>
+                     </svg>
+                     Record
+                 </button>
+             </div>
+
+             <textarea id="description" name="description" rows="4" required placeholder="Type or use the microphone to speak..."></textarea>
+
+             <div id="category-prediction-area"></div>
+
+             <button type="button" onclick="askQuestion()" style="margin-top: 20px;">Ask</button>
+         </form>
+
+         <div class="response" id="response-container">
+             <h3>AI Response:</h3>
+             <div id="response-text"></div>
+             <div class="metrics" id="metrics-container"></div>
+         </div>
+     </div>
+
+     <script>
+         const categories = JSON.parse('{{ categories | tojson | safe }}');
+         const categoryDropdown = document.getElementById("category");
+         const predictionArea = document.getElementById("category-prediction-area");
+         let selectedCategory = "";
+
+         // Populate category dropdown
+         categories.forEach(cat => {
+             const option = document.createElement("option");
+             option.value = cat;
+             option.textContent = cat;
+             categoryDropdown.appendChild(option);
+         });
+
+         // --- Speech to Text Logic ---
+         let mediaRecorder;
+         let audioChunks = [];
+         const micBtn = document.getElementById('mic-btn');
+         const descriptionArea = document.getElementById('description');
+
+         async function toggleRecording() {
+             if (mediaRecorder && mediaRecorder.state === "recording") {
+                 mediaRecorder.stop();
+             } else {
+                 try {
+                     const stream = await navigator.mediaDevices.getUserMedia({ audio: true });
+                     startRecording(stream);
+                 } catch (err) {
+                     console.error("Error accessing microphone:", err);
+                     alert("Microphone access denied or unavailable.");
+                 }
+             }
+         }
+
+         function startRecording(stream) {
+             audioChunks = [];
+             let options;
+             if (MediaRecorder.isTypeSupported('audio/webm;codecs=opus')) {
+                 options = { mimeType: 'audio/webm;codecs=opus' };
+             } else if (MediaRecorder.isTypeSupported('audio/webm')) {
+                 options = { mimeType: 'audio/webm' };
+             } else {
+                 options = { mimeType: 'audio/ogg;codecs=opus' };
+             }
+             mediaRecorder = new MediaRecorder(stream, options);
+
+             mediaRecorder.ondataavailable = event => {
+                 audioChunks.push(event.data);
+             };
+
+             mediaRecorder.onstop = async () => {
+                 // Visual reset
+                 micBtn.classList.remove("recording");
+                 micBtn.innerHTML = `
+                     <svg class="mic-icon" viewBox="0 0 24 24">
+                         <path d="M12 14c1.66 0 3-1.34 3-3V5c0-1.66-1.34-3-3-3S9 3.34 9 5v6c0 1.66 1.34 3 3 3z"/>
+                         <path d="M17 11c0 2.76-2.24 5-5 5s-5-2.24-5-5H5c0 3.53 2.61 6.43 6 6.92V21h2v-3.08c3.39-.49 6-3.39 6-6.92h-2z"/>
+                     </svg> Record`;
+                 descriptionArea.placeholder = "Processing audio...";
+
+                 // Prepare file
+                 const mimeType = mediaRecorder.mimeType || 'audio/webm';
+                 const audioBlob = new Blob(audioChunks, { type: mimeType });
+                 const formData = new FormData();
+                 formData.append("audio", audioBlob);
+
+                 const lang = document.getElementById('stt-language').value;
+                 formData.append("language", lang);
+
+                 try {
+                     const response = await fetch('/transcribe', {
+                         method: 'POST',
+                         body: formData
+                     });
+
+                     const data = await response.json();
+
+                     if (data.text) {
+                         // Append text if content exists, otherwise set it
+                         const currentText = descriptionArea.value;
+                         descriptionArea.value = currentText ? currentText + " " + data.text : data.text;
+                         descriptionArea.placeholder = "Type or use the microphone to speak...";
+                     } else if (data.error) {
+                         alert("Transcription failed: " + data.error);
+                         descriptionArea.placeholder = "Error in transcription.";
+                     }
+                 } catch (error) {
+                     console.error("API Error:", error);
+                     alert("Failed to connect to transcription server.");
+                     descriptionArea.placeholder = "Connection failed.";
+                 }
+
+                 // Stop all tracks to release mic
+                 stream.getTracks().forEach(track => track.stop());
+             };
+
+             mediaRecorder.start();
+             micBtn.classList.add("recording");
+             micBtn.innerHTML = "Listening... (Click to Stop)";
+             descriptionArea.placeholder = "Listening...";
+         }
+
+         // --- Existing Logic ---
+
+         function askQuestion() {
+             const subject = document.getElementById("subject").value;
+             const category = document.getElementById("category").value || selectedCategory;
+             const description = document.getElementById("description").value;
+
+             if (!subject || !description) {
+                 alert("Please fill out all required fields.");
+                 return;
+             }
+
+             // Basic prediction logic if category missing
+             if (!category) {
+                 predictionArea.innerHTML = '<p class="loading-message">Predicting categories...</p>';
+                 fetch('/predict_categories', {
+                     method: 'POST',
+                     headers: { 'Content-Type': 'application/json' },
+                     body: JSON.stringify({ subject, description })
+                 })
+                 .then(res => res.json())
+                 .then(data => {
+                     predictionArea.innerHTML = "";
+                     const predictedContainer = document.createElement("div");
+                     predictedContainer.className = "predicted-categories";
+
+                     if (data.predicted_categories) {
+                         data.predicted_categories.forEach(cat => {
+                             const div = document.createElement("div");
+                             div.textContent = cat;
+                             div.className = "category-option";
+                             div.onclick = () => selectCategory(div, cat);
+                             predictedContainer.appendChild(div);
+                         });
+                     }
+                     predictionArea.appendChild(predictedContainer);
+                 })
+                 .catch(err => {
+                     predictionArea.innerHTML = "<p class='loading-message'>Failed to predict categories.</p>";
+                     console.error(err);
+                 });
+                 return;
+             }
+
+             const responseContainer = document.getElementById("response-container");
+             const responseText = document.getElementById("response-text");
+             responseContainer.style.display = 'block';
+             responseText.innerHTML = '<p class="loading-message">Thinking...</p>';
+             document.getElementById("metrics-container").innerHTML = "";
+
+             fetch('/generate_answer', {
+                 method: 'POST',
+                 headers: { 'Content-Type': 'application/json' },
+                 body: JSON.stringify({ category, question: description })
+             })
+             .then(res => res.json())
+             .then(data => {
+                 if (data.error) {
+                     responseText.innerHTML = `<p style="color:red">Error: ${data.error}</p>`;
+                     return;
+                 }
+
+                 // Render the response as Markdown
+                 responseText.innerHTML = marked.parse(data.answer);
+
+                 // Display metrics
+                 const metricsContainer = document.getElementById("metrics-container");
+                 if (data.metrics) {
+                     metricsContainer.innerHTML = `
+                         <h4>Performance Metrics:</h4>
+                         <p><strong>Model:</strong> ${data.metrics.model}</p>
+                         <p><strong>Temperature:</strong> ${data.metrics.temperature}</p>
+                         <p><strong>Time to First Token (TTFT):</strong> ${data.metrics.ttft_seconds} seconds</p>
+                         <p><strong>Total Response Time (TTLT):</strong> ${data.metrics.ttlt_seconds} seconds</p>
+                         <p><strong>Speed:</strong> ${data.metrics.speed_tokens_per_second} tokens/second</p>
+                         <p><strong>Input Tokens:</strong> ${data.metrics.input_tokens}</p>
+                         <p><strong>Output Tokens:</strong> ${data.metrics.output_tokens}</p>
+                     `;
+                 } else {
+                     metricsContainer.innerHTML = '<p>No metrics available.</p>';
+                 }
+             })
+             .catch(err => {
+                 console.error(err);
+                 responseText.innerHTML = `<p style="color:red">Request failed.</p>`;
+             });
+         }
+
+         function selectCategory(element, category) {
+             document.querySelectorAll(".category-option").forEach(el => el.classList.remove("selected"));
+             element.classList.add("selected");
+             selectedCategory = category;
+         }
+     </script>
+ </body>
+ </html>
test_app.py ADDED
@@ -0,0 +1,32 @@
+ import pytest
+ from app import app, categories
+
+ @pytest.fixture
+ def client():
+     with app.test_client() as client:
+         yield client
+
+ def test_homepage(client):
+     response = client.get('/')
+     assert response.status_code == 200
+     assert b"Saayam AI Assistant" in response.data
+
+ def test_predict_categories(client):
+     response = client.post('/predict_categories', json={
+         "subject": "How to save money?",
+         "description": "I want to start budgeting my expenses."
+     })
+     assert response.status_code == 200
+     data = response.get_json()
+     assert "predicted_categories" in data
+     assert len(data["predicted_categories"]) > 0
+
+ @pytest.mark.parametrize("category", categories[:5])  # Use a few categories for demo
+ def test_generate_answer(client, category):
+     response = client.post('/generate_answer', json={
+         "category": category,
+         "question": "Tell me something about this category."
+     })
+     assert response.status_code == 200
+     data = response.get_json()
+     assert "answer" in data or "error" in data
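
The suite can be run with `pytest test_app.py`, or equivalently from Python. Note that importing `app` loads the classifier and the selected model client, and `test_generate_answer` calls the live model API, so the tests are slow and need network access:

```python
# Hypothetical runner script, equivalent to `pytest -v test_app.py`
import pytest

raise SystemExit(pytest.main(["-v", "test_app.py"]))
```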