Spaces:

iitmbs24f
/

Prj2

Sleeping

App Files Files Community

iitmbs24f commited on Nov 29, 2025

Commit

8d6b09c

verified ·

1 Parent(s): 23fc6bf

Upload 17 files

Browse files

Files changed (4) hide show

app/media_processor.py +5 -4
app/solver.py +159 -25
app/specialized_handlers.py +210 -0
requirements.txt +1 -0

app/media_processor.py CHANGED Viewed

@@ -20,7 +20,7 @@ class MediaProcessor:
     """Process audio, video, and image content for quizzes."""
     def __init__(self):
-        self.supported_audio_formats = ['.mp3', '.wav', '.ogg', '.m4a', '.flac', '.webm']
         self.supported_video_formats = ['.mp4', '.webm', '.ogg', '.mov', '.avi', '.mkv']
         self.supported_image_formats = ['.jpg', '.jpeg', '.png', '.gif', '.bmp', '.webp']
@@ -197,11 +197,12 @@ Provide a comprehensive description."""
         base_url = page_content.get('url', '')
         text = page_content.get('text', '') + ' ' + page_content.get('html', '')
-        # Find audio files
         audio_patterns = [
             r'<audio[^>]+src=["\']([^"\']+)["\']',
-            r'<source[^>]+src=["\']([^"\']+\.(?:mp3|wav|ogg|m4a|flac|webm))["\']',
-            r'(https?://[^\s<>"\'\)]+\.(?:mp3|wav|ogg|m4a|flac|webm))',
         ]
         for pattern in audio_patterns:

     """Process audio, video, and image content for quizzes."""
     def __init__(self):
+        self.supported_audio_formats = ['.mp3', '.wav', '.ogg', '.m4a', '.flac', '.webm', '.opus']
         self.supported_video_formats = ['.mp4', '.webm', '.ogg', '.mov', '.avi', '.mkv']
         self.supported_image_formats = ['.jpg', '.jpeg', '.png', '.gif', '.bmp', '.webp']
         base_url = page_content.get('url', '')
         text = page_content.get('text', '') + ' ' + page_content.get('html', '')
+        # Find audio files (including .opus)
         audio_patterns = [
             r'<audio[^>]+src=["\']([^"\']+)["\']',
+            r'<source[^>]+src=["\']([^"\']+\.(?:mp3|wav|ogg|m4a|flac|webm|opus))["\']',
+            r'(https?://[^\s<>"\'\)]+\.(?:mp3|wav|ogg|m4a|flac|webm|opus))',
+            r'(/[^\s<>"\'\)]+\.(?:mp3|wav|ogg|m4a|flac|webm|opus))',  # Relative paths
         ]
         for pattern in audio_patterns:

app/solver.py CHANGED Viewed

@@ -18,6 +18,10 @@ from app.llm import ask_gpt, parse_question_with_llm, solve_with_llm, initialize
 from app.utils import extract_submit_url, clean_text, extract_json_from_text, is_valid_url
 from app.media_processor import get_media_processor
 from app.calculations import get_calc_engine
 logger = logging.getLogger(__name__)
@@ -141,6 +145,42 @@ class QuizSolver:
                 submit_url, email, secret, url, answer
             )
             # Check if there's a next quiz
             if isinstance(response, dict) and 'url' in response:
                 next_url = response['url']
@@ -229,17 +269,23 @@ class QuizSolver:
         try:
             media_processor = get_media_processor()
             media_files = media_processor.find_media_in_page(page_content)
             if media_files['audio']:
                 logger.info(f"Found audio files: {media_files['audio']}")
                 for audio_url in media_files['audio']:
                     try:
                         remaining = self._check_time_remaining()
-                        if remaining >= 20.0:  # Need more time to process audio - only if we have plenty
                             transcription = await media_processor.process_audio_from_url(audio_url)
                             if transcription:
                                 # Use transcription to solve
                                 available_data['audio_transcription'] = transcription
                                 # Try to extract answer from transcription
                                 answer = self._extract_answer_from_transcription(transcription, question)
                                 if answer:
@@ -248,12 +294,45 @@ class QuizSolver:
                         logger.warning(f"Error processing audio {audio_url}: {e}")
                         continue  # Try next audio file
             if media_files['video']:
                 logger.info(f"Found video files: {media_files['video']}")
                 for video_url in media_files['video']:
                     try:
                         remaining = self._check_time_remaining()
-                        if remaining >= 25.0:  # Need more time to process video - only if we have plenty
                             video_info = await media_processor.process_video_from_url(video_url)
                             if video_info and 'analysis' in video_info:
                                 available_data['video_analysis'] = video_info['analysis']
@@ -264,23 +343,6 @@ class QuizSolver:
                     except Exception as e:
                         logger.warning(f"Error processing video {video_url}: {e}")
                         continue  # Try next video file
-            if media_files['images']:
-                logger.info(f"Found images: {len(media_files['images'])}")
-                for img_url in media_files['images'][:2]:  # Process first 2 images only (reduced from 3)
-                    try:
-                        remaining = self._check_time_remaining()
-                        if remaining >= 15.0:  # Need time to process image - only if we have enough
-                            ocr_text = await media_processor.process_image_from_url(img_url)
-                            if ocr_text:
-                                available_data['image_ocr'] = ocr_text
-                                # Try to extract answer from OCR text
-                                answer = self._extract_answer_from_text(ocr_text, question)
-                                if answer:
-                                    return answer
-                    except Exception as e:
-                        logger.warning(f"Error processing image {img_url}: {e}")
-                        continue  # Try next image
         except Exception as e:
             logger.warning(f"Error in media processing: {e}")
             # Continue with other strategies
@@ -294,10 +356,17 @@ class QuizSolver:
             return specific_answer
         # Strategy 4: Check if answer is already in the page
-        answer_in_page = self._find_answer_in_page(page_content, question)
-        if answer_in_page:
-            logger.info("Answer found in page content")
-            return answer_in_page
         # Strategy 5: Try mathematical calculations
         try:
@@ -311,6 +380,23 @@ class QuizSolver:
         # Strategy 6: Check for data files/links to download
         data_files = self._find_data_files(page_content)
         if data_files:
             logger.info(f"Found data files: {data_files}")
             processed_data = await self._process_data_files(data_files)
@@ -320,6 +406,37 @@ class QuizSolver:
                 if answer:
                     return answer
         # Strategy 7: Use LLM to solve (only if we have enough time)
         remaining = self._check_time_remaining()
         # Only use LLM if we have enough time AND haven't found answer yet
@@ -533,8 +650,25 @@ class QuizSolver:
                 return command
             # Look for command patterns in the page
-            # Pattern: "uv http get https://..." - need to capture full URL and optional header
-            # More specific pattern that captures the full command
             command_patterns = [
                 r'(uv\s+http\s+get\s+https?://[^\s<>"]+(?:\?[^\s<>"]+)?(?:\s+-H\s+"[^"]+")?)',  # Full URL with query params and header
                 r'(uv\s+http\s+get\s+https?://[^\s<>"]+)',  # Just URL

 from app.utils import extract_submit_url, clean_text, extract_json_from_text, is_valid_url
 from app.media_processor import get_media_processor
 from app.calculations import get_calc_engine
+from app.specialized_handlers import (
+    extract_image_color, convert_csv_to_json,
+    call_github_api, count_md_files_in_tree
+)
 logger = logging.getLogger(__name__)
                 submit_url, email, secret, url, answer
             )
+            # Check if answer was incorrect and we have a reason with the correct format
+            # This allows us to retry with the correct answer format
+            if isinstance(response, dict) and response.get('correct') == False:
+                reason = response.get('reason', '')
+                if reason:
+                    logger.info(f"Incorrect answer, reason: {reason}")
+                    # Try to extract correct format from reason and retry (only once)
+                    if 'command string' in reason.lower() and 'uv http get' in reason.lower():
+                        # Extract command from reason
+                        command_match = re.search(r'(uv\s+http\s+get\s+[^\n<>"]+(?:\s+-H\s+"[^"]+")?)', reason, re.IGNORECASE)
+                        if command_match:
+                            correct_command = command_match.group(1).strip()
+                            if email:
+                                correct_command = correct_command.replace('<your email>', email).replace('<email>', email)
+                            logger.info(f"Retrying with correct command: {correct_command[:100]}...")
+                            # Retry submission with correct command
+                            retry_response = await self._submit_answer(
+                                submit_url, email, secret, url, correct_command
+                            )
+                            if isinstance(retry_response, dict) and retry_response.get('correct'):
+                                response = retry_response
+                    elif 'git add' in reason.lower() and 'git commit' in reason.lower():
+                        # Extract git commands from reason
+                        need_match = re.search(r'[Nn]eed\s+(git\s+add\s+[^\s]+)\s+then\s+(git\s+commit\s+[^\n<>"]+)', reason, re.IGNORECASE)
+                        if need_match:
+                            cmd1 = need_match.group(1).strip()
+                            cmd2 = need_match.group(2).strip()
+                            correct_commands = f"{cmd1}\n{cmd2}"
+                            logger.info(f"Retrying with correct git commands: {correct_commands}")
+                            # Retry submission
+                            retry_response = await self._submit_answer(
+                                submit_url, email, secret, url, correct_commands
+                            )
+                            if isinstance(retry_response, dict) and retry_response.get('correct'):
+                                response = retry_response
             # Check if there's a next quiz
             if isinstance(response, dict) and 'url' in response:
                 next_url = response['url']
         try:
             media_processor = get_media_processor()
             media_files = media_processor.find_media_in_page(page_content)
+            base_url = page_content.get('url', '')
+            # Handle audio transcription (for passphrase quizzes)
             if media_files['audio']:
                 logger.info(f"Found audio files: {media_files['audio']}")
                 for audio_url in media_files['audio']:
                     try:
                         remaining = self._check_time_remaining()
+                        if remaining >= 20.0:  # Need more time to process audio
                             transcription = await media_processor.process_audio_from_url(audio_url)
                             if transcription:
                                 # Use transcription to solve
                                 available_data['audio_transcription'] = transcription
+                                # For passphrase quizzes, return the transcription directly
+                                if 'transcribe' in question.lower() or 'passphrase' in question.lower():
+                                    logger.info(f"Returning audio transcription as answer: {transcription[:100]}...")
+                                    return transcription
                                 # Try to extract answer from transcription
                                 answer = self._extract_answer_from_transcription(transcription, question)
                                 if answer:
                         logger.warning(f"Error processing audio {audio_url}: {e}")
                         continue  # Try next audio file
+            # Handle image color extraction (for heatmap quizzes)
+            if media_files['images']:
+                logger.info(f"Found images: {len(media_files['images'])}")
+                # Check if this is a color extraction question
+                if 'rgb color' in question.lower() or 'hex' in question.lower() or 'heatmap' in question.lower():
+                    for img_url in media_files['images']:
+                        try:
+                            remaining = self._check_time_remaining()
+                            if remaining >= 15.0:
+                                hex_color = await extract_image_color(img_url, base_url)
+                                if hex_color:
+                                    logger.info(f"Extracted color from image: {hex_color}")
+                                    return hex_color
+                        except Exception as e:
+                            logger.warning(f"Error extracting color from image {img_url}: {e}")
+                            continue
+                # Regular OCR processing
+                for img_url in media_files['images'][:2]:  # Process first 2 images only
+                    try:
+                        remaining = self._check_time_remaining()
+                        if remaining >= 15.0:
+                            ocr_text = await media_processor.process_image_from_url(img_url)
+                            if ocr_text:
+                                available_data['image_ocr'] = ocr_text
+                                # Try to extract answer from OCR text
+                                answer = self._extract_answer_from_text(ocr_text, question)
+                                if answer:
+                                    return answer
+                    except Exception as e:
+                        logger.warning(f"Error processing image {img_url}: {e}")
+                        continue  # Try next image
             if media_files['video']:
                 logger.info(f"Found video files: {media_files['video']}")
                 for video_url in media_files['video']:
                     try:
                         remaining = self._check_time_remaining()
+                        if remaining >= 25.0:  # Need more time to process video
                             video_info = await media_processor.process_video_from_url(video_url)
                             if video_info and 'analysis' in video_info:
                                 available_data['video_analysis'] = video_info['analysis']
                     except Exception as e:
                         logger.warning(f"Error processing video {video_url}: {e}")
                         continue  # Try next video file
         except Exception as e:
             logger.warning(f"Error in media processing: {e}")
             # Continue with other strategies
             return specific_answer
         # Strategy 4: Check if answer is already in the page
+        # BUT: Skip this if we need specific formats (commands, paths, etc.)
+        # to avoid returning generic text that overrides specific format extraction
+        needs_specific_format = any(keyword in question.lower() for keyword in [
+            'command string', 'craft the command', 'exact', 'git', 'shell command',
+            'transcribe', 'rgb color', 'hex', 'json array', 'github api'
+        ])
+        if not needs_specific_format:
+            answer_in_page = self._find_answer_in_page(page_content, question)
+            if answer_in_page:
+                logger.info("Answer found in page content")
+                return answer_in_page
         # Strategy 5: Try mathematical calculations
         try:
         # Strategy 6: Check for data files/links to download
         data_files = self._find_data_files(page_content)
+        base_url = page_content.get('url', '')
+        # Special handling for CSV to JSON conversion
+        if 'normalize to json' in question.lower() or 'json array' in question.lower():
+            for file_url in data_files:
+                if file_url.endswith('.csv'):
+                    try:
+                        remaining = self._check_time_remaining()
+                        if remaining >= 15.0:
+                            json_data = await convert_csv_to_json(file_url, base_url, normalize=True)
+                            if json_data:
+                                logger.info(f"Converted CSV to JSON: {len(json_data)} records")
+                                return json_data
+                    except Exception as e:
+                        logger.warning(f"Error converting CSV to JSON: {e}")
+                        continue
         if data_files:
             logger.info(f"Found data files: {data_files}")
             processed_data = await self._process_data_files(data_files)
                 if answer:
                     return answer
+        # Strategy 6.5: Handle GitHub API calls
+        if 'github api' in question.lower() or 'git/trees' in question.lower():
+            try:
+                # Extract API endpoint from question
+                # Pattern: "GET /repos/{owner}/{repo}/git/trees/{sha}?recursive=1"
+                api_pattern = r'(/repos/[^\s<>"\'\)]+/git/trees/[^\s<>"\'\)]+(?:\?[^\s<>"\'\)]+)?)'
+                match = re.search(api_pattern, question, re.IGNORECASE)
+                if match:
+                    endpoint = match.group(1)
+                    # Extract prefix if mentioned
+                    prefix_match = re.search(r'prefix[:\s]+([^\s<>"\'\)]+)', question, re.IGNORECASE)
+                    prefix = prefix_match.group(1) if prefix_match else ''
+                    remaining = self._check_time_remaining()
+                    if remaining >= 15.0:
+                        tree_data = await call_github_api(endpoint)
+                        if tree_data:
+                            count = count_md_files_in_tree(tree_data, prefix)
+                            # Add email length mod 2 offset if personalized
+                            if 'personalized' in question.lower() and 'email' in question.lower():
+                                offset = len(email) % 2
+                                result = count + offset
+                                logger.info(f"GitHub tree count: {count}, offset: {offset}, result: {result}")
+                                return result
+                            else:
+                                logger.info(f"GitHub tree count: {count}")
+                                return count
+            except Exception as e:
+                logger.warning(f"Error handling GitHub API: {e}")
+                # Continue with other strategies
         # Strategy 7: Use LLM to solve (only if we have enough time)
         remaining = self._check_time_remaining()
         # Only use LLM if we have enough time AND haven't found answer yet
                 return command
             # Look for command patterns in the page
+            # First, try to find the URL mentioned in the question
+            url_pattern = r'https?://[^\s<>"\'\)]+/project2/[^\s<>"\'\)]+'
+            url_match = re.search(url_pattern, combined, re.IGNORECASE)
+            if url_match:
+                base_url = url_match.group(0)
+                # Construct the full command
+                if 'uv.json' in base_url or '/uv' in base_url:
+                    # Add email parameter if personalized
+                    if email and '<your email>' not in base_url and 'email=' not in base_url:
+                        separator = '&' if '?' in base_url else '?'
+                        base_url = f"{base_url}{separator}email={email}"
+                    elif '<your email>' in base_url or 'email=' in base_url:
+                        base_url = base_url.replace('<your email>', email).replace('<email>', email)
+                    command = f'uv http get {base_url} -H "Accept: application/json"'
+                    logger.info(f"Constructed command from URL: {command[:100]}...")
+                    return command
+            # Fallback: try to find command patterns
             command_patterns = [
                 r'(uv\s+http\s+get\s+https?://[^\s<>"]+(?:\?[^\s<>"]+)?(?:\s+-H\s+"[^"]+")?)',  # Full URL with query params and header
                 r'(uv\s+http\s+get\s+https?://[^\s<>"]+)',  # Just URL

app/specialized_handlers.py ADDED Viewed

	@@ -0,0 +1,210 @@

+"""
+Specialized handlers for specific quiz types.
+"""
+import json
+import re
+import logging
+import requests
+import httpx
+from typing import Optional, Dict, Any, List
+from urllib.parse import urljoin, urlparse
+import io
+from collections import Counter
+try:
+    from PIL import Image
+    PIL_AVAILABLE = True
+except ImportError:
+    PIL_AVAILABLE = False
+    logger = logging.getLogger(__name__)
+    logger.warning("PIL/Pillow not available - image color extraction will be disabled")
+logger = logging.getLogger(__name__)
+async def extract_image_color(image_url: str, base_url: str = '') -> Optional[str]:
+    """
+    Extract the most frequent RGB color from an image and return as hex.
+    Args:
+        image_url: URL to image file
+        base_url: Base URL for relative paths
+    Returns:
+        Hex color string (e.g., "#rrggbb") or None
+    """
+    if not PIL_AVAILABLE:
+        logger.warning("PIL not available, cannot extract image colors")
+        return None
+    try:
+        # Make absolute URL if relative
+        if image_url.startswith('/') and base_url:
+            image_url = urljoin(base_url, image_url)
+        logger.info(f"Processing image for color extraction: {image_url}")
+        # Download image
+        response = requests.get(image_url, timeout=30)
+        response.raise_for_status()
+        # Open image with PIL
+        img = Image.open(io.BytesIO(response.content))
+        # Convert to RGB if needed
+        if img.mode != 'RGB':
+            img = img.convert('RGB')
+        # Get all pixel colors
+        pixels = list(img.getdata())
+        # Count color frequencies
+        color_counts = Counter(pixels)
+        # Get most frequent color
+        most_common = color_counts.most_common(1)[0][0]
+        # Convert to hex
+        hex_color = f"#{most_common[0]:02x}{most_common[1]:02x}{most_common[2]:02x}"
+        logger.info(f"Most frequent color: {hex_color}")
+        return hex_color
+    except Exception as e:
+        logger.error(f"Error extracting image color: {e}")
+        return None
+async def convert_csv_to_json(csv_url: str, base_url: str = '', normalize: bool = True) -> Optional[List[Dict[str, Any]]]:
+    """
+    Download CSV and convert to normalized JSON format.
+    Args:
+        csv_url: URL to CSV file
+        base_url: Base URL for relative paths
+        normalize: Whether to normalize keys (snake_case), dates (ISO-8601), etc.
+    Returns:
+        List of dictionaries (JSON array) or None
+    """
+    try:
+        import pandas as pd
+        from datetime import datetime
+        # Make absolute URL if relative
+        if csv_url.startswith('/') and base_url:
+            csv_url = urljoin(base_url, csv_url)
+        logger.info(f"Converting CSV to JSON: {csv_url}")
+        # Download and read CSV
+        response = requests.get(csv_url, timeout=30)
+        response.raise_for_status()
+        df = pd.read_csv(io.StringIO(response.text))
+        # Normalize if requested
+        if normalize:
+            # Convert column names to snake_case
+            df.columns = [col.strip().lower().replace(' ', '_') for col in df.columns]
+            # Normalize date columns to ISO-8601
+            for col in df.columns:
+                if 'date' in col.lower() or 'joined' in col.lower() or 'time' in col.lower():
+                    try:
+                        df[col] = pd.to_datetime(df[col]).dt.strftime('%Y-%m-%dT%H:%M:%S')
+                    except:
+                        pass  # Skip if not a date column
+            # Convert integer columns
+            for col in df.columns:
+                if 'id' in col.lower() or 'value' in col.lower():
+                    try:
+                        df[col] = pd.to_numeric(df[col], errors='ignore').astype('Int64', errors='ignore')
+                    except:
+                        pass
+        # Convert to list of dictionaries
+        result = df.to_dict('records')
+        # Convert NaN to None for JSON serialization
+        for record in result:
+            for key, value in record.items():
+                if pd.isna(value):
+                    record[key] = None
+                elif isinstance(value, (pd.Timestamp, pd.DatetimeTZDtype)):
+                    record[key] = value.isoformat()
+        logger.info(f"Converted CSV to JSON: {len(result)} records")
+        return result
+    except Exception as e:
+        logger.error(f"Error converting CSV to JSON: {e}")
+        import traceback
+        logger.debug(traceback.format_exc())
+        return None
+async def call_github_api(endpoint: str, token: Optional[str] = None) -> Optional[Dict[str, Any]]:
+    """
+    Call GitHub API endpoint.
+    Args:
+        endpoint: API endpoint (e.g., "/repos/owner/repo/git/trees/sha?recursive=1")
+        token: Optional GitHub token
+    Returns:
+        API response as dict or None
+    """
+    try:
+        base_url = "https://api.github.com"
+        url = base_url + endpoint if endpoint.startswith('/') else base_url + '/' + endpoint
+        headers = {
+            'Accept': 'application/vnd.github.v3+json',
+            'User-Agent': 'IITM-Quiz-Solver'
+        }
+        if token:
+            headers['Authorization'] = f'token {token}'
+        logger.info(f"Calling GitHub API: {url}")
+        async with httpx.AsyncClient(timeout=30) as client:
+            response = await client.get(url, headers=headers)
+            response.raise_for_status()
+            return response.json()
+    except Exception as e:
+        logger.error(f"Error calling GitHub API: {e}")
+        return None
+def count_md_files_in_tree(tree_data: Dict[str, Any], prefix: str = '') -> int:
+    """
+    Count .md files in GitHub tree response under given prefix.
+    Args:
+        tree_data: GitHub API tree response
+        prefix: Path prefix to filter by
+    Returns:
+        Count of .md files
+    """
+    try:
+        if 'tree' not in tree_data:
+            return 0
+        count = 0
+        for item in tree_data['tree']:
+            path = item.get('path', '')
+            if path.startswith(prefix) and path.endswith('.md'):
+                count += 1
+        logger.info(f"Found {count} .md files under prefix '{prefix}'")
+        return count
+    except Exception as e:
+        logger.error(f"Error counting .md files: {e}")
+        return 0

requirements.txt CHANGED Viewed

@@ -12,4 +12,5 @@ pydantic==2.5.0
 lxml==4.9.3
 html5lib==1.1
 python-dotenv==1.0.0

 lxml==4.9.3
 html5lib==1.1
 python-dotenv==1.0.0
+Pillow==10.1.0