Spaces:

Yusufarsh
/

ReproAgent

Runtime error

File size: 6,863 Bytes

80f8512

import os
import json
import google.generativeai as genai
from dotenv import load_dotenv

load_dotenv()

def get_gemini_client():
    api_key = os.getenv("GEMINI_API_KEY")
    if not api_key:
        raise ValueError("GEMINI_API_KEY not found in environment variables")
    genai.configure(api_key=api_key)
    # Note: User specified gemini-2.5-flash, but we'll fallback to 1.5-flash if needed
    try:
        return genai.GenerativeModel('gemini-2.5-flash')
    except:
        return genai.GenerativeModel('gemini-pro')

def generate_summary_and_ppt_content(text: str):
    """

    Generates a summary and PPT structure from research paper text.

    """
    model = get_gemini_client()
    
    prompt = f"""

    Analyze the research paper and provide two things:

    1. A summary in a clean, structured format.

    2. A structured plan for an impressive PowerPoint presentation.



    STRICT FORMATTING RULES FOR THE SUMMARY:

    - Use clear section headings like: 1. Core Idea, 2. Background, etc.

    - Do NOT use emojis.

    - Do NOT use excessive bold formatting inside paragraphs.

    - Only bold the section titles.

    - Use bullet points (•) instead of long paragraphs.

    - Keep sentences short and clear.

    - Avoid decorative or marketing-style language.

    - Keep it concise but informative.

    - Do not use * at all.



    SUMMARY STRUCTURE:

    1. Core Idea

    2. Background / Problem

    3. Key Observation

    4. Method (How it works)

    5. Results

    6. Contributions

    7. Limitations (if any)



    Format your response as a valid JSON object. Ensure all strings (especially the 'description') are properly escaped for JSON (e.g., use \\n for newlines).



    JSON structure:

    {{

        "description": "The summary following the formatting rules above",

        "ppt_slides": [

            {{

                "title": "Slide Title",

                "content": ["Key point 1", "Key point 2", ...]

            }}

        ]

    }}



    Research Paper Text:

    {text[:30000]}

    """


    response = model.generate_content(prompt)
    
    try:
        # Clean the response to ensure it's valid JSON
        content = response.text.strip()
        if content.startswith("```json"):
            content = content[7:-3].strip()
        elif content.startswith("```"):
            content = content[3:-3].strip()
        
        # Use strict=False to be more lenient with control characters
        return json.loads(content, strict=False)
    except Exception as e:
        print(f"Error parsing LLM response: {e}")
        return {
            "description": "Error generating description. Please try again.",
            "ppt_slides": []
        }

def analyze_installation_error(error_log: str, repo_structure: str):
    """

    Uses AI to analyze an installation error and suggest a fix.

    """
    model = get_gemini_client()
    
    prompt = f"""

    You are an expert DevOps and ML Engineer. A Python environment installation failed with the following error:

    

    ERROR LOG:

    {error_log[-2000:]}

    

    REPOSITORY STRUCTURE:

    {repo_structure}

    

    Based on the error, provide a solution to fix the installation. 

    Format your response as a JSON object:

    {{

        "diagnosis": "Short explanation of what went wrong",

        "action": "install_package" | "edit_requirements" | "change_python_version",

        "command": "The exact command to run to fix it (if any)",

        "file_to_edit": "path/to/file (if any)",

        "new_content": "New content for the file (if any)"

    }}

    """
    
    response = model.generate_content(prompt)
    try:
        content = response.text.strip()
        if content.startswith("```json"):
            content = content[7:-3].strip()
        elif content.startswith("```"):
            content = content[3:-3].strip()
        return json.loads(content, strict=False)
    except:
        return None

def extract_execution_instructions(repo_structure: str, readme_text: str):
    """

    Asks AI to figure out how to run the evaluation/test script.

    """
    model = get_gemini_client()
    prompt = f"""

    Based on the repository structure and README, what is the exact command to run the evaluation or test script to verify the results?

    

    STRUCTURE:

    {repo_structure}

    

    README SNIPPET:

    {readme_text[:5000]}

    

    Return a JSON object:

    {{

        "command": "python eval.py ...",

        "explanation": "Why this command is selected"

    }}

    """
    response = model.generate_content(prompt)
    try:
        content = response.text.strip()
        if content.startswith("```json"):
            content = content[7:-3].strip()
        elif content.startswith("```"):
            content = content[3:-3].strip()
        return json.loads(content, strict=False)
    except:
        return {{"command": "python main.py", "explanation": "Fallback to main.py"}}

def extract_claimed_metrics(paper_text: str):
    """

    Extracts the main results reported in the paper.

    """
    model = get_gemini_client()
    prompt = f"""

    Extract the primary performance metrics (accuracy, F1, FID, etc.) reported in the following paper text. 

    Focus on the main results table.

    

    TEXT:

    {paper_text[:20000]}

    

    Return a JSON object:

    {{

        "metrics": [

            {{"name": "Accuracy", "value": "94.2%", "context": "ImageNet validation"}},

            ...

        ]

    }}

    """
    response = model.generate_content(prompt)
    try:
        content = response.text.strip()
        if content.startswith("```json"):
            content = content[7:-3].strip()
        elif content.startswith("```"):
            content = content[3:-3].strip()
        return json.loads(content, strict=False)
    except:
        return {{"metrics": []}}

def extract_metrics_from_logs(logs: str):
    """

    Parses execution logs to find resulting metrics.

    """
    model = get_gemini_client()
    prompt = f"""

    The following is the output log of a research paper's evaluation script. 

    Identify and extract the final performance metrics achieved.

    

    LOGS:

    {logs[-5000:]}

    

    Return a JSON object:

    {{

        "metrics": [

            {{"name": "Accuracy", "value": "93.8%"}},

            ...

        ]

    }}

    """
    response = model.generate_content(prompt)
    try:
        content = response.text.strip()
        if content.startswith("```json"):
            content = content[7:-3].strip()
        elif content.startswith("```"):
            content = content[3:-3].strip()
        return json.loads(content, strict=False)
    except:
        return {{"metrics": []}}