hamxaameer committed on
Commit
4521d33
·
1 Parent(s): 9bb5531

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +209 -689
app.py CHANGED
@@ -1,726 +1,246 @@
1
  import gradio as gr
2
- import pickle
3
  import torch
4
- import numpy as np
5
- from nltk.translate.bleu_score import sentence_bleu, SmoothingFunction
6
- from nltk.tokenize import word_tokenize
7
- import nltk
8
- import time
9
- import os
10
-
11
- # Download required NLTK data
12
- try:
13
- nltk.download('punkt', quiet=True)
14
- nltk.download('punkt_tab', quiet=True)
15
- except:
16
- pass
17
-
18
- # Global variables to store loaded model
19
- loaded_model = None
20
- loaded_tokenizer = None
21
- loaded_config = None
22
- generation_history = []
23
-
24
- # Auto-load model on startup
25
- def initialize_model():
26
- """Initialize model automatically on app startup"""
27
- return load_model_from_pickle("best_model.pkl")
28
-
29
- def load_model_from_pickle(pickle_path="best_model.pkl"):
30
- """Load model from pickle file (auto-loads on startup)"""
31
- global loaded_model, loaded_tokenizer, loaded_config
32
-
33
- try:
34
- # Check if file exists
35
- if not os.path.exists(pickle_path):
36
- return f"❌ Model file not found: {pickle_path}\n\nPlease ensure best_model.pkl is uploaded to the HuggingFace Space."
37
-
38
- # ULTIMATE FIX: Check if CPU version exists, if not convert it
39
- cpu_pickle_path = pickle_path.replace('.pkl', '_cpu.pkl')
40
-
41
- if not os.path.exists(cpu_pickle_path):
42
- # Need to convert CUDA pickle to CPU pickle
43
- try:
44
- # Use torch.load with custom map_location that captures and remaps ALL devices
45
- def smart_map_location(storage, location):
46
- # This function is called for EACH tensor storage during unpickling
47
- # It runs BEFORE the "CUDA device check", allowing us to remap
48
- return storage.cpu()
49
-
50
- # Load with our smart mapper
51
- model_package = torch.load(pickle_path, map_location=smart_map_location)
52
-
53
- # Now save it as a CPU-only pickle for future loads
54
- torch.save(model_package, cpu_pickle_path)
55
-
56
- return f"✅ Converted CUDA model to CPU! Loading from converted version...\n\nPlease wait, loading model..."
57
-
58
- except Exception as convert_error:
59
- # Conversion failed, try direct load with aggressive remapping
60
- import io
61
- import pickle as pkl
62
-
63
- try:
64
- # Read the pickle bytes
65
- with open(pickle_path, 'rb') as f:
66
- buffer = io.BytesIO(f.read())
67
-
68
- # Create custom unpickler with aggressive CPU forcing
69
- class AggressiveCPUUnpickler(pkl.Unpickler):
70
- def find_class(self, module, name):
71
- # Remap any CUDA storage to CPU storage
72
- if 'cuda' in name.lower():
73
- name = name.replace('cuda', '').replace('Cuda', '')
74
- return super().find_class(module, name)
75
-
76
- def load_build(self):
77
- # Override to catch tensor builds
78
- stack = self.stack
79
- state = stack.pop()
80
- inst = stack[-1]
81
-
82
- # If this is a tensor, force to CPU
83
- if hasattr(inst, 'to'):
84
- try:
85
- inst = inst.cpu()
86
- stack[-1] = inst
87
- except:
88
- pass
89
-
90
- if hasattr(inst, '__setstate__'):
91
- inst.__setstate__(state)
92
- else:
93
- for k, v in state.items():
94
- setattr(inst, k, v)
95
-
96
- def persistent_load(self, pid):
97
- # Intercept ALL storage loads
98
- if isinstance(pid, tuple) and len(pid) >= 5:
99
- # Standard torch storage format
100
- tag, storage_type, key, location, size = pid[0], pid[1], pid[2], pid[3], pid[4]
101
- if tag == 'storage':
102
- # Force location to CPU
103
- return (tag, storage_type, key, 'cpu', size)
104
- return pid
105
-
106
- # Try to load with aggressive unpickler
107
- unpickler = AggressiveCPUUnpickler(buffer)
108
- model_package = unpickler.load()
109
-
110
- # Save as CPU version for next time
111
- torch.save(model_package, cpu_pickle_path)
112
-
113
- except Exception as aggressive_error:
114
- return (f"❌ Failed to convert CUDA pickle to CPU.\n\n"
115
- f"Convert error: {str(convert_error)[:100]}\n"
116
- f"Aggressive error: {str(aggressive_error)[:100]}\n\n"
117
- f"Please re-save your model on a CPU machine:\n"
118
- f"```python\n"
119
- f"import torch\n"
120
- f"# Load your model\n"
121
- f"model = model.cpu() # Move to CPU\n"
122
- f"torch.save({{'model': model, 'tokenizer': tokenizer, 'config': config}}, 'best_model.pkl')\n"
123
- f"```")
124
- else:
125
- # CPU version exists, load it directly
126
- model_package = torch.load(cpu_pickle_path, map_location='cpu')
127
-
128
- # Success! Model loaded with one of the strategies above
129
- # Handle a few common package shapes.
130
- if isinstance(model_package, dict):
131
- loaded_model = model_package.get('model', None)
132
- loaded_tokenizer = model_package.get('tokenizer', None)
133
- loaded_config = model_package.get('config', {}) or {}
134
- else:
135
- # Unknown package format: assume the object itself is the model
136
- loaded_model = model_package
137
- loaded_tokenizer = None
138
- loaded_config = {}
139
-
140
- # If user saved a state_dict instead of a model object, provide guidance
141
- if isinstance(loaded_model, dict) and 'state_dict' in loaded_model:
142
- # the file contains something like {'state_dict': ...}
143
- return ("❌ The pickle appears to contain a state_dict rather than a full model object. "
144
- "This app expects a pickled model object (model instance).\n"
145
- "If you only have a state_dict, re-create the model architecture and load the state_dict before pickling, "
146
- "or provide a pickled model object saved with torch.save(model, path).")
147
-
148
- if loaded_model is None:
149
- return ("❌ No model object found inside the pickle. Please ensure the pickle contains a dict with keys "
150
- "'model', 'tokenizer', and 'config' (or the model object itself).")
151
-
152
- # Set model to evaluation mode and move to appropriate device
153
- try:
154
- loaded_model.eval()
155
- device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
156
- loaded_model = loaded_model.to(device)
157
- except Exception as e:
158
- return (f"❌ Error preparing model for inference: {str(e)}\n\n"
159
- "This can happen if the saved object is not a proper torch.nn.Module or if tensors couldn't be mapped to the current device.")
160
-
161
- config_info = f"""✅ Model loaded successfully!
162
-
163
- 📊 Model Configuration:
164
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
165
- • Base Model: {loaded_config.get('model_name', 'GPT-2')}
166
- • Training Epochs: {loaded_config.get('num_epochs', 'N/A')}
167
- • Training Samples: {loaded_config.get('training_samples', 'N/A'):,}
168
- • Validation Samples: {loaded_config.get('validation_samples', 'N/A'):,}
169
- • BLEU Score: {loaded_config.get('bleu_score', 0):.4f}
170
- • Perplexity: {loaded_config.get('perplexity', 0):.2f}
171
- • Final Loss: {loaded_config.get('final_loss', 0):.4f}
172
- • Device: {device}
173
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
174
-
175
- 🚀 Model is ready to generate code!
176
- """
177
-
178
- return config_info
179
-
180
- except Exception as e:
181
- # Final catch-all for any unexpected errors
182
- err = str(e)
183
- return f"❌ Unexpected error loading model: {err}\n\nPlease ensure best_model.pkl is properly uploaded and compatible with this environment."
184
-
185
- def calculate_bleu_score(reference, hypothesis):
186
- """Calculate BLEU score between reference and generated code"""
187
- try:
188
- # Tokenize
189
- ref_tokens = word_tokenize(reference.lower())
190
- hyp_tokens = word_tokenize(hypothesis.lower())
191
-
192
- # Calculate BLEU with smoothing
193
- smooth = SmoothingFunction()
194
- bleu_1 = sentence_bleu([ref_tokens], hyp_tokens, weights=(1, 0, 0, 0), smoothing_function=smooth.method1)
195
- bleu_2 = sentence_bleu([ref_tokens], hyp_tokens, weights=(0.5, 0.5, 0, 0), smoothing_function=smooth.method1)
196
- bleu_3 = sentence_bleu([ref_tokens], hyp_tokens, weights=(0.33, 0.33, 0.33, 0), smoothing_function=smooth.method1)
197
- bleu_4 = sentence_bleu([ref_tokens], hyp_tokens, weights=(0.25, 0.25, 0.25, 0.25), smoothing_function=smooth.method1)
198
-
199
- return bleu_1, bleu_2, bleu_3, bleu_4
200
- except Exception as e:
201
- return 0.0, 0.0, 0.0, 0.0
202
 
203
- def calculate_code_metrics(reference, generated):
204
- """Calculate various code similarity metrics"""
205
- try:
206
- # Length ratio
207
- len_ratio = len(generated) / max(len(reference), 1)
208
-
209
- # Word overlap
210
- ref_words = set(reference.lower().split())
211
- gen_words = set(generated.lower().split())
212
-
213
- if len(ref_words) > 0:
214
- precision = len(ref_words.intersection(gen_words)) / len(gen_words) if len(gen_words) > 0 else 0
215
- recall = len(ref_words.intersection(gen_words)) / len(ref_words)
216
- f1 = 2 * (precision * recall) / (precision + recall) if (precision + recall) > 0 else 0
217
- else:
218
- precision = recall = f1 = 0
219
-
220
- # Character-level similarity
221
- char_overlap = sum(1 for c in generated if c in reference) / max(len(generated), 1)
222
-
223
- return {
224
- 'length_ratio': len_ratio,
225
- 'precision': precision,
226
- 'recall': recall,
227
- 'f1_score': f1,
228
- 'char_overlap': char_overlap
229
- }
230
- except Exception as e:
231
- return {
232
- 'length_ratio': 0,
233
- 'precision': 0,
234
- 'recall': 0,
235
- 'f1_score': 0,
236
- 'char_overlap': 0
237
- }
238
 
239
- def generate_code_from_pseudo(pseudo_code, max_length, temperature, top_k, top_p, num_sequences, reference_code):
240
- """Generate code from pseudo-code using loaded model"""
241
- global loaded_model, loaded_tokenizer, generation_history
242
-
243
- if loaded_model is None or loaded_tokenizer is None:
244
- return "❌ Please upload and load a model first!", "", "", ""
245
-
246
- if not pseudo_code.strip():
247
- return "❌ Please enter pseudo-code description!", "", "", ""
248
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
249
  try:
250
- start_time = time.time()
 
251
 
252
- # Format input
253
- prompt = f"<PSEUDO> {pseudo_code.strip()} <SEP> <CODE>"
254
 
255
- # Tokenize
256
- device = next(loaded_model.parameters()).device
257
- inputs = loaded_tokenizer(prompt, return_tensors='pt').to(device)
258
 
259
- # Generate (ensure type safety for parameters)
 
260
  with torch.no_grad():
261
- outputs = loaded_model.generate(
262
  **inputs,
263
- max_length=int(max_length),
264
- temperature=float(temperature),
265
- top_k=int(top_k),
266
- top_p=float(top_p),
267
  do_sample=True,
268
- num_return_sequences=int(num_sequences),
269
- pad_token_id=loaded_tokenizer.pad_token_id,
270
- eos_token_id=loaded_tokenizer.eos_token_id,
271
  )
272
 
273
- generation_time = time.time() - start_time
274
-
275
- # Decode all sequences
276
- generated_codes = []
277
- for output in outputs:
278
- generated = loaded_tokenizer.decode(output, skip_special_tokens=False)
279
-
280
- # Extract code part
281
- if '<CODE>' in generated:
282
- code = generated.split('<CODE>')[-1].strip()
283
- # Remove special tokens
284
- code = code.replace('<PAD>', '').replace('<SEP>', '').strip()
285
- else:
286
- code = generated
287
-
288
- generated_codes.append(code)
289
-
290
- # Use the first generated code as primary output
291
- primary_code = generated_codes[0]
292
 
293
- # Calculate metrics if reference code is provided
294
- metrics_output = ""
295
- bleu_output = ""
296
-
297
- if reference_code and reference_code.strip():
298
- # Calculate BLEU scores
299
- bleu_1, bleu_2, bleu_3, bleu_4 = calculate_bleu_score(reference_code, primary_code)
300
-
301
- bleu_output = f"""📊 BLEU Scores:
302
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
303
- • BLEU-1 (Unigram): {bleu_1:.4f} ({bleu_1*100:.2f}%)
304
- • BLEU-2 (Bigram): {bleu_2:.4f} ({bleu_2*100:.2f}%)
305
- • BLEU-3 (Trigram): {bleu_3:.4f} ({bleu_3*100:.2f}%)
306
- • BLEU-4 (4-gram): {bleu_4:.4f} ({bleu_4*100:.2f}%)
307
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
308
-
309
- 💡 Interpretation:
310
- • BLEU > 0.4: Excellent match
311
- • BLEU 0.3-0.4: Good match
312
- • BLEU 0.2-0.3: Fair match
313
- • BLEU < 0.2: Poor match
314
- """
315
-
316
- # Calculate additional metrics
317
- code_metrics = calculate_code_metrics(reference_code, primary_code)
318
-
319
- metrics_output = f"""📈 Additional Metrics:
320
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
321
- • Length Ratio: {code_metrics['length_ratio']:.3f}
322
- • Precision: {code_metrics['precision']:.4f} ({code_metrics['precision']*100:.2f}%)
323
- • Recall: {code_metrics['recall']:.4f} ({code_metrics['recall']*100:.2f}%)
324
- • F1-Score: {code_metrics['f1_score']:.4f} ({code_metrics['f1_score']*100:.2f}%)
325
- • Character Overlap: {code_metrics['char_overlap']:.4f} ({code_metrics['char_overlap']*100:.2f}%)
326
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
327
-
328
- ⏱️ Generation Time: {generation_time:.2f}s
329
- 📝 Sequences Generated: {num_sequences}
330
- 🔢 Output Length: {len(primary_code)} characters
331
- ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
332
- """
333
  else:
334
- metrics_output = f"""⏱️ Generation Time: {generation_time:.2f}s
335
- 📝 Sequences Generated: {num_sequences}
336
- 🔢 Output Length: {len(primary_code)} characters
337
-
338
- 💡 Tip: Provide reference code to see BLEU scores and similarity metrics!
339
- """
340
-
341
- # Format alternative sequences
342
- alternatives = ""
343
- if num_sequences > 1:
344
- alternatives = "🔄 Alternative Generations:\n" + "━"*50 + "\n\n"
345
- for i, code in enumerate(generated_codes[1:], 2):
346
- alternatives += f"Variation {i}:\n```python\n{code}\n```\n\n"
347
-
348
- # Add to history
349
- generation_history.append({
350
- 'pseudo': pseudo_code,
351
- 'generated': primary_code,
352
- 'bleu_4': bleu_4 if reference_code else None,
353
- 'time': generation_time
354
- })
355
-
356
- return primary_code, metrics_output, bleu_output, alternatives
357
 
358
- except Exception as e:
359
- return f"❌ Error generating code: {str(e)}", "", "", ""
360
-
361
- def show_examples(example_name):
362
- """Load example pseudo-code"""
363
- examples = {
364
- "Basic Loop": "create a list of numbers from 1 to 10",
365
- "Function Definition": "define a function to calculate the sum of two numbers",
366
- "List Iteration": "iterate through a list and print each element",
367
- "Conditional Check": "check if a number is even or odd",
368
- "Sorting": "sort a list in descending order",
369
- "Maximum Element": "create a function to find maximum element in array",
370
- "Binary Search": "implement binary search algorithm",
371
- "Factorial": "create a recursive function to calculate factorial",
372
- "Palindrome": "check if a string is palindrome",
373
- "Fibonacci": "generate fibonacci sequence up to n terms"
374
- }
375
- return examples.get(example_name, "")
376
-
377
- def clear_all():
378
- """Clear all inputs and outputs"""
379
- return "", "", "", "", "", 150, 0.7, 50, 0.95, 1
380
-
381
- def show_history():
382
- """Display generation history"""
383
- if not generation_history:
384
- return "No generation history yet. Start generating code!"
385
-
386
- history_text = "📜 Generation History:\n" + "="*60 + "\n\n"
387
 
388
- for i, entry in enumerate(reversed(generation_history[-10:]), 1): # Show last 10
389
- history_text += f"{i}. Pseudo: {entry['pseudo'][:60]}...\n"
390
- history_text += f" Time: {entry['time']:.2f}s"
391
- if entry['bleu_4'] is not None:
392
- history_text += f" | BLEU-4: {entry['bleu_4']:.4f}"
393
- history_text += f"\n Code: {entry['generated'][:80]}...\n\n"
394
-
395
- return history_text
396
-
397
- # Create Gradio interface with custom CSS
398
- custom_css = """
399
- .gradio-container {
400
- font-family: 'Arial', sans-serif;
401
- }
402
- .output-code {
403
- font-family: 'Courier New', monospace;
404
- font-size: 14px;
405
- }
406
- .metrics-box {
407
- background-color: #f0f8ff;
408
- border-radius: 8px;
409
- padding: 10px;
410
- }
411
- """
412
 
413
- with gr.Blocks(title="🚀 GPT-2 Pseudo-Code to Code Generator", theme=gr.themes.Soft(), css=custom_css) as demo:
414
-
415
- gr.Markdown("""
416
- # 🚀 GPT-2 Pseudo-Code to Python Code Generator
417
-
418
- **Transform natural language descriptions into executable Python code using fine-tuned GPT-2!**
419
 
420
- This model is trained on the SPOC (Search-based Pseudo-code to Code) dataset and can generate Python code from pseudo-code descriptions.
421
- """)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
422
 
423
- with gr.Tabs():
424
- # Tab 1: Code Generation
425
- with gr.Tab("💻 Code Generation"):
426
- with gr.Row():
427
- with gr.Column(scale=1):
428
- gr.Markdown("### � Model Status")
429
- model_status = gr.Textbox(
430
- label="Model Information",
431
- lines=15,
432
- interactive=False,
433
- value=initialize_model() # Auto-load on startup
434
- )
435
 
436
- gr.Markdown("---")
 
 
 
 
 
437
 
438
  with gr.Row():
439
- with gr.Column(scale=1):
440
- gr.Markdown("### ✍️ Enter Pseudo-Code")
441
-
442
- # Example selector
443
- with gr.Row():
444
- example_dropdown = gr.Dropdown(
445
- choices=["Basic Loop", "Function Definition", "List Iteration",
446
- "Conditional Check", "Sorting", "Maximum Element",
447
- "Binary Search", "Factorial", "Palindrome", "Fibonacci"],
448
- label="📚 Load Example",
449
- value=None
450
- )
451
-
452
- pseudo_input = gr.Textbox(
453
- label="Pseudo-Code Description",
454
- placeholder="Example: create a function to calculate factorial of a number",
455
- lines=4
456
- )
457
-
458
- reference_code = gr.Textbox(
459
- label="Reference Code (Optional - for BLEU score calculation)",
460
- placeholder="Paste reference code here to calculate BLEU scores...",
461
- lines=4
462
- )
463
-
464
- gr.Markdown("### ⚙️ Generation Parameters")
465
- with gr.Row():
466
- max_length = gr.Slider(
467
- minimum=50,
468
- maximum=500,
469
- value=150,
470
- step=10,
471
- label="Max Length",
472
- info="Maximum tokens to generate"
473
- )
474
- temperature = gr.Slider(
475
- minimum=0.1,
476
- maximum=1.5,
477
- value=0.7,
478
- step=0.1,
479
- label="Temperature",
480
- info="Higher = more creative"
481
- )
482
-
483
- with gr.Row():
484
- top_k = gr.Slider(
485
- minimum=10,
486
- maximum=100,
487
- value=50,
488
- step=5,
489
- label="Top-K",
490
- info="Vocabulary filtering"
491
- )
492
- top_p = gr.Slider(
493
- minimum=0.5,
494
- maximum=1.0,
495
- value=0.95,
496
- step=0.05,
497
- label="Top-P",
498
- info="Nucleus sampling"
499
- )
500
-
501
- num_sequences = gr.Slider(
502
- minimum=1,
503
- maximum=5,
504
- value=1,
505
- step=1,
506
- label="Number of Variations",
507
- info="Generate multiple versions"
508
- )
509
-
510
- with gr.Row():
511
- generate_btn = gr.Button("✨ Generate Code", variant="primary", size="lg")
512
- clear_btn = gr.Button("🗑️ Clear All", variant="secondary")
513
 
514
- with gr.Column(scale=1):
515
- gr.Markdown("### 💻 Generated Python Code")
516
- code_output = gr.Code(
517
- label="Generated Code",
518
- language="python",
519
- lines=12,
520
- elem_classes="output-code"
521
- )
522
-
523
- with gr.Row():
524
- with gr.Column():
525
- metrics_output = gr.Textbox(
526
- label="📊 Performance Metrics",
527
- lines=8,
528
- interactive=False,
529
- elem_classes="metrics-box"
530
- )
531
- with gr.Column():
532
- bleu_output = gr.Textbox(
533
- label="🎯 BLEU Scores",
534
- lines=8,
535
- interactive=False,
536
- elem_classes="metrics-box"
537
- )
538
-
539
- alternatives_output = gr.Markdown(
540
- label="🔄 Alternative Generations"
541
- )
542
-
543
- # Tab 2: Information & Guide
544
- with gr.Tab("📖 Guide & Examples"):
545
- gr.Markdown("""
546
- ## 📚 How to Use
547
-
548
- ### 1️⃣ Load Your Model
549
- - Upload the `best_model.pkl` file (trained GPT-2 model)
550
- - Click "Load Model" and wait for confirmation
551
- - You'll see model configuration and training metrics
552
-
553
- ### 2️⃣ Generate Code
554
- - **Quick Start**: Select an example from the dropdown
555
- - **Custom Input**: Type your own pseudo-code description
556
- - **Optional**: Add reference code to calculate BLEU scores
557
- - Adjust generation parameters for different outputs
558
- - Click "Generate Code"
559
-
560
- ### 3️⃣ Understand the Metrics
561
-
562
- #### 🎯 BLEU Score (Bilingual Evaluation Understudy)
563
- - Measures similarity between generated and reference code
564
- - **BLEU-1**: Word-level similarity (unigrams)
565
- - **BLEU-2**: 2-word phrase similarity (bigrams)
566
- - **BLEU-3**: 3-word phrase similarity (trigrams)
567
- - **BLEU-4**: 4-word phrase similarity (most comprehensive)
568
-
569
- **Score Interpretation:**
570
- - 🟢 **> 0.4**: Excellent match - Generated code is very similar to reference
571
- - 🟡 **0.3-0.4**: Good match - Code captures most key elements
572
- - 🟠 **0.2-0.3**: Fair match - Some similarity exists
573
- - 🔴 **< 0.2**: Poor match - Significant differences
574
-
575
- #### 📈 Additional Metrics
576
- - **Precision**: How many generated words appear in reference
577
- - **Recall**: How many reference words appear in generated code
578
- - **F1-Score**: Harmonic mean of precision and recall
579
- - **Length Ratio**: Generated vs reference code length
580
- - **Character Overlap**: Character-level similarity
581
-
582
- ### 🎛️ Generation Parameters
583
 
584
- | Parameter | Low Value | High Value | Use Case |
585
- |-----------|-----------|------------|----------|
586
- | **Temperature** | 0.1-0.3 | 0.8-1.2 | Low: Deterministic, focused<br>High: Creative, diverse |
587
- | **Top-K** | 10-30 | 60-100 | Low: Conservative choices<br>High: More variety |
588
- | **Top-P** | 0.5-0.8 | 0.9-1.0 | Low: Safe predictions<br>High: Exploratory |
589
- | **Max Length** | 50-100 | 200-500 | Short: Simple code<br>Long: Complex implementations |
590
 
591
- ---
592
-
593
- ## 💡 Example Pseudo-Code Prompts
594
-
595
- ### Basic Operations
596
- ```
597
- create a list of numbers from 1 to 10
598
- define a function to calculate the sum of two numbers
599
- iterate through a list and print each element
600
- ```
601
-
602
- ### Conditionals & Logic
603
- ```
604
- check if a number is even or odd
605
- find the maximum of three numbers
606
- validate if a string is empty
607
- ```
608
-
609
- ### Data Structures
610
- ```
611
- sort a list in descending order
612
- remove duplicates from a list
613
- merge two dictionaries
614
- ```
615
-
616
- ### Algorithms
617
- ```
618
- implement binary search algorithm
619
- create a recursive function to calculate factorial
620
- generate fibonacci sequence up to n terms
621
- check if a string is palindrome
622
- ```
623
-
624
- ### Advanced
625
- ```
626
- create a class to represent a student with name and grades
627
- implement a function to read CSV file and return dataframe
628
- create a decorator to measure function execution time
629
- ```
630
-
631
- ---
632
-
633
- ## 🎓 About the Model
634
-
635
- This model is fine-tuned on the **SPOC (Search-based Pseudo-code to Code)** dataset:
636
- - 📄 Paper: [SPOC: Search-based Pseudo-code to Code](https://arxiv.org/pdf/1906.04908)
637
- - 🏛️ Source: Stanford University
638
- - 🤖 Base Model: GPT-2 (Decoder-Only Transformer)
639
- - 📊 Training: 10,000+ pseudo-code to code pairs
640
- - 🎯 Task: Causal Language Modeling
641
-
642
- ---
643
-
644
- ## ⚠️ Limitations
645
-
646
- - Model may not handle very complex algorithms perfectly
647
- - Generated code should be tested before production use
648
- - Best results with clear, specific pseudo-code descriptions
649
- - Model trained on C++ code, adapted for Python generation
650
-
651
- ---
652
-
653
- ## 🤝 Tips for Best Results
654
-
655
- 1. ✅ **Be Specific**: "create a function to sort list in ascending order" vs "sort list"
656
- 2. ✅ **Use Action Words**: "create", "define", "implement", "calculate"
657
- 3. ✅ **Mention Data Types**: "list", "string", "dictionary", "integer"
658
- 4. ✅ **Include Details**: "recursive function" vs just "function"
659
- 5. ✅ **Try Variations**: Generate multiple times with different temperatures
660
 
661
- """)
662
 
663
- # Tab 3: History
664
- with gr.Tab("📜 History"):
665
- gr.Markdown("## 📊 Generation History")
666
- history_display = gr.Textbox(
667
- label="Recent Generations",
668
- lines=20,
669
- interactive=False
 
670
  )
671
- refresh_history_btn = gr.Button("🔄 Refresh History", variant="secondary")
672
-
673
- gr.Markdown("""
674
- ---
675
- ### 🌟 Features
676
- - ✅ Upload and use custom trained models
677
- - ✅ BLEU score calculation for quality assessment
678
- - ✅ Multiple evaluation metrics (Precision, Recall, F1)
679
- - ✅ Generate multiple code variations
680
- - ✅ Real-time performance tracking
681
- - ✅ Example prompts library
682
- - ✅ Generation history
683
 
684
- ### 📝 Citation
685
- If you use this model, please cite:
686
- ```
687
- @article{kulal2019spoc,
688
- title={SPOC: Search-based Pseudo-code to Code},
689
- author={Kulal, Sumith and Pasupat, Panupong and Chandra, Kartik and Lee, Mina and Padon, Oded and Aiken, Alex and Liang, Percy},
690
- journal={arXiv preprint arXiv:1906.04908},
691
- year={2019}
692
- }
693
- ```
694
-
695
- **Built with ❤️ using HuggingFace Transformers & Gradio**
696
- """)
697
-
698
- # Event handlers
699
- example_dropdown.change(
700
- fn=show_examples,
701
- inputs=[example_dropdown],
702
- outputs=[pseudo_input]
703
- )
704
-
705
- generate_btn.click(
706
- fn=generate_code_from_pseudo,
707
- inputs=[pseudo_input, max_length, temperature, top_k, top_p, num_sequences, reference_code],
708
- outputs=[code_output, metrics_output, bleu_output, alternatives_output]
709
  )
710
 
711
- clear_btn.click(
712
- fn=clear_all,
713
- inputs=[],
714
- outputs=[pseudo_input, reference_code, code_output, metrics_output, bleu_output,
715
- max_length, temperature, top_k, top_p, num_sequences]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
716
  )
717
 
718
- refresh_history_btn.click(
719
- fn=show_history,
720
- inputs=[],
721
- outputs=[history_display]
 
722
  )
723
 
724
- # Launch the interface
725
  if __name__ == "__main__":
726
- demo.launch(share=False)
 
1
  import gradio as gr
 
2
  import torch
3
+ import pickle
4
+ from transformers import GPT2Tokenizer, GPT2LMHeadModel
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
 
6
# Load model and tokenizer from pickle files
print("Loading model and tokenizer...")

try:
    # Load LoRA model
    # NOTE(review): pickle.load executes arbitrary code from the file — acceptable
    # only because these artifacts ship with the Space itself, never user uploads.
    with open('gpt2_pseudo2code_lora_model.pkl', 'rb') as f:
        model = pickle.load(f)
    print("✓ Model loaded successfully")

    # Load tokenizer
    with open('gpt2_pseudo2code_tokenizer.pkl', 'rb') as f:
        tokenizer = pickle.load(f)
    print("✓ Tokenizer loaded successfully")

    # Move model to appropriate device
    # NOTE(review): if the pickle was written on a CUDA machine, plain pickle.load
    # may fail on a CPU-only host (no map_location remapping) — confirm the
    # artifact was saved from a CPU-resident model.
    device = "cuda" if torch.cuda.is_available() else "cpu"
    model = model.to(device)
    model.eval()  # inference mode: disables dropout and similar training behavior
    print(f"✓ Model moved to {device}")

except Exception as e:
    # Fail fast: the app is useless without the model, so log and re-raise.
    print(f"Error loading model: {e}")
    raise
29
+
30
def generate_code(pseudocode, indent, line, max_length=128, temperature=0.7, top_p=0.9):
    """
    Generate code from pseudo-code with line and indent information.

    Args:
        pseudocode: Input pseudo-code string.
        indent: Indentation level of the target line.
        line: Line number of the target line in the program.
        max_length: Maximum total sequence length (prompt + generated tokens).
        temperature: Sampling temperature (higher = more random).
        top_p: Nucleus sampling probability threshold.

    Returns:
        Generated code string, or an error message string on failure.
    """
    try:
        # Format input with line and indent information.
        # NOTE(review): assumed to match the prompt template used during
        # fine-tuning — confirm against the training script.
        prompt = f"Pseudocode: {pseudocode} | Indent: {indent} | Line: {line}\nCode:"

        # GPT-2 ships without a pad token; asking the tokenizer to pad would
        # raise "Asking to pad but the tokenizer does not have a padding token".
        # Reuse EOS as pad, mirroring the pad_token_id passed to generate().
        if tokenizer.pad_token is None:
            tokenizer.pad_token = tokenizer.eos_token

        # Tokenize input
        inputs = tokenizer(prompt, return_tensors='pt', padding=True)

        # Move tensors to the same device as the model parameters
        device = next(model.parameters()).device
        inputs = {k: v.to(device) for k, v in inputs.items()}

        # Generate (eval() is idempotent; kept as a safety net in case the
        # model was flipped back to train mode elsewhere)
        model.eval()
        with torch.no_grad():
            outputs = model.generate(
                **inputs,
                max_length=max_length,
                temperature=temperature,
                top_p=top_p,
                do_sample=True,
                pad_token_id=tokenizer.eos_token_id,
                eos_token_id=tokenizer.eos_token_id,
                num_return_sequences=1
            )

        # Decode output, dropping special tokens such as EOS padding
        generated_text = tokenizer.decode(outputs[0], skip_special_tokens=True)

        # Extract only the code part after the "Code:" marker
        if "Code:" in generated_text:
            code = generated_text.split("Code:")[1].strip()
        else:
            code = generated_text.strip()

        return code

    except Exception as e:
        # Surface the failure to the UI as text rather than crashing the Space.
        return f"Error generating code: {str(e)}"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
83
 
84
def gradio_generate_code(pseudocode, indent, line, temperature=0.7, top_p=0.9, max_length=128):
    """
    Wrapper function for the Gradio interface.

    Validates the widget inputs, then delegates to generate_code(). Always
    returns a string so the output textbox can display either the generated
    code or a user-facing error message.
    """
    if not pseudocode.strip():
        return "⚠️ Please enter some pseudocode!"

    try:
        # gr.Number can deliver None (cleared field) as well as a float, so
        # int(None) (TypeError) and int("abc") (ValueError) must both map to
        # the same friendly validation message.
        indent = int(indent)
        line = int(line)
        generated_code = generate_code(
            pseudocode,
            indent,
            line,
            max_length=int(max_length),
            temperature=float(temperature),
            top_p=float(top_p)
        )
        return generated_code
    except (TypeError, ValueError):
        return "⚠️ Indent and Line must be valid numbers!"
    except Exception as e:
        return f"❌ Error: {str(e)}"
107
+
108
# Example rows for the Gradio Examples widget.
# Column order: [pseudocode, indent, line, temperature, top_p, max_length];
# every example shares the default sampling settings.
_EXAMPLE_ROWS = [
    ("create integer n", 1, 1),
    ("read n", 1, 2),
    ("for i from 0 to n", 1, 3),
    ("print i", 2, 4),
    ("if n is equal to 0", 1, 5),
    ("create string s", 1, 1),
    ("read s", 1, 2),
]
examples = [[text, indent, line, 0.7, 0.9, 128] for text, indent, line in _EXAMPLE_ROWS]
118
+
119
# Create Gradio interface.
# Layout: header markdown, then a two-column row (inputs | output),
# an Examples widget, a usage guide, and finally the button wiring.
with gr.Blocks(theme=gr.themes.Soft(), title="Pseudo-Code to Code Generator") as demo:
    gr.Markdown(
        """
        # 🐍 Pseudo-Code to Code Generator (GPT-2 + LoRA)

        Convert natural language pseudo-code to executable code using a fine-tuned GPT-2 model with LoRA.

        **Model Details:**
        - Base Model: GPT-2
        - Training: SPOC Dataset (C++ code examples)
        - Optimization: LoRA (Low-Rank Adaptation) + 16-bit precision
        - Trained on: 20,000 pseudo-code to code pairs

        **Note:** The model was trained on C++ code examples from the SPOC dataset, so it generates C++-style code.
        """
    )

    with gr.Row():
        # Left column: pseudocode text, positional metadata, sampling knobs.
        with gr.Column(scale=1):
            gr.Markdown("### 📝 Input")

            pseudocode_input = gr.Textbox(
                label="Pseudocode",
                placeholder="Enter your pseudocode here...\nExample: create integer n",
                lines=5,
                max_lines=10
            )

            with gr.Row():
                # precision=0 constrains the widget to whole numbers.
                indent_input = gr.Number(
                    label="Indent Level",
                    value=1,
                    precision=0,
                    info="Indentation level (0=no indent, 1=first level, etc.)"
                )

                line_input = gr.Number(
                    label="Line Number",
                    value=1,
                    precision=0,
                    info="Line number in the program"
                )

            gr.Markdown("### ⚙️ Generation Parameters")

            with gr.Row():
                temperature_slider = gr.Slider(
                    minimum=0.1,
                    maximum=1.5,
                    value=0.7,
                    step=0.1,
                    label="Temperature",
                    info="Higher = more creative/random"
                )

                top_p_slider = gr.Slider(
                    minimum=0.1,
                    maximum=1.0,
                    value=0.9,
                    step=0.05,
                    label="Top-p (Nucleus Sampling)",
                    info="Probability threshold for sampling"
                )

                max_length_slider = gr.Slider(
                    minimum=64,
                    maximum=256,
                    value=128,
                    step=16,
                    label="Max Length",
                    info="Maximum tokens to generate"
                )

            generate_btn = gr.Button("🚀 Generate Code", variant="primary", size="lg")

        # Right column: generated output plus click-to-run examples.
        with gr.Column(scale=1):
            gr.Markdown("### 💻 Generated Code")

            output = gr.Textbox(
                label="Generated Code",
                lines=15,
                max_lines=20,
                show_copy_button=True
            )

            gr.Markdown("### 📚 Examples")
            # cache_examples=False: each example runs the model live on click
            # instead of pre-computing outputs at startup.
            gr.Examples(
                examples=examples,
                inputs=[pseudocode_input, indent_input, line_input, temperature_slider, top_p_slider, max_length_slider],
                outputs=output,
                fn=gradio_generate_code,
                cache_examples=False,
            )

    gr.Markdown(
        """
        ---
        ### ℹ️ How to Use:
        1. **Enter pseudocode**: Write your natural language description
        2. **Set indent level**: Specify the indentation (0 for no indent, 1 for first level, etc.)
        3. **Set line number**: Indicate the line position in your program
        4. **Adjust parameters** (optional): Fine-tune temperature and top-p for different results
        5. **Click Generate**: Get your code!

        ### 💡 Tips:
        - Higher temperature (0.8-1.2) = more creative but potentially less accurate
        - Lower temperature (0.5-0.7) = more conservative and predictable
        - Top-p controls diversity; 0.9 is usually a good balance
        - The model generates C++-style code as it was trained on the SPOC dataset

        ### 🔗 Resources:
        - [SPOC Dataset](https://github.com/sumith1896/spoc)
        - [Research Paper](https://arxiv.org/pdf/1906.04908)
        - Model trained with LoRA for efficiency
        """
    )

    # Connect button to function
    generate_btn.click(
        fn=gradio_generate_code,
        inputs=[pseudocode_input, indent_input, line_input, temperature_slider, top_p_slider, max_length_slider],
        outputs=output
    )
243
 
244
# Launch the app only when executed as a script (not when imported).
if __name__ == "__main__":
    demo.launch()