Spaces:

Zlovoblachko
/

lang_learn_app

Sleeping

App Files Files Community

Zlovoblachko committed on May 30, 2025

Commit

62e8dda

1 Parent(s): 4b3ae07

databank added

Browse files

Files changed (1) hide show

app.py +451 -32

app.py CHANGED Viewed

@@ -133,6 +133,48 @@ class HuggingFaceT5GEDInference:
         return error_spans
     def _preprocess_inputs(self, text, max_length=128):
         """Preprocess input text exactly as during training"""
         # Get GED predictions
@@ -242,19 +284,19 @@ class HuggingFaceT5GEDInference:
         """Enhanced analysis method for Gradio integration"""
         if not text.strip():
             return "Model not available or empty text", ""
         try:
             # Get corrected text
             corrected_text = self.correct_text(text)
-            # Get error spans
             error_spans = self._get_error_spans(text)
             # Generate HTML output
             html_output = self.generate_html_analysis(text, corrected_text, error_spans)
             return corrected_text, html_output
         except Exception as e:
             return f"Error during analysis: {str(e)}", ""
@@ -317,6 +359,21 @@ class HuggingFaceT5GEDInference:
         </div>
         """
         return html
 # Initialize SQLite database for storing submissions and exercises
 def init_database():
@@ -375,11 +432,154 @@ def init_database():
         created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
     )''')
     conn.commit()
     conn.close()
 # Initialize database and components
 init_database()
 print("Initializing enhanced grammar checker...")
 grammar_checker = HuggingFaceT5GEDInference()
 print("Grammar checker initialized successfully!")
@@ -424,26 +624,49 @@ def analyze_student_writing(text, student_name, task_title="General Writing Task
     return corrected_text, html_analysis
 def create_exercise_from_text(text, exercise_title="Grammar Exercise"):
-    """Create an exercise from text with errors using enhanced analysis"""
     if not text.strip():
         return "Please enter text to create an exercise.", ""
-    # Analyze text to find sentences with errors
     sentences = nltk.sent_tokenize(text)
     exercise_sentences = []
     for sentence in sentences:
-        corrected, _ = grammar_checker.analyze_text(sentence)
-        if sentence.strip() != corrected.strip():  # Has errors
             exercise_sentences.append({
                 "original": sentence.strip(),
-                "corrected": corrected.strip()
             })
     if not exercise_sentences:
         return "No errors found in the text. Cannot create exercise.", ""
     # Store exercise in database
     conn = sqlite3.connect('language_app.db')
     c = conn.cursor()
@@ -452,7 +675,7 @@ def create_exercise_from_text(text, exercise_title="Grammar Exercise"):
                  VALUES (?, ?, ?)""",
               (exercise_title,
                "Correct the grammatical errors in the following sentences:",
-               json.dumps(exercise_sentences)))
     exercise_id = c.lastrowid
     conn.commit()
@@ -464,15 +687,18 @@ def create_exercise_from_text(text, exercise_title="Grammar Exercise"):
         <h3>{exercise_title}</h3>
         <p><strong>Exercise ID: {exercise_id}</strong></p>
         <p><strong>Instructions:</strong> Correct the grammatical errors in the following sentences:</p>
         <ol>
     """
-    for i, sentence_data in enumerate(exercise_sentences, 1):
-        exercise_html += f"<li style='margin: 10px 0; padding: 10px; background-color: #f8f9fa; border-radius: 4px;'>{sentence_data['original']}</li>"
     exercise_html += "</ol></div>"
-    return f"Exercise created with {len(exercise_sentences)} sentences! Exercise ID: {exercise_id}", exercise_html
 def attempt_exercise(exercise_id, student_responses, student_name):
     """Submit exercise attempt and get score using enhanced analysis"""
@@ -504,20 +730,28 @@ def attempt_exercise(exercise_id, student_responses, student_name):
     # Calculate score using enhanced analysis
     correct_count = 0
-    feedback = []
     for i, (sentence_data, response) in enumerate(zip(exercise_sentences, responses), 1):
-        correct_answer = sentence_data['corrected']
         # Use the model to check if the response is correct
-        response_corrected, _ = grammar_checker.analyze_text(response)
         is_correct = response_corrected.strip() == response.strip()  # No further corrections needed
         if is_correct:
             correct_count += 1
-            feedback.append(f"✅ Sentence {i}: Excellent! No errors detected.")
-        else:
-            feedback.append(f"❌ Sentence {i}: Your answer: '{response}' | Suggested improvement: '{response_corrected}' | Expected: '{correct_answer}'")
     score = (correct_count / len(exercise_sentences)) * 100
@@ -525,7 +759,7 @@ def attempt_exercise(exercise_id, student_responses, student_name):
     attempt_data = {
         "responses": responses,
         "score": score,
-        "feedback": feedback
     }
     c.execute("""INSERT INTO exercise_attempts (exercise_id, student_name, responses, score)
@@ -535,18 +769,185 @@ def attempt_exercise(exercise_id, student_responses, student_name):
     conn.commit()
     conn.close()
     feedback_html = f"""
-    <div style='font-family: Arial, sans-serif; padding: 20px; border: 1px solid #ddd; border-radius: 8px;'>
-        <h3>Exercise Results</h3>
-        <p><strong>Score: {score:.1f}%</strong> ({correct_count}/{len(exercise_sentences)} correct)</p>
-        <div style='margin-top: 15px;'>
-            {'<br>'.join(feedback)}
         </div>
     </div>
     """
     return f"Score: {score:.1f}%", feedback_html
 def get_student_progress(student_name):
     """Get student's submission and exercise history"""
     if not student_name.strip():
@@ -653,28 +1054,46 @@ with gr.Blocks(title="Language Learning App - Enhanced Grammar Checker", theme=g
         # Exercise Attempt Tab
         with gr.TabItem("✏️ Exercise Practice"):
             gr.Markdown("## Practice Grammar Exercises")
             with gr.Row():
                 with gr.Column():
                     exercise_id_input = gr.Textbox(label="Exercise ID", placeholder="Enter exercise ID")
                     student_name_exercise = gr.Textbox(label="Your Name", placeholder="Enter your name")
                     responses_input = gr.Textbox(
                         label="Your Answers",
-                        lines=6,
-                        placeholder="Enter your corrected sentences (one per line)..."
                     )
-                    submit_exercise_btn = gr.Button("Submit Answers", variant="primary")
                 with gr.Column():
                     score_output = gr.Textbox(label="Your Score")
                     feedback_output = gr.HTML(label="Detailed Feedback")
             submit_exercise_btn.click(
                 attempt_exercise,
                 inputs=[exercise_id_input, responses_input, student_name_exercise],
                 outputs=[score_output, feedback_output]
             )
         # Progress Tracking Tab
         with gr.TabItem("📊 Student Progress"):
             gr.Markdown("## View Student Progress")

         return error_spans
+    def _get_error_spans_detailed(self, text):
+        """Extract flagged tokens together with their second-level error category.
+
+        Calls ``self._get_ged_predictions(text)`` and walks the returned tokens
+        and predictions in lockstep. ``[CLS]``/``[SEP]``/``[PAD]`` and ``##``
+        continuation pieces are skipped, so ``position`` counts only the
+        tokens that are kept.
+
+        Args:
+            text: The text to analyse.
+
+        Returns:
+            A tuple ``(error_spans, error_types)``. ``error_spans`` is a list
+            of dicts with the keys ``"token"``, ``"type"`` and ``"position"``;
+            ``error_types`` holds each distinct category once, in order of
+            first appearance (previously the order was arbitrary because it
+            came from ``list(set(...))``).
+        """
+        # Only the tokens and the per-token predictions are used here.
+        _, tokens, predictions = self._get_ged_predictions(text)
+        # Prediction id -> category name; ids missing from the table become "OTHER".
+        # NOTE(review): presumably mirrors the GED model's label config - confirm.
+        id2label = {
+            0: "correct",
+            1: "ORTH",
+            2: "FORM",
+            3: "MORPH",
+            4: "DET",
+            5: "POS",
+            6: "VERB",
+            7: "NUM",
+            8: "WORD",
+            9: "PUNCT",
+            10: "RED",
+            11: "MULTIWORD",
+            12: "SPELL"
+        }
+        special_tokens = ("[CLS]", "[SEP]", "[PAD]")
+        error_spans = []
+        kept_count = 0  # number of tokens kept so far
+        for token, pred in zip(tokens, predictions):
+            if token.startswith("##") or token in special_tokens:
+                continue
+            kept_count += 1
+            if pred != 0:  # 0 is correct, others are various error types
+                error_spans.append({
+                    "token": token,
+                    "type": id2label.get(pred, "OTHER"),
+                    "position": kept_count - 1
+                })
+        # dict.fromkeys de-duplicates while preserving first-seen order.
+        error_types = list(dict.fromkeys(span["type"] for span in error_spans))
+        return error_spans, error_types
     def _preprocess_inputs(self, text, max_length=128):
         """Preprocess input text exactly as during training"""
         # Get GED predictions
         """Enhanced analysis method for Gradio integration"""
         if not text.strip():
             return "Model not available or empty text", ""
         try:
             # Get corrected text
             corrected_text = self.correct_text(text)
+            # Get error spans (use the original method for display)
             error_spans = self._get_error_spans(text)
             # Generate HTML output
             html_output = self.generate_html_analysis(text, corrected_text, error_spans)
             return corrected_text, html_output
         except Exception as e:
             return f"Error during analysis: {str(e)}", ""
         </div>
         """
         return html
+def clear_and_reload_database():
+    """Delete every row of ``sentence_database`` and load it again.
+
+    Opens ``language_app.db``, removes all rows from the ``sentence_database``
+    table, commits, and then calls ``load_sentence_database()`` with its
+    default path. The connection is closed even when the DELETE fails
+    (for example because the table does not exist yet); the error itself
+    still propagates to the caller.
+    """
+    conn = sqlite3.connect('language_app.db')
+    try:
+        c = conn.cursor()
+        # Clear existing data
+        c.execute("DELETE FROM sentence_database")
+        conn.commit()
+        print("Cleared existing sentence database")
+    finally:
+        conn.close()
+    # Reload
+    load_sentence_database()
 # Initialize SQLite database for storing submissions and exercises
 def init_database():
         created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
     )''')
+    # Sentence database table - ADD THIS
+    c.execute('''CREATE TABLE IF NOT EXISTS sentence_database (
+        id INTEGER PRIMARY KEY AUTOINCREMENT,
+        text TEXT NOT NULL,
+        tags TEXT NOT NULL,
+        error_types TEXT NOT NULL
+    )''')
     conn.commit()
     conn.close()
+def load_sentence_database(jsonl_file_path='sentencewise_full.jsonl'):
+    """Populate the ``sentence_database`` table from a JSONL file.
+
+    Each non-empty line is parsed as JSON and must provide ``text`` and
+    ``tags``. The distinct, non-empty ``second_level_tag`` values of the tags
+    become the row's ``error_types``; lines without any are not inserted.
+    Nothing is loaded when the table already contains rows. Problems with
+    individual lines, a missing file, or any other load error are printed
+    rather than raised.
+
+    Args:
+        jsonl_file_path: Path of the JSONL file to read.
+    """
+    print(f"Debug: Attempting to load from: {jsonl_file_path}")
+    print(f"Debug: Current working directory: {os.getcwd()}")
+    print(f"Debug: File exists: {os.path.exists(jsonl_file_path)}")
+    conn = sqlite3.connect('language_app.db')
+    try:
+        c = conn.cursor()
+        # Create sentence database table
+        c.execute('''CREATE TABLE IF NOT EXISTS sentence_database (
+        id INTEGER PRIMARY KEY AUTOINCREMENT,
+        text TEXT NOT NULL,
+        tags TEXT NOT NULL,
+        error_types TEXT NOT NULL
+    )''')
+        # Check if data already loaded
+        c.execute("SELECT COUNT(*) FROM sentence_database")
+        current_count = c.fetchone()[0]
+        if current_count > 0:
+            print(f"Sentence database already loaded with {current_count} sentences")
+            return
+        # Load JSONL file
+        try:
+            print(f"Debug: Opening file {jsonl_file_path}")
+            lines_processed = 0
+            # Pre-set so the summary below also works for an empty file.
+            line_num = 0
+            with open(jsonl_file_path, 'r', encoding='utf-8') as f:
+                for line_num, line in enumerate(f, 1):
+                    try:
+                        line = line.strip()
+                        if not line:  # Skip empty lines
+                            continue
+                        data = json.loads(line)
+                        text = data.get('text', '')
+                        tags = data.get('tags', [])
+                        if not text or not tags:
+                            print(f"Debug: Skipping line {line_num} - missing text or tags")
+                            continue
+                        # Distinct second_level_tag values, in first-seen order
+                        # so the stored JSON is the same on every run.
+                        error_types = list(dict.fromkeys(
+                            second_level
+                            for second_level in (tag.get('second_level_tag', '') for tag in tags)
+                            if second_level
+                        ))
+                        # Debug: Print first few entries
+                        if line_num <= 3:
+                            print(f"Debug line {line_num}: text='{text[:50]}...', error_types={error_types}")
+                            print(f"Debug: Raw tags for line {line_num}: {tags}")
+                        if error_types:  # Only insert if we have error types
+                            c.execute("""INSERT INTO sentence_database (text, tags, error_types)
+                                    VALUES (?, ?, ?)""",
+                                      (text, json.dumps(tags), json.dumps(error_types)))
+                            lines_processed += 1
+                        if line_num % 1000 == 0:
+                            print(f"Processed {line_num} lines, inserted {lines_processed} sentences...")
+                    except json.JSONDecodeError as e:
+                        print(f"JSON decode error on line {line_num}: {e}")
+                        print(f"Line content: {line[:100]}...")
+                        continue
+                    except Exception as e:
+                        # Best effort: one malformed record must not abort the load.
+                        print(f"Error processing line {line_num}: {e}")
+                        continue
+            conn.commit()
+            print(f"Successfully loaded sentence database with {lines_processed} sentences from {line_num} total lines")
+        except FileNotFoundError:
+            print(f"Error: {jsonl_file_path} not found in {os.getcwd()}")
+            print("Available files:")
+            try:
+                for name in os.listdir('.'):
+                    if name.endswith(('.jsonl', '.json')):
+                        print(f"  - {name}")
+            except OSError:
+                print("  Could not list files")
+        except Exception as e:
+            print(f"Error loading sentence database: {e}")
+    finally:
+        # Runs on the early return and on unexpected errors as well.
+        conn.close()
+def find_similar_sentences(error_types, limit=5):
+    """Pick random stored sentences that share at least one error type.
+
+    For every entry of ``error_types`` up to ``limit`` random rows whose
+    ``error_types`` JSON contains that quoted name are fetched from
+    ``sentence_database``. Results are de-duplicated by sentence text and the
+    search stops as soon as ``limit`` distinct sentences were collected.
+
+    Args:
+        error_types: Error category names to look for.
+        limit: Maximum rows per query and maximum sentences returned.
+
+    Returns:
+        A list of dicts with the keys ``'text'`` and ``'tags'`` (the decoded
+        tag list); empty when ``error_types`` is empty.
+    """
+    if not error_types:
+        return []
+    seen_texts = set()
+    unique_sentences = []
+    conn = sqlite3.connect('language_app.db')
+    try:
+        c = conn.cursor()
+        for error_type in error_types:
+            # error_types is stored as a JSON list, so match the quoted name.
+            c.execute("""SELECT text, tags FROM sentence_database
+                     WHERE error_types LIKE ?
+                     ORDER BY RANDOM()
+                     LIMIT ?""", (f'%"{error_type}"%', limit))
+            for text, tags_json in c.fetchall():
+                if text in seen_texts:
+                    continue
+                seen_texts.add(text)
+                unique_sentences.append({
+                    'text': text,
+                    'tags': json.loads(tags_json)
+                })
+                if len(unique_sentences) >= limit:
+                    return unique_sentences
+    finally:
+        # Close the connection on every exit path, including errors.
+        conn.close()
+    return unique_sentences
 # Initialize database and components
 init_database()
+print("Clearing and loading sentence database...")
+clear_and_reload_database()
 print("Initializing enhanced grammar checker...")
 grammar_checker = HuggingFaceT5GEDInference()
 print("Grammar checker initialized successfully!")
     return corrected_text, html_analysis
 def create_exercise_from_text(text, exercise_title="Grammar Exercise"):
+    """Create an exercise from text with errors using sentence database"""
     if not text.strip():
         return "Please enter text to create an exercise.", ""
+    # Analyze text to extract error types
     sentences = nltk.sent_tokenize(text)
     exercise_sentences = []
+    all_error_types = []
     for sentence in sentences:
+        # Get detailed error analysis
+        error_spans, error_types = grammar_checker._get_error_spans_detailed(sentence)
+        if error_types:  # Has errors
+            corrected, _ = grammar_checker.analyze_text(sentence)
             exercise_sentences.append({
                 "original": sentence.strip(),
+                "corrected": corrected.strip(),
+                "error_types": error_types
             })
+            all_error_types.extend(error_types)
     if not exercise_sentences:
         return "No errors found in the text. Cannot create exercise.", ""
+    # Find similar sentences from database
+    unique_error_types = list(set(all_error_types))
+    similar_sentences = find_similar_sentences(unique_error_types, limit=5)
+    # Combine original sentences with similar ones from database
+    all_exercise_sentences = exercise_sentences.copy()
+    for similar in similar_sentences:
+        # Get corrected version of similar sentence
+        corrected, _ = grammar_checker.analyze_text(similar['text'])
+        all_exercise_sentences.append({
+            "original": similar['text'],
+            "corrected": corrected,
+            "error_types": [tag.get('second_level_tag', '') for tag in similar['tags']]
+        })
     # Store exercise in database
     conn = sqlite3.connect('language_app.db')
     c = conn.cursor()
                  VALUES (?, ?, ?)""",
               (exercise_title,
                "Correct the grammatical errors in the following sentences:",
+               json.dumps(all_exercise_sentences)))
     exercise_id = c.lastrowid
     conn.commit()
         <h3>{exercise_title}</h3>
         <p><strong>Exercise ID: {exercise_id}</strong></p>
         <p><strong>Instructions:</strong> Correct the grammatical errors in the following sentences:</p>
+        <p><em>Error types found: {', '.join(unique_error_types)}</em></p>
         <ol>
     """
+    for i, sentence_data in enumerate(all_exercise_sentences, 1):
+        error_info = f" (Error types: {', '.join(sentence_data.get('error_types', []))})" if sentence_data.get('error_types') else ""
+        exercise_html += f"<li style='margin: 10px 0; padding: 10px; background-color: #f8f9fa; border-radius: 4px;'>{sentence_data['original']}{error_info}</li>"
     exercise_html += "</ol></div>"
+    return f"Exercise created with {len(all_exercise_sentences)} sentences ({len(exercise_sentences)} original + {len(similar_sentences)} from database)! Exercise ID: {exercise_id}", exercise_html
 def attempt_exercise(exercise_id, student_responses, student_name):
     """Submit exercise attempt and get score using enhanced analysis"""
     # Calculate score using enhanced analysis
     correct_count = 0
+    detailed_results = []
     for i, (sentence_data, response) in enumerate(zip(exercise_sentences, responses), 1):
+        original = sentence_data['original']
+        expected = sentence_data['corrected']
         # Use the model to check if the response is correct
+        response_corrected, response_analysis = grammar_checker.analyze_text(response)
         is_correct = response_corrected.strip() == response.strip()  # No further corrections needed
         if is_correct:
             correct_count += 1
+        detailed_results.append({
+            'sentence_num': i,
+            'original': original,
+            'student_response': response,
+            'expected': expected,
+            'model_correction': response_corrected,
+            'is_correct': is_correct,
+            'analysis_html': response_analysis
+        })
     score = (correct_count / len(exercise_sentences)) * 100
     attempt_data = {
         "responses": responses,
         "score": score,
+        "detailed_results": detailed_results
     }
     c.execute("""INSERT INTO exercise_attempts (exercise_id, student_name, responses, score)
     conn.commit()
     conn.close()
+    # Create beautiful HTML results
+    score_color = "#28a745" if score >= 70 else "#ffc107" if score >= 50 else "#dc3545"
     feedback_html = f"""
+    <div style='font-family: Arial, sans-serif; max-width: 1000px; margin: 0 auto;'>
+        <!-- Header Section -->
+        <div style='background: linear-gradient(135deg, #667eea 0%, #764ba2 100%); color: white; padding: 30px; border-radius: 10px 10px 0 0; text-align: center;'>
+            <h2 style='margin: 0; font-size: 28px;'>📊 Exercise Results</h2>
+            <div style='margin-top: 15px; font-size: 48px; font-weight: bold; color: {score_color};'>{score:.1f}%</div>
+            <p style='margin: 10px 0 0 0; font-size: 18px; opacity: 0.9;'>{correct_count} out of {len(exercise_sentences)} sentences correct</p>
+        </div>
+        <!-- Performance Badge -->
+        <div style='background-color: #f8f9fa; padding: 20px; text-align: center; border-left: 1px solid #ddd; border-right: 1px solid #ddd;'>
+    """
+    if score >= 90:
+        feedback_html += """<span style='background-color: #28a745; color: white; padding: 8px 20px; border-radius: 20px; font-weight: bold;'>🏆 Excellent Work!</span>"""
+    elif score >= 70:
+        feedback_html += """<span style='background-color: #17a2b8; color: white; padding: 8px 20px; border-radius: 20px; font-weight: bold;'>👍 Good Job!</span>"""
+    elif score >= 50:
+        feedback_html += """<span style='background-color: #ffc107; color: white; padding: 8px 20px; border-radius: 20px; font-weight: bold;'>📚 Keep Practicing!</span>"""
+    else:
+        feedback_html += """<span style='background-color: #dc3545; color: white; padding: 8px 20px; border-radius: 20px; font-weight: bold;'>💪 Try Again!</span>"""
+    feedback_html += """
+        </div>
+        <!-- Detailed Results -->
+        <div style='background-color: white; border: 1px solid #ddd; border-radius: 0 0 10px 10px;'>
+    """
+    for result in detailed_results:
+        # Determine colors and icons
+        if result['is_correct']:
+            border_color = "#28a745"
+            icon = "✅"
+            status_bg = "#d4edda"
+            status_text = "Correct!"
+        else:
+            border_color = "#dc3545"
+            icon = "❌"
+            status_bg = "#f8d7da"
+            status_text = "Needs Improvement"
+        feedback_html += f"""
+        <div style='border-left: 4px solid {border_color}; margin: 20px; padding: 20px; background-color: #fafafa; border-radius: 8px;'>
+            <div style='display: flex; align-items: center; margin-bottom: 15px;'>
+                <span style='font-size: 24px; margin-right: 10px;'>{icon}</span>
+                <h4 style='margin: 0; color: #333;'>Sentence {result['sentence_num']}</h4>
+                <span style='margin-left: auto; background-color: {status_bg}; padding: 4px 12px; border-radius: 12px; font-size: 12px; font-weight: bold;'>{status_text}</span>
+            </div>
+            <div style='margin-bottom: 15px;'>
+                <div style='margin-bottom: 10px;'>
+                    <strong style='color: #6c757d;'>📝 Original:</strong>
+                    <div style='background-color: #e9ecef; padding: 10px; border-radius: 6px; margin-top: 5px; font-style: italic;'>{result['original']}</div>
+                </div>
+                <div style='margin-bottom: 10px;'>
+                    <strong style='color: #007bff;'>✏️ Your Answer:</strong>
+                    <div style='background-color: #e7f3ff; padding: 10px; border-radius: 6px; margin-top: 5px;'>{result['student_response']}</div>
+                </div>
+        """
+        # Only show model analysis if there were errors in student's response
+        if not result['is_correct'] and result['analysis_html']:
+            feedback_html += f"""
+                <div style='margin-top: 15px; padding: 15px; background-color: #fff3cd; border-radius: 6px; border-left: 3px solid #ffc107;'>
+                    <strong style='color: #856404;'>🔍 Grammar Analysis of Your Response:</strong>
+                    <div style='margin-top: 10px; font-size: 14px;'>
+                        {result['analysis_html']}
+                    </div>
+                </div>
+            """
+        feedback_html += """
+            </div>
+        </div>
+        """
+    feedback_html += """
+        </div>
+        <!-- Footer -->
+        <div style='text-align: center; margin-top: 30px; color: #6c757d; font-size: 14px;'>
+            <p>💡 <strong>Tip:</strong> Review the grammar analysis above to understand common error patterns and improve your writing!</p>
         </div>
     </div>
     """
     return f"Score: {score:.1f}%", feedback_html
+def preview_exercise(exercise_id):
+    """Build an HTML preview of a stored exercise.
+
+    Looks the exercise up in the ``exercises`` table of ``language_app.db``
+    and lists its sentences with optional error-type hints. Stored text is
+    HTML-escaped before it is placed into the markup.
+
+    Args:
+        exercise_id: Exercise id as entered by the user (a string).
+
+    Returns:
+        A ``(status_message, preview_html)`` tuple; ``preview_html`` is an
+        empty string when the id is blank, not an integer, or unknown.
+    """
+    from html import escape  # imported locally so the function is self-contained
+
+    if not exercise_id.strip():
+        return "Please enter an exercise ID.", ""
+    try:
+        exercise_id = int(exercise_id)
+    except ValueError:
+        return "Please enter a valid exercise ID.", ""
+    # Get exercise from database
+    conn = sqlite3.connect('language_app.db')
+    try:
+        c = conn.cursor()
+        c.execute("SELECT title, instructions, sentences FROM exercises WHERE id = ?", (exercise_id,))
+        result = c.fetchone()
+    finally:
+        # Also closes on the "not found" path, which used to leak the connection.
+        conn.close()
+    if not result:
+        return "Exercise not found.", ""
+    title, instructions, sentences_json = result
+    exercise_sentences = json.loads(sentences_json)
+    # Create preview HTML
+    parts = [f"""
+    <div style='font-family: Arial, sans-serif; max-width: 800px; margin: 0 auto;'>
+        <!-- Header -->
+        <div style='background: linear-gradient(135deg, #4CAF50 0%, #45a049 100%); color: white; padding: 25px; border-radius: 10px 10px 0 0; text-align: center;'>
+            <h2 style='margin: 0; font-size: 24px;'>📋 {escape(title)}</h2>
+            <p style='margin: 10px 0 0 0; font-size: 16px; opacity: 0.9;'>Exercise ID: {exercise_id}</p>
+        </div>
+        <!-- Instructions -->
+        <div style='background-color: #e8f5e9; padding: 20px; border-left: 1px solid #ddd; border-right: 1px solid #ddd;'>
+            <h3 style='margin: 0 0 10px 0; color: #2e7d32;'>📝 Instructions:</h3>
+            <p style='margin: 0; font-size: 16px; line-height: 1.5;'>{escape(instructions)}</p>
+            <p style='margin: 10px 0 0 0; font-size: 14px; color: #666; font-style: italic;'>
+                💡 Tip: Read each sentence carefully and identify grammatical errors before writing your corrections.
+            </p>
+        </div>
+        <!-- Sentences -->
+        <div style='background-color: white; border: 1px solid #ddd; border-radius: 0 0 10px 10px; padding: 20px;'>
+            <h3 style='margin: 0 0 20px 0; color: #333;'>📚 Sentences to Correct ({len(exercise_sentences)} total):</h3>
+            <ol style='padding-left: 20px;'>
+    """]
+    for sentence_data in exercise_sentences:
+        original = escape(sentence_data['original'])
+        error_types = sentence_data.get('error_types', [])
+        # Add error type hints if available
+        error_hint = ""
+        if error_types:
+            error_hint = f"<br><small style='color: #666; font-style: italic;'>💡 Focus on: {escape(', '.join(error_types))}</small>"
+        parts.append(f"""
+            <li style='margin: 15px 0; padding: 15px; background-color: #f8f9fa; border-radius: 6px; border-left: 3px solid #4CAF50;'>
+                <div style='font-size: 16px; line-height: 1.5; margin-bottom: 5px;'>{original}</div>
+                {error_hint}
+            </li>
+        """)
+    parts.append("""
+            </ol>
+            <div style='margin-top: 30px; padding: 20px; background-color: #f0f8ff; border-radius: 8px; border: 1px solid #b3d9ff;'>
+                <h4 style='margin: 0 0 10px 0; color: #0066cc;'>🎯 How to Complete This Exercise:</h4>
+                <ol style='margin: 0; padding-left: 20px; color: #333;'>
+                    <li>Read each sentence carefully</li>
+                    <li>Identify grammatical errors (spelling, grammar, word choice, etc.)</li>
+                    <li>Write your corrected version of each sentence</li>
+                    <li>Enter all your answers in the text box below (one sentence per line)</li>
+                    <li>Submit to get immediate feedback and scoring</li>
+                </ol>
+            </div>
+        </div>
+    </div>
+    """)
+    preview_html = "".join(parts)
+    # The status message goes to a plain Textbox, so the title stays unescaped there.
+    return f"Exercise '{title}' loaded successfully! {len(exercise_sentences)} sentences to correct.", preview_html
 def get_student_progress(student_name):
     """Get student's submission and exercise history"""
     if not student_name.strip():
         # Exercise Attempt Tab
         with gr.TabItem("✏️ Exercise Practice"):
             gr.Markdown("## Practice Grammar Exercises")
             with gr.Row():
                 with gr.Column():
                     exercise_id_input = gr.Textbox(label="Exercise ID", placeholder="Enter exercise ID")
+                    # Preview section
+                    with gr.Row():
+                        preview_btn = gr.Button("👀 Preview Exercise", variant="secondary")
+                    preview_result = gr.Textbox(label="Preview Status", lines=1)
+                    preview_display = gr.HTML(label="Exercise Preview")
+                    # Separator
+                    gr.Markdown("---")
+                    # Attempt section
+                    gr.Markdown("### 📝 Complete the Exercise")
                     student_name_exercise = gr.Textbox(label="Your Name", placeholder="Enter your name")
                     responses_input = gr.Textbox(
                         label="Your Answers",
+                        lines=8,
+                        placeholder="After previewing the exercise above, enter your corrected sentences here (one per line)..."
                     )
+                    submit_exercise_btn = gr.Button("✅ Submit Answers", variant="primary")
                 with gr.Column():
                     score_output = gr.Textbox(label="Your Score")
                     feedback_output = gr.HTML(label="Detailed Feedback")
+            # Connect the buttons
+            preview_btn.click(
+                preview_exercise,
+                inputs=[exercise_id_input],
+                outputs=[preview_result, preview_display]
+            )
             submit_exercise_btn.click(
                 attempt_exercise,
                 inputs=[exercise_id_input, responses_input, student_name_exercise],
                 outputs=[score_output, feedback_output]
             )
         # Progress Tracking Tab
         with gr.TabItem("📊 Student Progress"):
             gr.Markdown("## View Student Progress")