Spaces:

NavyDevilDoc
/

AI_Toolkit

Sleeping

App Files Community

NavyDevilDoc committed on Dec 22, 2025

Commit

73edd8f

verified ·

1 Parent(s): 90ae931

Update src/core/QuizEngine.py

Browse files

Files changed (1) hide show

src/core/QuizEngine.py +22 -14

src/core/QuizEngine.py CHANGED Viewed

@@ -31,35 +31,43 @@ class QuizEngine:
         user_dir = os.path.join(self.source_dir, username)
         if not os.path.exists(user_dir): return None
-        # 1. Get files
         files = [f for f in os.listdir(user_dir) if f.lower().endswith(('.txt', '.md'))]
         if not files: return None
-        # Retry Loop: Try up to 5 times to find a "worthy" chunk
-        for attempt in range(5):
             selected_file = random.choice(files)
             try:
-                with open(os.path.join(user_dir, selected_file), 'r', encoding='utf-8', errors='ignore') as f:
                     text = f.read()
-                # DEFENSE 1: Aggressive Heuristic Filtering
-                # Split by double newline (paragraphs)
                 paragraphs = text.split('\n\n')
                 candidates = []
                 for p in paragraphs:
                     p = p.strip()
-                    # A. Too short?
-                    if len(p) < 250: continue
-                    # B. Looks like a list item or table row? (starts with number/bullet)
-                    if p[0].isdigit() or p.startswith(('-', '*', '•')): continue
-                    # C. Looks like administrative noise?
                     if "intentionally left blank" in p.lower(): continue
                     candidates.append(p)
                 if not candidates: continue
-                # Pick a random survivor
                 selected_context = random.choice(candidates)
                 return {
@@ -69,10 +77,10 @@ class QuizEngine:
                 }
             except Exception as e:
-                self.logger.error(f"Error fetching context: {e}")
                 continue
-        return None # Failed to find good text after 5 tries
     def construct_question_generation_prompt(self, context_text):
         """

         user_dir = os.path.join(self.source_dir, username)
         if not os.path.exists(user_dir): return None
         files = [f for f in os.listdir(user_dir) if f.lower().endswith(('.txt', '.md'))]
         if not files: return None
+        # Try up to 10 times to find a file with valid chunks
+        for attempt in range(10):
             selected_file = random.choice(files)
             try:
+                file_path = os.path.join(user_dir, selected_file)
+                with open(file_path, 'r', encoding='utf-8', errors='ignore') as f:
                     text = f.read()
+                # DEFENSE 1: Revised Filtering
+                # We split by double newline to get paragraphs
                 paragraphs = text.split('\n\n')
                 candidates = []
                 for p in paragraphs:
                     p = p.strip()
+                    # A. Absolute junk filter (too short to be a question)
+                    if len(p) < 150: continue
+                    # B. Administrative noise filter
                     if "intentionally left blank" in p.lower(): continue
+                    if "table of contents" in p.lower(): continue
+                    # C. The "Number" Filter (RELAXED)
+                    # Old rule: if p[0].isdigit(): continue
+                    # New rule: If it starts with a number but is long, KEEP IT.
+                    # We only ban "short" numbered lines (likely headers/TOC)
+                    if p[0].isdigit() and len(p) < 250:
+                        continue
                     candidates.append(p)
                 if not candidates: continue
+                # Success!
                 selected_context = random.choice(candidates)
                 return {
                 }
             except Exception as e:
+                self.logger.error(f"Error fetching context from {selected_file}: {e}")
                 continue
+        return None
     def construct_question_generation_prompt(self, context_text):
         """