Spaces:

Sukmadi
/

test-generator

Sleeping

App Files Files Community

Sukmadi committed on Sep 17, 2025

Commit

0d5d779

1 Parent(s): 390bb82

Update 2 difficulty endpoints and 2 original endpoints

Browse files

Files changed (3) hide show

app.py +134 -27
generator.py +37 -28
utils.py +45 -45

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
 # Import the user's RAGMCQ implementation
-from generator import RAGMCQWithDifficulty
 from utils import log_pipeline
 app = FastAPI(title="RAG MCQ Generator API")
@@ -23,7 +23,8 @@ app.add_middleware(
 )
 # global rag instance
-rag: Optional[RAGMCQWithDifficulty] = None
 class GenerateResponse(BaseModel):
     mcqs: dict
@@ -34,10 +35,11 @@ class ListResponse(BaseModel):
 @app.on_event("startup")
 def startup_event():
-    global rag
     # instantiate the heavy object once
-    rag = RAGMCQWithDifficulty()
     print("RAGMCQ instance created on startup.")
 @app.get("/health")
@@ -121,22 +123,23 @@ async def upload_multiple_files(
     return {"files": saved_files}
-@app.post("/generate_saved", response_model=GenerateResponse)
-async def generate_saved_endpoint(
     n_easy_questions: int = Form(3),
     n_medium_questions: int = Form(5),
     n_hard_questions: int = Form(2),
     qdrant_filename: str = Form("default_filename"),
     collection_name: str = Form("programming"),
     mode: str = Form("rag"),
-    questions_per_chunk: int = Form(3),
     top_k: int = Form(3),
     temperature: float = Form(0.2),
     validate_mcqs: bool = Form(False),
     enable_fiddler: bool = Form(False),
 ):
-    global rag
     if rag is None:
         raise HTTPException(status_code=503, detail="RAGMCQ not ready on server.")
@@ -156,8 +159,8 @@ async def generate_saved_endpoint(
                 collection=collection_name,
                 n_questions=n_questions,
                 mode=mode,
-                questions_per_chunk=questions_per_chunk,
-                top_k=top_k,
                 temperature=temperature,
                 enable_fiddler=enable_fiddler,
                 target_difficulty=difficulty,
@@ -193,30 +196,27 @@ async def generate_saved_endpoint(
             # don't fail the whole request for a validation error — return generator output and note the error
             validation_report = {"error": f"Validation failed: {e}"}
-    # log_pipeline('test/mcq_output.json', content={"mcqs": mcqs, "validation": validation_report})
     return {"mcqs": all_mcqs, "validation": validation_report}
-@app.post("/generate", response_model=GenerateResponse)
-async def generate_endpoint(
     background_tasks: BackgroundTasks,
     file: UploadFile = File(...),
     n_easy_questions: int = Form(3),
     n_medium_questions: int = Form(5),
     n_hard_questions: int = Form(2),
-    qdrant_filename: str = Form("default_filename"),
-    collection_name: str = Form("programming"),
     mode: str = Form("rag"),
-    questions_per_page: int = Form(3),
     top_k: int = Form(3),
     temperature: float = Form(0.2),
     validate_mcqs: bool = Form(False),
     enable_fiddler: bool = Form(False)
 ):
-    global rag
     if rag is None:
         raise HTTPException(status_code=503, detail="RAGMCQ not ready on server.")
@@ -254,10 +254,9 @@ async def generate_endpoint(
     for difficulty, n_questions in difficulty_counts.items():
         try:
             mcqs = rag.generate_from_pdf(
-                pdf_path=tmp_path,
                 n_questions=n_questions,
                 mode=mode,
-                questions_per_page=questions_per_page,
                 top_k=top_k,
                 temperature=temperature,
                 enable_fiddler=enable_fiddler,
@@ -282,23 +281,131 @@ async def generate_endpoint(
                 counter += 1
         except Exception as e:
-            raise HTTPException(status_code=500, detail=f"Generation from file failed: {e}")
     validation_report = None
     if validate_mcqs:
         try:
-            # rag.build_index_from_pdf(tmp_path)
             # validate_mcqs expects keys as strings and the normalized content
             validation_report = rag.validate_mcqs(all_mcqs, top_k=top_k)
         except Exception as e:
             # don't fail the whole request for a validation error — return generator output and note the error
             validation_report = {"error": f"Validation failed: {e}"}
-    # log_pipeline('test/mcq_output.json', content={"mcqs": mcqs, "validation": validation_report})
-    return {"mcqs": all_mcqs, "validation": validation_report}
 if __name__ == "__main__":

 from pydantic import BaseModel
 # Import the user's RAGMCQ implementation
+from generator import RAGMCQWithDifficulty, RAGMCQ
 from utils import log_pipeline
 app = FastAPI(title="RAG MCQ Generator API")
 )
 # global rag instance
+rag: Optional[RAGMCQ] = None
+rag_difficulty: Optional[RAGMCQWithDifficulty] = None
 class GenerateResponse(BaseModel):
     mcqs: dict
 @app.on_event("startup")
 def startup_event():
+    global rag, rag_difficulty
     # instantiate the heavy object once
+    rag = RAGMCQ()
+    rag_difficulty = RAGMCQWithDifficulty()
     print("RAGMCQ instance created on startup.")
 @app.get("/health")
     return {"files": saved_files}
+#? GENERATION with DIFFICULTY
+@app.post("/generate_saved_difficulty", response_model=GenerateResponse)
+async def generate_saved_difficulty_endpoint(
     n_easy_questions: int = Form(3),
     n_medium_questions: int = Form(5),
     n_hard_questions: int = Form(2),
     qdrant_filename: str = Form("default_filename"),
     collection_name: str = Form("programming"),
     mode: str = Form("rag"),
     top_k: int = Form(3),
     temperature: float = Form(0.2),
     validate_mcqs: bool = Form(False),
     enable_fiddler: bool = Form(False),
 ):
+    global rag_difficulty
+    rag = rag_difficulty
     if rag is None:
         raise HTTPException(status_code=503, detail="RAGMCQ not ready on server.")
                 collection=collection_name,
                 n_questions=n_questions,
                 mode=mode,
+                questions_per_chunk=3,
+                top_k=3,
                 temperature=temperature,
                 enable_fiddler=enable_fiddler,
                 target_difficulty=difficulty,
             # don't fail the whole request for a validation error — return generator output and note the error
             validation_report = {"error": f"Validation failed: {e}"}
     return {"mcqs": all_mcqs, "validation": validation_report}
+@app.post("/generate_difficulty", response_model=GenerateResponse)
+async def generate_difficulty_endpoint(
     background_tasks: BackgroundTasks,
     file: UploadFile = File(...),
+    qdrant_filename: str = Form("default_filename"),
+    collection_name: str = Form("programming"),
     n_easy_questions: int = Form(3),
     n_medium_questions: int = Form(5),
     n_hard_questions: int = Form(2),
     mode: str = Form("rag"),
     top_k: int = Form(3),
     temperature: float = Form(0.2),
     validate_mcqs: bool = Form(False),
     enable_fiddler: bool = Form(False)
 ):
+    global rag_difficulty
+    rag = rag_difficulty
     if rag is None:
         raise HTTPException(status_code=503, detail="RAGMCQ not ready on server.")
     for difficulty, n_questions in difficulty_counts.items():
         try:
             mcqs = rag.generate_from_pdf(
+                tmp_path,
                 n_questions=n_questions,
                 mode=mode,
                 top_k=top_k,
                 temperature=temperature,
                 enable_fiddler=enable_fiddler,
                 counter += 1
         except Exception as e:
+            raise HTTPException(status_code=500, detail=f"Generation from saved file failed: {e}")
     validation_report = None
     if validate_mcqs:
         try:
             # validate_mcqs expects keys as strings and the normalized content
             validation_report = rag.validate_mcqs(all_mcqs, top_k=top_k)
         except Exception as e:
             # don't fail the whole request for a validation error — return generator output and note the error
             validation_report = {"error": f"Validation failed: {e}"}
+    return {"mcqs": all_mcqs, "validation": validation_report}
+#? ORIGINAL Generation
+@app.post("/generate_saved", response_model=GenerateResponse)
+async def generate_saved_endpoint(
+    qdrant_filename: str = Form("default_filename"),
+    collection_name: str = Form("programming"),
+    mode: str = Form("rag"),
+    n_questions: int = 10,
+    questions_per_chunk: int = Form(3),
+    top_k: int = Form(3),
+    temperature: float = Form(0.2),
+    validate_mcqs: bool = Form(False),
+    enable_fiddler: bool = Form(False),
+):
+    global rag
+    if rag is None:
+        raise HTTPException(status_code=503, detail="RAGMCQ not ready on server.")
+    try:
+        mcqs = rag.generate_from_qdrant(
+            filename=qdrant_filename,
+            collection=collection_name,
+            mode=mode,
+            n_questions=n_questions,
+            questions_per_chunk=questions_per_chunk,
+            top_k=top_k,
+            temperature=temperature,
+            enable_fiddler=enable_fiddler,
+        )
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=f"Generation from saved file failed: {e}")
+    validation_report = None
+    if validate_mcqs:
+        try:
+            # validate_mcqs expects keys as strings and the normalized content
+            validation_report = rag.validate_mcqs(mcqs, top_k=top_k)
+        except Exception as e:
+            # don't fail the whole request for a validation error — return generator output and note the error
+            validation_report = {"error": f"Validation failed: {e}"}
+    return {"mcqs": mcqs, "validation": validation_report}
+@app.post("/generate", response_model=GenerateResponse)
+async def generate_endpoint(
+    background_tasks: BackgroundTasks,
+    file: UploadFile = File(...),
+    n_questions: int = Form(10),
+    qdrant_filename: str = Form("default_filename"),
+    collection_name: str = Form("programming"),
+    mode: str = Form("rag"),
+    questions_per_page: int = Form(3),
+    top_k: int = Form(3),
+    temperature: float = Form(0.2),
+    validate_mcqs: bool = Form(False),
+    enable_fiddler: bool = Form(False)
+):
+    global rag
+    if rag is None:
+        raise HTTPException(status_code=503, detail="RAGMCQ not ready on server.")
+    # basic file validation
+    if not file.filename.lower().endswith(".pdf"):
+        raise HTTPException(status_code=400, detail="Only PDF files are supported.")
+    # save uploaded file to a temp location
+    tmp_path = _save_upload_to_temp(file)
+    # ensure file removed afterward
+    def _cleanup(path: str):
+        try:
+            os.remove(path)
+        except Exception:
+            pass
+    background_tasks.add_task(_cleanup, tmp_path)
+    # save pdf
+    try:
+        rag.save_pdf_to_qdrant(tmp_path, filename=qdrant_filename, collection=collection_name, overwrite=True)
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=f"Could not save file to Qdrant Cloud: {e}")
+    # generate
+    try:
+        mcqs = rag.generate_from_pdf(
+            tmp_path,
+            n_questions=n_questions,
+            mode=mode,
+            questions_per_page=questions_per_page,
+            top_k=top_k,
+            temperature=temperature,
+            enable_fiddler=enable_fiddler
+        )
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=f"Generation failed: {e}")
+    validation_report = None
+    if validate_mcqs:
+        try:
+            # validate_mcqs expects keys as strings and the normalized content
+            validation_report = rag.validate_mcqs(mcqs, top_k=top_k)
+        except Exception as e:
+            # don't fail the whole request for a validation error — return generator output and note the error
+            validation_report = {"error": f"Validation failed: {e}"}
+    return {"mcqs": mcqs, "validation": validation_report}
 if __name__ == "__main__":

generator.py CHANGED Viewed

@@ -32,7 +32,7 @@ try:
 except Exception:
     _HAS_FAISS = False
-from utils import generate_mcqs_from_text, _post_chat, _safe_extract_json, save_to_local, structure_context_for_llm, new_generate_mcqs_from_text
 from huggingface_hub import login
 login(token=os.environ['HF_MODEL_TOKEN'])
@@ -202,12 +202,12 @@ class RAGMCQ:
                 if not chunk_text.strip():
                     continue
-                to_gen = questions_per_page
                 # ask generator
                 try:
                     mcq_block = generate_mcqs_from_text(
-                        chunk_text, n=to_gen, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler
                     )
                 except Exception as e:
                     # skip this chunk if generator fails
@@ -259,8 +259,9 @@ class RAGMCQ:
                 # call generator for 1 question (or small batch) with the retrieved context
                 try:
                     # request 1 question at a time to keep diversity
                     mcq_block = generate_mcqs_from_text(
-                        context, n=1, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler
                     )
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
@@ -683,7 +684,7 @@ class RAGMCQ:
                 "text": txt,
                 "source_id": source_id,
             }
-            points.append(PointStruct(id=pid, vector=emb.tolist(), payload=payload))
             # upsert in batches
             if len(points) >= batch_size:
@@ -887,9 +888,10 @@ class RAGMCQ:
             for i, txt in enumerate(texts):
                 if not txt.strip():
                     continue
-                to_gen = questions_per_chunk
                 try:
-                    mcq_block = generate_mcqs_from_text(txt, n=to_gen, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler)
                 except Exception as e:
                     print(f"Generator failed on chunk (index {i}): {e}")
                     continue
@@ -933,7 +935,8 @@ class RAGMCQ:
                 context = "\n\n".join(context_parts)
                 try:
-                    mcq_block = generate_mcqs_from_text(context, n=1, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler)
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
                     continue
@@ -967,12 +970,14 @@ class RAGMCQ:
         else:
             raise ValueError("mode must be 'per_chunk' or 'rag'.")
     def _estimate_difficulty_for_generation(
         self,
         q_text: str,
         options: Dict[str, str],
         correct_text: str,
-        context_text: str = "",
     ) -> Tuple[float, str]:
         def safe_map_sim(s):
             # map potentially [-1,1] cosine-like to [0,1], clamp
@@ -1112,13 +1117,13 @@ class RAGMCQWithDifficulty(RAGMCQ):
                 if not chunk_text.strip():
                     continue
-                to_gen = questions_per_page
                 # ask generator
                 try:
-                    structured_context = structure_context_for_llm(context, model=self.generation_model, temperature=0.2, enable_fiddler=False)
-                    mcq_block = generate_mcqs_from_text(
-                        source_text=chunk_text, n=to_gen, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler
                     )
                 except Exception as e:
                     # skip this chunk if generator fails
@@ -1170,9 +1175,10 @@ class RAGMCQWithDifficulty(RAGMCQ):
                 # call generator for 1 question (or small batch) with the retrieved context
                 try:
-                    # request 1 question at a time to keep diversity
                     structured_context = structure_context_for_llm(context, model=self.generation_model, temperature=0.2, enable_fiddler=False)
-                    mcq_block = new_generate_mcqs_from_text(structured_context, n=questions_per_page, model=self.generation_model, temperature=temperature, enable_fiddler=False, target_difficulty=target_difficulty)
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
                     continue
@@ -1264,9 +1270,12 @@ class RAGMCQWithDifficulty(RAGMCQ):
             for i, txt in enumerate(texts):
                 if not txt.strip():
                     continue
-                to_gen = questions_per_chunk
                 try:
-                    mcq_block = new_generate_mcqs_from_text(txt, n=to_gen, model=self.generation_model, temperature=temperature, enable_fiddler=False)
                 except Exception as e:
                     print(f"Generator failed on chunk (index {i}): {e}")
                     continue
@@ -1298,10 +1307,8 @@ class RAGMCQWithDifficulty(RAGMCQ):
                     seed_sent = (stripped[:200] if stripped else "[no text available]")
                 query = f"Create questions about: {seed_sent}"
                 # retrieve top_k chunks from the same file (restricted by filename filter)
                 retrieved = self._retrieve_qdrant(query=query, collection=collection, filename=filename, top_k=top_k)
-                print('retrieved qdrant', retrieved)
                 context_parts = []
                 for payload, score in retrieved:
                     # payload should contain page & chunk_id and text
@@ -1313,9 +1320,11 @@ class RAGMCQWithDifficulty(RAGMCQ):
                 # q generation
                 try:
-                    # Difficulty pipeline: easy, mid, difficult
                     structured_context = structure_context_for_llm(context, model=self.generation_model, temperature=0.2, enable_fiddler=False)
-                    mcq_block = new_generate_mcqs_from_text(structured_context, n=questions_per_chunk, model=self.generation_model, temperature=temperature, enable_fiddler=False, target_difficulty=target_difficulty)
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
                     continue
@@ -1342,18 +1351,18 @@ class RAGMCQWithDifficulty(RAGMCQ):
                     #? change estimate
                     diff_score, diff_label, components = self._estimate_difficulty_for_generation( # type: ignore
-                        q_text=q_text, options={k: str(v) for k,v in options.items()}, correct_text=str(correct_text), context_text=structured_context, concepts_used=concepts
                     )
                     payload["độ khó"] = {"điểm": diff_score, "mức độ": diff_label}
                     # CHECK n generation: if the number of MCQs still requested is smaller than the default batch size (e.g. 5 - 3 = 2 < 3), only generate the remaining 2 MCQs
                     if n_questions - qcount < questions_per_chunk:
-                      questions_per_chunk = n_questions - qcount
                     qcount += 1 # count number of question
-                    print('qcount:', qcount)
-                    print('questions_per_chunk:', questions_per_chunk)
                     output[str(qcount)] = mcq_block[item]
                     if qcount >= n_questions:
@@ -1371,7 +1380,7 @@ class RAGMCQWithDifficulty(RAGMCQ):
         q_text: str,
         options: Dict[str, str],
         correct_text: str,
-        context_text: str = "",
         concepts_used: Dict = {}
     ) -> Tuple[float, str]:
         def safe_map_sim(s):
@@ -1468,7 +1477,7 @@ class RAGMCQWithDifficulty(RAGMCQ):
         score += 0.35 * float(distractor_penalty)
         score += 0.20 * float(mean_sim)
         score += 0.22 * float(amb_flag)
-        score += 0.05 * float(question_len_norm)
         score -= 0.20 * float(gap)
         # clamp
@@ -1493,4 +1502,4 @@ class RAGMCQWithDifficulty(RAGMCQ):
         else:
             label = "khó"
-        return score, label, components

 except Exception:
     _HAS_FAISS = False
+from utils import generate_mcqs_from_text, structure_context_for_llm, new_generate_mcqs_from_text
 from huggingface_hub import login
 login(token=os.environ['HF_MODEL_TOKEN'])
                 if not chunk_text.strip():
                     continue
                 # ask generator
                 try:
+                    structured_context = structure_context_for_llm(chunk_text, model=self.generation_model, temperature=0.2, enable_fiddler=enable_fiddler)
                     mcq_block = generate_mcqs_from_text(
+                        structured_context, n=questions_per_page, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler
                     )
                 except Exception as e:
                     # skip this chunk if generator fails
                 # call generator for 1 question (or small batch) with the retrieved context
                 try:
                     # request 1 question at a time to keep diversity
+                    structured_context = structure_context_for_llm(context, model=self.generation_model, temperature=0.2, enable_fiddler=enable_fiddler)
                     mcq_block = generate_mcqs_from_text(
+                        structured_context, n=1, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler
                     )
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
                 "text": txt,
                 "source_id": source_id,
             }
+            points.append(PointStruct(id=pid, vector=emb.tolist(), payload=payload)) # pyright: ignore[reportPossiblyUnboundVariable]
             # upsert in batches
             if len(points) >= batch_size:
             for i, txt in enumerate(texts):
                 if not txt.strip():
                     continue
                 try:
+                    structured_context = structure_context_for_llm(txt, model=self.generation_model, temperature=0.2, enable_fiddler=enable_fiddler)
+                    mcq_block = generate_mcqs_from_text(structured_context, n=questions_per_chunk, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler)
                 except Exception as e:
                     print(f"Generator failed on chunk (index {i}): {e}")
                     continue
                 context = "\n\n".join(context_parts)
                 try:
+                    structured_context = structure_context_for_llm(context, model=self.generation_model, temperature=0.2, enable_fiddler=enable_fiddler)
+                    mcq_block = generate_mcqs_from_text(structured_context, n=questions_per_chunk, model=self.generation_model, temperature=temperature, enable_fiddler=enable_fiddler)
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
                     continue
         else:
             raise ValueError("mode must be 'per_chunk' or 'rag'.")
     def _estimate_difficulty_for_generation(
         self,
         q_text: str,
         options: Dict[str, str],
         correct_text: str,
+        context_text: str,
     ) -> Tuple[float, str]:
         def safe_map_sim(s):
             # map potentially [-1,1] cosine-like to [0,1], clamp
                 if not chunk_text.strip():
                     continue
                 # ask generator
                 try:
+                    structured_context = structure_context_for_llm(chunk_text, model=self.generation_model, temperature=0.2, enable_fiddler=enable_fiddler)
+                    mcq_block = new_generate_mcqs_from_text(
+                        source_text=structured_context, n=questions_per_page, model=self.generation_model, temperature=temperature, target_difficulty=target_difficulty ,enable_fiddler=enable_fiddler
                     )
                 except Exception as e:
                     # skip this chunk if generator fails
                 # call generator for 1 question (or small batch) with the retrieved context
                 try:
                     structured_context = structure_context_for_llm(context, model=self.generation_model, temperature=0.2, enable_fiddler=False)
+                    mcq_block = new_generate_mcqs_from_text(
+                        source_text=structured_context, n=questions_per_page, model=self.generation_model, temperature=temperature, target_difficulty=target_difficulty ,enable_fiddler=enable_fiddler
+                    )
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
                     continue
             for i, txt in enumerate(texts):
                 if not txt.strip():
                     continue
                 try:
+                    structured_context = structure_context_for_llm(txt, model=self.generation_model, temperature=0.2, enable_fiddler=False)
+                    mcq_block = new_generate_mcqs_from_text(
+                        source_text=structured_context, n=questions_per_chunk, model=self.generation_model,
+                        temperature=temperature, target_difficulty=target_difficulty ,enable_fiddler=enable_fiddler
+                    )
                 except Exception as e:
                     print(f"Generator failed on chunk (index {i}): {e}")
                     continue
                     seed_sent = (stripped[:200] if stripped else "[no text available]")
                 query = f"Create questions about: {seed_sent}"
                 # retrieve top_k chunks from the same file (restricted by filename filter)
                 retrieved = self._retrieve_qdrant(query=query, collection=collection, filename=filename, top_k=top_k)
                 context_parts = []
                 for payload, score in retrieved:
                     # payload should contain page & chunk_id and text
                 # q generation
                 try:
                     structured_context = structure_context_for_llm(context, model=self.generation_model, temperature=0.2, enable_fiddler=False)
+                    mcq_block = new_generate_mcqs_from_text(
+                        source_text=structured_context, n=questions_per_chunk, model=self.generation_model,
+                        temperature=temperature, target_difficulty=target_difficulty ,enable_fiddler=enable_fiddler
+                    )
                 except Exception as e:
                     print(f"Generator failed during RAG attempt {attempts}: {e}")
                     continue
                     #? change estimate
                     diff_score, diff_label, components = self._estimate_difficulty_for_generation( # type: ignore
+                        q_text=q_text, options={k: str(v) for k,v in options.items()}, correct_text=str(correct_text), context_text=structured_context, concepts_used=concepts # type: ignore
                     )
                     payload["độ khó"] = {"điểm": diff_score, "mức độ": diff_label}
                     # CHECK n generation: if the number of MCQs still requested is smaller than the default batch size (e.g. 5 - 3 = 2 < 3), only generate the remaining 2 MCQs
                     if n_questions - qcount < questions_per_chunk:
+                        questions_per_chunk = n_questions - qcount
                     qcount += 1 # count number of question
+                    # print('qcount:', qcount)
+                    # print('questions_per_chunk:', questions_per_chunk)
                     output[str(qcount)] = mcq_block[item]
                     if qcount >= n_questions:
         q_text: str,
         options: Dict[str, str],
         correct_text: str,
+        context_text: str,
         concepts_used: Dict = {}
     ) -> Tuple[float, str]:
         def safe_map_sim(s):
         score += 0.35 * float(distractor_penalty)
         score += 0.20 * float(mean_sim)
         score += 0.22 * float(amb_flag)
+        score += 0.08 * float(question_len_norm)
         score -= 0.20 * float(gap)
         # clamp
         else:
             label = "khó"
+        return score, label, components # type: ignore

utils.py CHANGED Viewed

@@ -99,7 +99,7 @@ def structure_context_for_llm(
         "content": (
             "Bạn là một trợ lý hữu ích chuyên xử lý và cấu trúc văn bản để phục vụ mô hình ngôn ngữ (LLM). Trả lời bằng Tiếng Việt\n"
             "Nhiệm vụ của bạn là:\n"
-            "- Nếu văn bản dài trên 500 từ chia văn bản thành 2 đoạn (chunk) có ý nghĩa rõ ràng.\n"
             "- Mỗi chunk phải **tự chứa đủ thông tin** (self-contained) để LLM có thể hiểu độc lập.\n"
             "- Xác định **chủ đề chính (topic)** của mỗi chunk và dùng nó làm KEY trong JSON.\n"
             "- Trong mỗi topic, tổ chức thông tin thành cấu trúc rõ ràng gồm các trường:\n"
@@ -140,7 +140,7 @@ def structure_context_for_llm(
 def new_generate_mcqs_from_text(
-    source_text: str,
     n: int = 3,
     model: str = "openai/openai/gpt-oss-120b",
     temperature: float = 0.2,
@@ -151,60 +151,60 @@ def new_generate_mcqs_from_text(
     expected_concepts = {
-      "easy": 1,
-      "medium": 2,
-      "hard": (3, 4)
     }
     if isinstance(expected_concepts[target_difficulty], tuple):
-      min_concepts, max_concepts = expected_concepts[target_difficulty]
-      concept_range = f"{min_concepts}-{max_concepts}"
     else:
-      concept_range = expected_concepts[target_difficulty]
     difficulty_prompts = {
-      "easy": (
-          "- Câu hỏi DỄ: kiểm tra duy nhất 1 khái niệm chính cơ bản dễ hiểu, định nghĩa, hoặc công thức đơn giản."
-          "- Đáp án có thể tìm thấy trực tiếp trong văn bản."
-          "- Ngữ cảnh đủ để hiểu khái niệm chính."
-          "- Distractors khác biệt rõ ràng, dễ loại bỏ."
-          "- Độ dài câu hỏi ngắn gọn không quá 10-20 từ hoặc ít hơn 120 ký tự, tập trung vào một ý duy nhất.\n"
-      ),
-      "medium": (
-          "- Câu hỏi TRUNG BÌNH kiểm tra khái niệm chính trong văn bản"
-          "- Nếu câu hỏi thuộc dạng áp dụng và suy luận thiếu dữ liệu để trả lời câu hỏi, thêm nội dung hoặc ví dụ từ văn bản nguồn."
-          "- Các Distractors không quá giống nhau."
-          "- Độ dài câu hỏi vừa phải khoảng 23–30 từ hoặc khoảng 150 - 180 ký tự, có thêm chi tiết phụ để suy luận.\n"
-      ),
-      "hard": (
-          "- Câu hỏi KHÓ kiểm tra thông tin được phân tích/tổng hợp"
-          "- Nếu câu hỏi thuộc dạng áp dụng và suy luận thiếu dữ liệu để trả lời câu hỏi, thêm nội dung hoặc ví dụ từ văn bản nguồn."
-          "- Ít nhất 2 distractors gần giống đáp án đúng, độ tương đồng cao. "
-          f"- Đáp án yêu cầu học sinh suy luận hoặc áp dụng công thức vào ví dụ nếu có."
-          "- Độ dài câu hỏi dài hơn 35 từ hoặc hơn 200 ký tự.\n \n"
-      )
     }
     difficult_criteria = difficulty_prompts[target_difficulty] # "easy", "medium", "hard"
     print(concept_range)
     system_message = {
-      "role": "system",
-      "content": (
-          "Bạn là một trợ lý hữu ích chuyên tạo câu hỏi trắc nghiệm (MCQ). Luôn trả lời bằng tiếng việt"
-          f"Đảm bảo chỉ tạo sinh câu trắc nghiệm có độ khó sau {difficult_criteria}"
-          f"Quan trọng: Mỗi câu hỏi chỉ sử dụng chính xác {concept_range} khái niệm chính (mỗi khái niệm chính có 1 danh sách khái niệm phụ) từ văn bản nguồn. "
-          "Mỗi câu hỏi và đáp án phải dựa trên thông tin từ văn bản nguồn. Không được đưa kiến thức ngoài vào."
-          "Chỉ TRẢ VỀ duy nhất một đối tượng JSON theo đúng schema sau và không kèm giải thích hay trường thêm:\n\n"
-          "{\n"
-          '  "1": { "câu hỏi": "...", "lựa chọn": {"a":"...","b":"...","c":"...","d":"..."}, "đáp án":"...", "khái niệm sử dụng": {"khái niệm chính":["khái niệm phụ", "..."], "..."]}},\n'
-          '  "2": { ... }\n'
-          "}\n\n"
-          "Lưu ý:\n"
-          f"- Tạo đúng {n} mục, đánh số từ 1 tới {n}.\n"
-          "- Khóa 'lựa chọn' phải có các phím a, b, c, d.\n"
-          "- 'đáp án' phải là toàn văn đáp án đúng (không phải ký tự chữ cái), và giá trị này phải khớp chính xác với một trong các giá trị trong 'options'.\n"
-          "- Toàn bộ thông tin cần thiết để trả lời phải nằm trong chính câu hỏi, không tham chiếu lại văn bản nguồn."
-          f"- Sử dụng chính xác {concept_range} khái niệm chính"
         )
     }

         "content": (
             "Bạn là một trợ lý hữu ích chuyên xử lý và cấu trúc văn bản để phục vụ mô hình ngôn ngữ (LLM). Trả lời bằng Tiếng Việt\n"
             "Nhiệm vụ của bạn là:\n"
+            "- Nếu văn bản dài trên 500 từ chia văn bản thành các chunk có ý nghĩa rõ ràng.\n"
             "- Mỗi chunk phải **tự chứa đủ thông tin** (self-contained) để LLM có thể hiểu độc lập.\n"
             "- Xác định **chủ đề chính (topic)** của mỗi chunk và dùng nó làm KEY trong JSON.\n"
             "- Trong mỗi topic, tổ chức thông tin thành cấu trúc rõ ràng gồm các trường:\n"
 def new_generate_mcqs_from_text(
+    source_text: Dict,
     n: int = 3,
     model: str = "openai/openai/gpt-oss-120b",
     temperature: float = 0.2,
     expected_concepts = {
+        "easy": 1,
+        "medium": 2,
+        "hard": (3, 4)
     }
     if isinstance(expected_concepts[target_difficulty], tuple):
+        min_concepts, max_concepts = expected_concepts[target_difficulty]
+        concept_range = f"{min_concepts}-{max_concepts}"
     else:
+        concept_range = expected_concepts[target_difficulty]
     difficulty_prompts = {
+        "easy": (
+            "- Câu hỏi DỄ: kiểm tra duy nhất 1 khái niệm chính cơ bản dễ hiểu, định nghĩa, hoặc công thức đơn giản."
+            "- Đáp án có thể tìm thấy trực tiếp trong văn bản."
+            "- Ngữ cảnh đủ để hiểu khái niệm chính."
+            "- Distractors khác biệt rõ ràng, dễ loại bỏ."
+            "- Độ dài câu hỏi ngắn gọn không quá 10-20 từ hoặc ít hơn 120 ký tự, tập trung vào một ý duy nhất.\n"
+        ),
+        "medium": (
+            "- Câu hỏi TRUNG BÌNH kiểm tra khái niệm chính trong văn bản"
+            "- Nếu câu hỏi thuộc dạng áp dụng và suy luận thiếu dữ liệu để trả lời câu hỏi, thêm nội dung hoặc ví dụ từ văn bản nguồn."
+            "- Các Distractors không quá giống nhau."
+            "- Độ dài câu hỏi vừa phải khoảng 23–30 từ hoặc khoảng 150 - 180 ký tự, có thêm chi tiết phụ để suy luận.\n"
+        ),
+        "hard": (
+            "- Câu hỏi KHÓ kiểm tra thông tin được phân tích/tổng hợp"
+            "- Nếu câu hỏi thuộc dạng áp dụng và suy luận thiếu dữ liệu để trả lời câu hỏi, thêm nội dung hoặc ví dụ từ văn bản nguồn."
+            "- Ít nhất 2 distractors gần giống đáp án đúng, độ tương đồng cao. "
+            f"- Đáp án yêu cầu học sinh suy luận hoặc áp dụng công thức vào ví dụ nếu có."
+            "- Độ dài câu hỏi dài hơn 35 từ hoặc hơn 200 ký tự.\n \n"
+        )
     }
     difficult_criteria = difficulty_prompts[target_difficulty] # "easy", "medium", "hard"
     print(concept_range)
     system_message = {
+        "role": "system",
+        "content": (
+            "Bạn là một trợ lý hữu ích chuyên tạo câu hỏi trắc nghiệm (MCQ). Luôn trả lời bằng tiếng việt"
+            f"Đảm bảo chỉ tạo sinh câu trắc nghiệm có độ khó sau {difficult_criteria}"
+            f"Quan trọng: Mỗi câu hỏi chỉ sử dụng chính xác {concept_range} khái niệm chính (mỗi khái niệm chính có 1 danh sách khái niệm phụ) từ văn bản nguồn. "
+            "Mỗi câu hỏi và đáp án phải dựa trên thông tin từ văn bản nguồn. Không được đưa kiến thức ngoài vào."
+            "Chỉ TRẢ VỀ duy nhất một đối tượng JSON theo đúng schema sau và không kèm giải thích hay trường thêm:\n\n"
+            "{\n"
+            '  "1": { "câu hỏi": "...", "lựa chọn": {"a":"...","b":"...","c":"...","d":"..."}, "đáp án":"...", "khái niệm sử dụng": {"khái niệm chính":["khái niệm phụ", "..."], "..."]}},\n'
+            '  "2": { ... }\n'
+            "}\n\n"
+            "Lưu ý:\n"
+            f"- Tạo đúng {n} mục, đánh số từ 1 tới {n}.\n"
+            "- Khóa 'lựa chọn' phải có các phím a, b, c, d.\n"
+            "- 'đáp án' phải là toàn văn đáp án đúng (không phải ký tự chữ cái), và giá trị này phải khớp chính xác với một trong các giá trị trong 'options'.\n"
+            "- Toàn bộ thông tin cần thiết để trả lời phải nằm trong chính câu hỏi, không tham chiếu lại văn bản nguồn."
+            f"- Sử dụng chính xác {concept_range} khái niệm chính"
         )
     }