pratikshahp committed on
Commit
17a9ace
·
verified ·
1 Parent(s): 7701e24

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -20,14 +20,15 @@ def generate_mcqs(text, num_questions=5):
20
  if not text.strip():
21
  return ["No text extracted from the PDF. Unable to generate MCQs."]
22
 
23
- # Tokenize the input text
24
- inputs = tokenizer(text, return_tensors="pt", max_length=512, truncation=True)
 
25
 
26
  mcqs = []
27
  generator = pipeline("text-generation", model=model, tokenizer=tokenizer)
28
  for _ in range(num_questions):
29
  # Generate a single MCQ at a time
30
- mcq = generator(text, max_length=512, max_new_tokens=100)[0]["generated_text"]
31
  mcqs.append(mcq)
32
 
33
  return mcqs
 
20
  if not text.strip():
21
  return ["No text extracted from the PDF. Unable to generate MCQs."]
22
 
23
+ # Truncate text to fit within the model's max token limit
24
+ max_input_length = 512 - 100 # Reserve space for generated tokens
25
+ inputs = tokenizer(text, return_tensors="pt", max_length=max_input_length, truncation=True)
26
 
27
  mcqs = []
28
  generator = pipeline("text-generation", model=model, tokenizer=tokenizer)
29
  for _ in range(num_questions):
30
  # Generate a single MCQ at a time
31
+ mcq = generator(tokenizer.decode(inputs['input_ids'][0]), max_new_tokens=100)[0]["generated_text"]
32
  mcqs.append(mcq)
33
 
34
  return mcqs