Spaces:

mkdirjason
/

Generating_English_Question

Sleeping

App Files Files Community

Generating_English_Question / app.py

mkdirjason

first_init

902e3f2 verified about 1 year ago

raw

history blame

6.47 kB

	# Third-party dependencies: gradio, easyocr, pdfplumber.
	# They must be installed outside this script (for example by listing them in
	# requirements.txt). The original `!pip install ...` lines are IPython/Jupyter
	# shell magics, which are a SyntaxError in a plain .py file, so they are kept
	# here only as a record of what needs to be installed:
	#   pip install gradio
	#   pip install easyocr
	#   pip install pdfplumber

	from transformers import pipeline
	import gradio as gr
	import easyocr
	import pdfplumber
	import random

	# Page header texts; usable with both Interface- and Blocks-style apps.
	title = "<h1>產生英文題目</h1>"
	description = """這是一個利用hugging face 產生英文題目的小專案"""
	# NOTE(review): `textbox` is not referenced anywhere else in the visible file;
	# the text tab builds its own `text_input` component instead.
	textbox = gr.Textbox(label="請輸入英文文章:", placeholder="While lily is setting...", lines=5)

	# Create the Blocks container that the UI is laid out in.
	demo = gr.Blocks()

	# Load the text2text-generation model from Hugging Face; it is used for both
	# the question prompts and the answer prompts.
	question_generator = pipeline("text2text-generation", model="valhalla/t5-base-qg-hl")

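	# Earlier variant (disabled): generate five questions without answer choices.
	# def question_generate(context):
	#     # Let the model generate questions from the article
	#     question_result = []
	#     for i in range(5):
	#         question = question_generator(f"question: {context}",
	#                                       max_length=100,
	#                                       do_sample=True,  # enable sampling for more variety
	#                                       temperature=0.8 + (i * 0.1),  # raise the temperature step by step for more varied results
	#                                       top_p=0.9
	#                                       )
	#         question_result.append(f"Q{i+1}. {question[0]['generated_text']}")
	#
	#     return "\n".join(question_result)  # return the questions separated by newlines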

	def question_generator_with_answer(context, *, num_wrong=3, max_attempts=20, generator=None):
	    """Generate one multiple-choice question about ``context``.

	    The model is sampled once for the question, once for the correct answer,
	    and then repeatedly for distractors until ``num_wrong`` distinct ones have
	    been collected or ``max_attempts`` samples have been drawn.

	    Args:
	        context: The article text the question should be based on.
	        num_wrong: Number of distinct wrong answers to aim for.
	        max_attempts: Upper bound on distractor samples. Without it the
	            collection loop never ends when the model keeps repeating the
	            correct answer, a duplicate, or text containing "?".
	        generator: Callable with the same call shape as the module-level
	            ``question_generator`` pipeline (prompt plus generation keyword
	            arguments, returning ``[{"generated_text": ...}]``). Defaults to
	            that pipeline.

	    Returns:
	        A dict with the keys ``"question"``, ``"choices"`` (shuffled, correct
	        answer included; may hold fewer than ``num_wrong + 1`` entries when the
	        attempt limit is reached) and ``"correct_answer"``.
	    """
	    if generator is None:
	        generator = question_generator

	    # Generate the question.
	    question_data = generator(f"question:{context}",
	                              max_length=100, do_sample=True, temperature=0.8, top_p=0.9)
	    question = question_data[0]['generated_text']

	    # Generate the correct answer.
	    answer_data = generator(f"answer:{context}",
	                            max_length=100, do_sample=True, temperature=1, top_p=0.9)
	    correct_answer = answer_data[0]['generated_text']

	    # Generate the wrong answers.
	    # NOTE(review): this prompt differs from the one above only by the space
	    # after "answer:"; it is kept exactly as in the original.
	    wrong_answers = set()
	    for _ in range(max_attempts):
	        if len(wrong_answers) >= num_wrong:
	            break
	        wrong_data = generator(f"answer: {context}", max_length=50,
	                               do_sample=True, temperature=1.0, top_p=0.8)
	        wrong_answer = wrong_data[0]['generated_text']
	        # Skip repeats of the correct answer and outputs that look like questions.
	        if wrong_answer != correct_answer and "?" not in wrong_answer:
	            wrong_answers.add(wrong_answer)

	    # Add the correct answer to the options and shuffle their order.
	    choices = list(wrong_answers) + [correct_answer]
	    random.shuffle(choices)

	    # Return the question together with its options.
	    return {
	        "question": question,
	        "choices": choices,
	        "correct_answer": correct_answer,
	    }

	def format_question_output(context):
	    """Build four multiple-choice questions from ``context`` as display text.

	    Each question is rendered as ``Q<n>.<question>`` followed by a blank line
	    and its options labelled A, B, C, ...; the rendered questions are joined
	    with newlines.
	    """

	    def render(j):
	        # One model round-trip per question; j is the zero-based question index.
	        result = question_generator_with_answer(context)
	        question_text = f"{result['question']}\n"
	        labelled = (f"{chr(65+i)}. {choice}" for i, choice in enumerate(result['choices']))
	        choices_text = "\n".join(labelled)
	        return f"\nQ{j+1}.{question_text}\n{choices_text}\n"

	    # Join the rendered questions with newlines.
	    return "\n".join([render(j) for j in range(4)])

	# Alternative formatter (disabled): a single question followed by its correct answer.
	# def format_question_output(context):
	#     result = question_generator_with_answer(context)
	#     question_text = f"{result['question']}\n\n"
	#     choices_text = "\n".join([f"{chr(65+i)}. {choice}" for i, choice in enumerate(result['choices'])])
	#     return f"{question_text}\n{choices_text}\n\n✅ 正確答案: {result['correct_answer']}"


	# PDF text extraction
	def extract_text_from_pdf(pdf_path):
	    """Extract the text of an uploaded PDF and generate questions from it.

	    Args:
	        pdf_path: The uploaded file, either as a path string or as an object
	            whose ``.name`` attribute holds the path (the form the original
	            code relied on).

	    Returns:
	        The formatted questions, or an error message when no text could be
	        extracted from the document.
	    """
	    # Accept a plain path as well as a file-like wrapper exposing `.name`.
	    path = pdf_path if isinstance(pdf_path, str) else pdf_path.name
	    with pdfplumber.open(path) as pdf:
	        # `or ""` guards against extract_text() yielding None for a page
	        # without extractable text, which would break the concatenation.
	        text = "".join((page.extract_text() or "") + "\n" for page in pdf.pages)
	    # A scanned or empty PDF leaves only newlines; do not feed that to the model.
	    if not text.strip():
	        return "錯誤：無法從 PDF 擷取任何文字，請確認檔案內容。"
	    return format_question_output(text)



	# Image text recognition (recognition accuracy is too low)
	# Shared easyocr reader; created on first use because building it is costly.
	_OCR_READER = None


	def _get_ocr_reader():
	    """Return the shared easyocr reader, creating it on the first call."""
	    global _OCR_READER
	    if _OCR_READER is None:
	        _OCR_READER = easyocr.Reader(['en', 'ch_tra'])
	    return _OCR_READER


	def OCR(photo):
	    """Recognize the text in ``photo`` and return it as a single string.

	    Args:
	        photo: The image to read, in any form ``easyocr.Reader.readtext``
	            accepts.

	    Returns:
	        The recognized text fragments in the order easyocr reports them,
	        separated by single spaces so that neighbouring words are not fused
	        together. An empty string when nothing was recognized.
	    """
	    results = _get_ocr_reader().readtext(photo)
	    # Each result is (bounding box, text, confidence); only the text is used.
	    return " ".join(text for _bbox, text, _prob in results)


	# Generate questions once the recognized text has been confirmed
	def OCR_gen(text):
	    """Generate questions from OCR text, or report that the text is empty.

	    Returns the formatted questions when ``text`` contains anything other
	    than whitespace; otherwise returns an error message.
	    """
	    if text.strip():
	        return format_question_output(text)
	    # Nothing usable came out of the OCR step.
	    return "錯誤：OCR 沒有輸出任何可用的文字，請重新檢查圖片內容。"


	# ---- Event handlers ----

	def validate_and_generate(text):
	    """Generate questions from the typed article, or ask for input if it is blank."""
	    if text.strip():
	        return format_question_output(text)
	    return "請輸入文章以產生題目"


	def test_PDF(file):
	    """Generate questions from the uploaded PDF, or ask for an upload if there is none."""
	    return extract_text_from_pdf(file) if file else "請上傳PDF文件以產生題目"


	def test_image(image):
	    """Run OCR on the uploaded image, or ask for an upload if there is none."""
	    if image is not None:
	        return OCR(image)
	    return "請上傳圖片以產生題目"


	def test_finished(text):
	    """Generate questions from the OCR text box once it holds recognized text.

	    The box is treated as not ready when it is blank or still shows the
	    "please upload an image" message written by ``test_image``.
	    """
	    if text.strip() and text != "請上傳圖片以產生題目":
	        return OCR_gen(text)
	    return "請確認文章已經輸入"


	# ---- Layout and event wiring ----
	# NOTE(review): the Row/Column nesting below is reconstructed from a source
	# whose indentation was lost; confirm it against the intended layout.
	with demo:
	    gr.Markdown(title)
	    gr.Markdown(description)
	    with gr.Tabs():
	        with gr.TabItem("輸入文字"):
	            with gr.Row():
	                text_input = gr.Textbox(label="請輸入英文文章:", placeholder="While lily is setting...", lines=5)
	                with gr.Column():
	                    text_output = gr.Textbox(label="題目")
	                    text_button = gr.Button("產生題目")
	        with gr.TabItem("PDF文件辨識"):
	            with gr.Row():
	                PDF_input = gr.File(label="請上傳PDF文件")
	                with gr.Column():
	                    PDF_output = gr.Textbox()
	                    PDF_button = gr.Button("產生題目")
	        with gr.TabItem("圖片辨識"):
	            with gr.Row():
	                image_input = gr.Image()
	                # Recognize the text in the image
	                with gr.Column():
	                    img_tem = gr.Textbox(placeholder="請確認辨識結果",label="辨識結果")
	                    img_button = gr.Button("開始解析")
	                    image_button = gr.Button("產生題目")
	                # Generated questions
	                with gr.Column():
	                    image_output = gr.Textbox(label="題目")

	    # Typed text -> questions
	    text_button.click(validate_and_generate, inputs=text_input, outputs=text_output)
	    # Uploaded PDF -> questions
	    PDF_button.click(test_PDF, inputs=PDF_input, outputs=PDF_output)
	    # Uploaded image -> recognized text
	    img_button.click(test_image, inputs=image_input, outputs=img_tem)
	    # Confirmed recognized text -> questions
	    image_button.click(test_finished, inputs=img_tem, outputs=image_output)


	demo.launch()