Spaces:

IvanMiao
/

LogosAI

Running

App Files Files Community

IvanMiao committed on Jun 9, 2025

Commit

af744f3

1 Parent(s): 4399bf8

feat: translation, add dropdowns

Browse files

Files changed (5) hide show

.gitignore +6 -0
app.py +57 -13
process/interpretation.py +8 -10
process/ocr.py +4 -1
process/translation.py +32 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,6 @@

+.gradio/
+.env
+__pycache__/
+process/__pycache__/
+pyproject.toml
+uv.lock

app.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import gradio as gr
 from process.ocr import perform_raw_ocr, correct_text_with_ai
 from process.interpretation import get_interpretation
 from process.gradio_css import CUSTOM_CSS
@@ -52,7 +53,7 @@ def ai_correct(current_text: str):
 		yield error_msg, error_msg + "\n\n"
-def interpretation_workflow(text: str, genre: str, learn_language, target_language):
 	if not GEMINI_API_KEY:
 		yield "Error: Gemini api key not found."
 		return
@@ -63,15 +64,33 @@ def interpretation_workflow(text: str, genre: str, learn_language, target_langua
 		yield "Error: Language not selected"
 	if genre.lower() in ["general", "news"]:
-		yield f"⏳ Generating interpretation for {genre}..."
 		result = get_interpretation(genre.lower(), GEMINI_API_KEY, text, learn_language, target_language)
 		yield result
 	else:
 		yield "not implemented yet"
-with gr.Blocks(theme=gr.themes.Soft(), css=CUSTOM_CSS) as demo:
-	gr.Markdown("# 📚 LogosAI - Language Professor Agent", elem_classes=["section-header"])
 	# --- API Key ---
 	with gr.Accordion("API Configuration", open=True):
@@ -103,7 +122,7 @@ with gr.Blocks(theme=gr.themes.Soft(), css=CUSTOM_CSS) as demo:
 	# --- Text Processing ---
 	gr.Markdown("---")
-	with gr.Tab("Text Processing"):
 		with gr.Row():
 			with gr.Column(scale=1):
@@ -113,20 +132,20 @@ with gr.Blocks(theme=gr.themes.Soft(), css=CUSTOM_CSS) as demo:
 					file_types=["image", ".pdf", ".txt"]
 					)
 				process_button = gr.Button("1. File Process (OCR/Read)", variant="primary")
-				ai_correct_button = gr.Button("2. AI Correct", variant="secondary")
 			with gr.Column(scale=2):
 				gr.Markdown("### Processed result")
 				with gr.Tabs():
 					with gr.Tab("Raw Text"):
 						text_display = gr.Textbox(
-							label="Raw Output / Editable Text",
 							lines=15,
 							max_lines=20,
 							show_copy_button=True,
 							value="",
 							interactive=True
 						)
-					with gr.Tab("Formatted View"):
 						text_markdown = gr.Markdown(
 							value="*Processed text will appear here...*\n\n",
 						)
@@ -146,14 +165,14 @@ with gr.Blocks(theme=gr.themes.Soft(), css=CUSTOM_CSS) as demo:
 	)
 	# --- Text Interpertation ---
-	with gr.Tab("🎓 Text Interpretation"):
 		gr.Markdown("### Configure Interpretation Settings")
 		with gr.Row():
 			with gr.Column(scale=1):
-				prof_language_seletor = gr.Radio(["EN", "ZH", "FR"], label="Prof's Language")
-				learn_language_seletor = gr.Radio(["EN", "ZH", "FR"], label="Language to Learn")
-				style_seletor = gr.Radio(["General", "Paper", "News", "Narrative", "Poem", "Philosophy"], label="Genre")
 				interpret_button = gr.Button("Generate Interpretation", variant="primary")
 			with gr.Column(scale=2):
@@ -169,5 +188,30 @@ with gr.Blocks(theme=gr.themes.Soft(), css=CUSTOM_CSS) as demo:
 		outputs=interpretation_output
 	)
 if __name__ == "__main__":
-	demo.launch(share=True)

 import gradio as gr
 from process.ocr import perform_raw_ocr, correct_text_with_ai
 from process.interpretation import get_interpretation
+from process.translation import get_tranlaton
 from process.gradio_css import CUSTOM_CSS
 		yield error_msg, error_msg + "\n\n"
+def interpretation_workflow(text: str, genre: str, learn_language: str, target_language: str):
 	if not GEMINI_API_KEY:
 		yield "Error: Gemini api key not found."
 		return
 		yield "Error: Language not selected"
 	if genre.lower() in ["general", "news"]:
+		yield f"⏳ Generating interpretation for genre: {[genre]}...(10s - 2min)"
 		result = get_interpretation(genre.lower(), GEMINI_API_KEY, text, learn_language, target_language)
 		yield result
 	else:
 		yield "not implemented yet"
+def translation_workflow(text: str, target_language: str):
+	if not GEMINI_API_KEY:
+		yield "Error: Gemini api key not found."
+		return
+	if not text or text.strip() == "":
+		yield "Error: Text is empty"
+		return
+	if not target_language:
+		yield "Error: Language not selected"
+	if target_language in ["Deutsch", "English", "Français", "Русский язык", "中文"]:
+		yield f"⏳ Generating interpretation for target_language: {[target_language]}..."
+		result = get_tranlaton(text, GEMINI_API_KEY, target_language)
+		yield result
+	else:
+		yield "not implemented yet"
+with gr.Blocks(theme=gr.themes.Monochrome(), css=CUSTOM_CSS) as demo:
+	gr.Markdown("# 📚 LogosAI - Intensive Reading in Any Language", elem_classes=["section-header"])
 	# --- API Key ---
 	with gr.Accordion("API Configuration", open=True):
 	# --- Text Processing ---
 	gr.Markdown("---")
+	with gr.Tab("Text"):
 		with gr.Row():
 			with gr.Column(scale=1):
 					file_types=["image", ".pdf", ".txt"]
 					)
 				process_button = gr.Button("1. File Process (OCR/Read)", variant="primary")
+				ai_correct_button = gr.Button("2. AI Correct", variant="primary")
 			with gr.Column(scale=2):
 				gr.Markdown("### Processed result")
 				with gr.Tabs():
 					with gr.Tab("Raw Text"):
 						text_display = gr.Textbox(
+							label="Raw Text(editable)",
 							lines=15,
 							max_lines=20,
 							show_copy_button=True,
 							value="",
 							interactive=True
 						)
+					with gr.Tab("Formatted Text"):
 						text_markdown = gr.Markdown(
 							value="*Processed text will appear here...*\n\n",
 						)
 	)
 	# --- Text Interpertation ---
+	with gr.Tab("🎓 Interpretation"):
 		gr.Markdown("### Configure Interpretation Settings")
 		with gr.Row():
 			with gr.Column(scale=1):
+				prof_language_seletor = gr.Dropdown(["DE", "EN", "FR", "RU", "ZH"], label="Prof's Language", value="EN")
+				learn_language_seletor = gr.Dropdown(["DE", "EN", "FR", "RU", "ZH"], label="Language to Learn", value="EN")
+				style_seletor = gr.Dropdown(["General", "Paper", "News", "Narrative", "Poem", "Philosophy"], label="Genre")
 				interpret_button = gr.Button("Generate Interpretation", variant="primary")
 			with gr.Column(scale=2):
 		outputs=interpretation_output
 	)
+	with gr.Tab("Translation"):
+		gr.Markdown("### Configure Translation Settings")
+		with gr.Row():
+			with gr.Column(scale=1):
+				target_language_selector = gr.Dropdown(
+					["Deutsch", "English", "Français", "Русский язык", "中文"],
+					value="English",
+					label="Target Language",
+					interactive=True)
+				translation_button = gr.Button("Translate!", variant="primary")
+			with gr.Column(scale=2):
+				interpretation_output = gr.Markdown(
+					value="*Translation will appear here ...*\n\n",
+					show_copy_button=True
+					)
+	translation_button.click(
+		fn=translation_workflow,
+		inputs=[text_display, target_language_selector],
+		outputs=interpretation_output
+	)
 if __name__ == "__main__":
+	demo.launch()

process/interpretation.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from google import genai
 from google.genai import types
-from process.sys_prompt import GENERAL_PROMPT ,NEWS_PROMPT
 NARRATIVE_PROMPT = ""
@@ -8,10 +8,10 @@ POEM_PROMPT = ""
 PHILO_PROMPT = ""
 def get_interpretation(genre: str,
-					   api_key: str,
-					   text: str,
-					   learn_language: str,
-					   prof_language: str) -> str:
 	if not api_key:
 		return "Error: Gemini API Key not found."
@@ -20,7 +20,7 @@ def get_interpretation(genre: str,
 	client = genai.Client(api_key=api_key)
-	lang_map ={"ZH": "Chinese", "EN": "English", "FR": "French"}
 	learn_lang = lang_map.get(learn_language.upper(), "English")
 	prof_lang = lang_map.get(prof_language.upper(), "English")
 	genres = {
@@ -30,10 +30,8 @@ def get_interpretation(genre: str,
 		"poem": POEM_PROMPT,
 		"philosophy": PHILO_PROMPT
 		}
-	if genre.lower() == "general":
-		sys_prompt = genres["general"].replace("[LEARN_LANGUAGE]", learn_lang).replace("[PROF_LANGUAGE]", prof_lang)
-	elif genre.lower() == "news":
-		sys_prompt = genres["news"].replace("[LEARN_LANGUAGE]", learn_lang).replace("[PROF_LANGUAGE]", prof_lang)
 	response = client.models.generate_content(
 		model="gemini-2.5-flash-preview-05-20",

 from google import genai
 from google.genai import types
+from process.sys_prompt import GENERAL_PROMPT, NEWS_PROMPT
 NARRATIVE_PROMPT = ""
 PHILO_PROMPT = ""
 def get_interpretation(genre: str,
+						api_key: str,
+						text: str,
+						learn_language: str,
+						prof_language: str) -> str:
 	if not api_key:
 		return "Error: Gemini API Key not found."
 	client = genai.Client(api_key=api_key)
+	lang_map ={"DE": "German", "EN": "English", "FR": "French", "RU":"Russian", "ZH": "Chinese"}
 	learn_lang = lang_map.get(learn_language.upper(), "English")
 	prof_lang = lang_map.get(prof_language.upper(), "English")
 	genres = {
 		"poem": POEM_PROMPT,
 		"philosophy": PHILO_PROMPT
 		}
+	if genre.lower() in ["general", "news"]:
+		sys_prompt = genres[genre.lower()].replace("[LEARN_LANGUAGE]", learn_lang).replace("[PROF_LANGUAGE]", prof_lang)
 	response = client.models.generate_content(
 		model="gemini-2.5-flash-preview-05-20",

process/ocr.py CHANGED Viewed

@@ -86,7 +86,10 @@ def correct_text_with_ai(text: str, api_key: str):
 def perform_raw_ocr(input_file, api_key):
-	file_ext = input_file.name.split('.')[-1].lower()
 	if file_ext == "txt":
 		with open(input_file, "r", encoding="utf-8") as f:

 def perform_raw_ocr(input_file, api_key):
+	if input_file != None:
+		file_ext = input_file.name.split('.')[-1].lower()
+	else:
+		return "File/Text not found"
 	if file_ext == "txt":
 		with open(input_file, "r", encoding="utf-8") as f:

process/translation.py ADDED Viewed

	@@ -0,0 +1,32 @@

+from google import genai
+from google.genai import types
+SYS_PROMPT_TRANSLATION = """
+You are an expert translator.
+Your sole purpose is to accurately and faithfully translate the provided text into the [TARGET_LANGUAGE].
+Do not add any extra information, explanations, or stylistic changes.
+Maintain the original meaning and tone as closely as possible.
+"""
+def get_tranlaton(text: str, api_key: str, target_language: str) -> str:
+	if not api_key:
+		return "Error: Gemini API Key not found."
+	if not text:
+		return "Error: text not found."
+	client = genai.Client(api_key=api_key)
+	lang_map = {"Deutsch": "German", "English": "English", "Français": "French", "Русский язык": "Russain", "中文": "Chinese"}
+	tar_lang = lang_map.get(target_language, "English")
+	sys_prompt = SYS_PROMPT_TRANSLATION.replace("[TARGET_LANGUAGE]", tar_lang)
+	response = client.models.generate_content(
+		model="gemini-2.5-flash-preview-05-20",
+		config=types.GenerateContentConfig(
+			system_instruction=sys_prompt,
+			temperature=0.1,
+			),
+		contents=[text]
+	)
+	return response.text