Spaces:

Curify
/

manga_translation

Runtime error

File size: 3,862 Bytes

94373b1
0dea357
94373b1
 
51f4c53
0cc8e22
8b00075
8ab5188
0cc8e22
94373b1
11f2eae
 
 
41abb42
11f2eae
 
41abb42
 
 
 
 
46c683e
11f2eae
 
 
 
46c683e
 
 
 
 
 
11f2eae
46c683e
 
 
 
 
 
 
 
 
41abb42
46c683e
8c6ca99
11f2eae
46c683e
 
 
 
 
fbb8ef8
46c683e
11f2eae
0438fe3
46c683e
 
fbb8ef8
8c6ca99
46c683e
 
 
 
11f2eae
94373b1
955e685
46c683e
 
9a92885
46c683e
955e685
46c683e
2722237
 
94373b1
d179d12
955e685
46c683e
d179d12
955e685
46c683e
94373b1
46c683e
 
94373b1
 
 
46c683e
94373b1
46c683e
 
2722237
 
46c683e
94373b1
46c683e
 
955e685
46c683e
 
94373b1
955e685

import gradio as gr
import numpy as np
import os
from io import BytesIO
from PIL import Image, ImageDraw, ImageFont
from utils.azure_translate import translate_text_azure
from utils.image_utils import split_image, encode_image_to_html
from utils.ocr_utils import extract_and_translate_chunk
from utils.polygon_utils import draw_translated_text_convex, render_translated_chunk

def load_and_split_image(file_obj, num_chunks):
    from PIL import Image
    import os
    if file_obj is not None:
        image_path = file_obj.name if hasattr(file_obj, 'name') else file_obj
        filename = os.path.basename(image_path)
    else:
        image_path = "00_sample.jpg"
        filename = "00_sample.jpg"

    image = Image.open(image_path).convert("RGB")
    chunks = split_image(image, num_chunks)
    return filename, image, chunks

def pipeline(file_obj, num_chunks):
    filename, image, chunks = load_and_split_image(file_obj, num_chunks)

    all_translations = []
    all_tables = []
    translated_images = []

    for chunk in chunks:
        translations = extract_and_translate_chunk(chunk)
        table_data = [[t["original"], t["translated"]] for t in translations]
        all_translations.append(translations)
        all_tables.extend(table_data)
        translated_img = render_translated_chunk(chunk, translations)
        translated_images.append(translated_img)

    original_html = "".join([encode_image_to_html(c) for c in chunks])
    translated_html = "".join([encode_image_to_html(t) for t in translated_images])

    return filename, original_html, translated_html, all_tables, all_translations

def update_and_render(file_obj, translations, updated_table, num_chunks, font_scale=1.0):
    _, image, chunks = load_and_split_image(file_obj, num_chunks)
    new_images = []

    index = 0
    for i, chunk in enumerate(chunks):
        updated_translations = []
        for j in range(len(translations[i])):
            updated_translations.append({
                "translated": updated_table.iloc[index, 1],
                "polygon": translations[i][j]["polygon"]
            })
            index += 1

        new_image = render_translated_chunk(chunk, updated_translations, font_path="NotoSansSC-Regular.ttf", font_scale=font_scale)
        new_images.append(new_image)

    translated_html = "".join([encode_image_to_html(t) for t in new_images])
    return translated_html
    
with gr.Blocks() as demo:
    gr.Markdown("# 🄹 Manga Translator with OCR & Azure")

    with gr.Row():
        file_input = gr.File(label="Upload Manga Image", type="filepath", file_types=[".jpg", ".png"])
        chunk_slider = gr.Slider(1, 10, value=4, step=1, label="Split into X Chunks")
        font_scale_slider = gr.Slider(0.5, 2.0, value=1.0, step=0.05, label="Font Size Scale")

    filename_display = gr.Textbox(label="📂 Uploaded File", interactive=False)

    with gr.Row():
        with gr.Column():
            gr.Markdown("### 📅 Original Preview (Scrollable, Fixed Height)")
            original_html = gr.HTML()
        with gr.Column():
            gr.Markdown("### 🄯 Translated Preview (Scrollable, Fixed Height)")
            translated_html = gr.HTML()

    translation_table = gr.Dataframe(headers=["Original", "Translated"], interactive=True)
    translations_state = gr.State()

    with gr.Row():
        translate_btn = gr.Button("Extract & Translate")
        render_btn = gr.Button("Apply Manual Edits")

    translate_btn.click(
        fn=pipeline,
        inputs=[file_input, chunk_slider],
        outputs=[filename_display, original_html, translated_html, translation_table, translations_state]
    )

    render_btn.click(
        fn=update_and_render,
        inputs=[file_input, translations_state, translation_table, chunk_slider, font_scale_slider],
        outputs=translated_html
    )

    demo.launch()