Spaces:

ginigen
/

Every-Text

Runtime error

App Files Community

ginipick committed on Mar 18

Commit

15cc8b5

verified ·

1 Parent(s): f8cac3e

Update app.py

Browse files

Files changed (1) hide show

app.py +64 -25

app.py CHANGED Viewed

@@ -7,6 +7,8 @@ import base64
 import mimetypes
 import json
 import io
 import torch
 from PIL import Image
@@ -122,7 +124,7 @@ def generate_by_google_genai(text, file_name, model="gemini-2.0-flash-exp"):
     # 임시 파일로 이미지 받을 준비
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
         temp_path = tmp.name
-        # 응답 스트림을 받으면서 이미지/텍스트 구분 처리
         for chunk in client.models.generate_content_stream(
             model=model,
             contents=contents,
@@ -148,8 +150,28 @@ def generate_by_google_genai(text, file_name, model="gemini-2.0-flash-exp"):
     return image_path, text_response
 #######################################
-# 3. Gradio 함수
-#    (1) FLUX로 이미지 생성 -> (2) Google GenAI로 텍스트 교체
 #######################################
 def generate_initial_image(prompt, text, height, width, steps, scale, seed):
@@ -162,8 +184,7 @@ def generate_initial_image(prompt, text, height, width, steps, scale, seed):
         combined_prompt = prompt.replace("<text>", text)
     else:
         combined_prompt = f"{prompt} with clear readable text that says '{text}'"
-    # 디버그용: 최종 들어가는 프롬프트를 확인
     print(f"[DEBUG] Final combined_prompt: {combined_prompt}")
     with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16), timer("inference"):
@@ -183,47 +204,43 @@ def change_text_in_image(original_image, new_text):
     """
     Google GenAI의 gemini 모델을 통해,
     업로드된 이미지 내부의 문구를 `new_text`로 변경해주는 함수.
     """
     try:
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
             original_path = tmp.name
             original_image.save(original_path)
-        # Gemini 모델 호출
         image_path, text_response = generate_by_google_genai(
             text=f"Change the text in this image to: '{new_text}'",
             file_name=original_path
         )
         if image_path:
-            # Gradio 구버전에는 decode_base64_to_image가 없으므로 PIL로 처리
             with open(image_path, "rb") as f:
                 image_data = f.read()
             modified_img = Image.open(io.BytesIO(image_data))
             return modified_img, ""
         else:
-            # 이미지가 없이 텍스트만 반환된 경우
             return None, text_response
     except Exception as e:
         raise gr.Error(f"Error: {e}")
 #######################################
-# 4. Gradio 인터페이스 구성
 #######################################
-with gr.Blocks(title="Flux + Google GenAI Text Replacement") as demo:
     gr.Markdown(
         """
-        # Flux 기반 이미지 생성 + Google GenAI를 통한 텍스트 변환
-        **Usage**:
-        - You can include `<text>` in the prompt. For example:
-          `white cat with speech bubble says <text>`
-        - Then, type the actual text in "Text to Include in the Image" (ex: "Hello" or "안녕").
-        - If `<text>` is not found in your prompt, the text will be automatically appended as:
-          `with clear readable text that says '<text>'`.
-        - Finally, you can optionally change the text again via Gemini.
         ---
         """
@@ -253,25 +270,47 @@ with gr.Blocks(title="Flux + Google GenAI Text Replacement") as demo:
             generated_image = gr.Image(label="Generated Image (with text)", type="pil")
         with gr.Column():
-            gr.Markdown("## 2) Step 2: 생성된 이미지 내 텍스트 수정")
             new_text_input = gr.Textbox(
-                label="새로 바꿀 텍스트",
-                placeholder="예) Hello world"
             )
-            modify_btn = gr.Button("Change Text in Image via Gemini", variant="secondary")
             output_img = gr.Image(label="Modified Image", type="pil")
             output_txt = gr.Textbox(label="(If only text returned)")
-    # 버튼 액션 연결
     generate_btn.click(
         fn=generate_initial_image,
         inputs=[prompt_input, text_input, height, width, steps, scale, seed],
         outputs=[generated_image]
     )
-    modify_btn.click(
         fn=change_text_in_image,
-        inputs=[generated_image, new_text_input],
         outputs=[output_img, output_txt]
     )

 import mimetypes
 import json
 import io
+import random
+import string
 import torch
 from PIL import Image
     # 임시 파일로 이미지 받을 준비
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
         temp_path = tmp.name
+        # 응답 스트림 처리
         for chunk in client.models.generate_content_stream(
             model=model,
             contents=contents,
     return image_path, text_response
 #######################################
+# 3. 임의 알파벳 생성용 함수
+#######################################
+def generate_random_letters(length: int) -> str:
+    """
+    Build and return a random string of ASCII letters that is `length` characters long.
+    Each character is picked independently with random.choice() from the
+    uppercase and lowercase ASCII letters (A-Z, a-z).
+    A `length` of zero or less produces an empty string, because range(length) is empty.
+    """
+    letters = string.ascii_uppercase + string.ascii_lowercase
+    return "".join(random.choice(letters) for _ in range(length))
+def fill_text_input_with_random(new_text: str) -> str:
+    """
+    Count the characters in `new_text` (the "new replacement text" field) and
+    return a random ASCII-letter string of that same length.
+    Only the length of `new_text` is used; its content is discarded.
+    The returned value is what gets shown in the "text to include in the image"
+    UI field (= text_input).
+    """
+    length = len(new_text)
+    random_letters = generate_random_letters(length)
+    return random_letters
+#######################################
+# 4. Gradio 함수
 #######################################
 def generate_initial_image(prompt, text, height, width, steps, scale, seed):
         combined_prompt = prompt.replace("<text>", text)
     else:
         combined_prompt = f"{prompt} with clear readable text that says '{text}'"
     print(f"[DEBUG] Final combined_prompt: {combined_prompt}")
     with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16), timer("inference"):
     """
     Google GenAI의 gemini 모델을 통해,
     업로드된 이미지 내부의 문구를 `new_text`로 변경해주는 함수.
+    (여기서는 new_text가 이미 임의의 알파벳으로 채워진 상태가 됨)
     """
     try:
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
             original_path = tmp.name
             original_image.save(original_path)
         image_path, text_response = generate_by_google_genai(
             text=f"Change the text in this image to: '{new_text}'",
             file_name=original_path
         )
         if image_path:
             with open(image_path, "rb") as f:
                 image_data = f.read()
             modified_img = Image.open(io.BytesIO(image_data))
             return modified_img, ""
         else:
             return None, text_response
     except Exception as e:
         raise gr.Error(f"Error: {e}")
 #######################################
+# 5. Gradio 인터페이스 구성
 #######################################
+with gr.Blocks(title="Flux + Google GenAI + Random Text Replacement") as demo:
     gr.Markdown(
         """
+        # Flux 기반 이미지 생성 + Google GenAI + 임의 알파벳 치환
+        **기능 요약**
+        1) "새로 바꿀 텍스트"에 입력된 문자열 길이를 측정
+        2) 그 길이만큼 **무작위 알파벳**(대소문자)으로 구성된 문자열을 만들어
+        3) "이미지 안에 들어갈 텍스트" 칸에 자동으로 입력 (즉, 실제 바뀔 텍스트는 완전히 랜덤)
+        4) 그 후 Google GenAI(gemini)로 이미지 문자를 교체
         ---
         """
             generated_image = gr.Image(label="Generated Image (with text)", type="pil")
         with gr.Column():
+            gr.Markdown(
+                """
+                ## 2) Step 2: "새로 바꿀 텍스트" 길이를 기준으로
+                임의 알파벳을 "이미지 안에 들어갈 텍스트"로 자동 설정 → 이미지 교체
+                """
+            )
             new_text_input = gr.Textbox(
+                label="새로 바꿀 텍스트 (입력된 길이를 기준으로 무작위 알파벳 생성)",
+                placeholder="예) Hello123 (길이 8이면, 8글자 랜덤)"
             )
+            # (A) 먼저 "새로 바꿀 텍스트" 글자수를 세어, 무작위 알파벳으로 text_input 채우기
+            # (B) 그런 뒤 change_text_in_image() 실행
+            modify_btn = gr.Button("Generate Random Letters & Change Text in Image", variant="secondary")
+            # 최종 결과
             output_img = gr.Image(label="Modified Image", type="pil")
             output_txt = gr.Textbox(label="(If only text returned)")
+    ###########################
+    # 1) Step1 버튼 액션
+    ###########################
     generate_btn.click(
         fn=generate_initial_image,
         inputs=[prompt_input, text_input, height, width, steps, scale, seed],
         outputs=[generated_image]
     )
+    ###########################
+    # 2) Step2 버튼 액션
+    ###########################
+    # (A) 무작위 알파벳 생성해 text_input에 반영
+    chain = modify_btn.click(
+        fn=fill_text_input_with_random,
+        inputs=[new_text_input],
+        outputs=[text_input]
+    )
+    # (B) 방금 업데이트된 text_input 값을 이용해, 이미지 텍스트 교체
+    chain.then(
         fn=change_text_in_image,
+        inputs=[generated_image, text_input],
         outputs=[output_img, output_txt]
     )