Spaces:

Adun
/

typhoon-ocr-finetuned-v1.x

Running on Zero

App Files Community

Adun committed on Jun 29

Commit

d482a87

verified ·

1 Parent(s): 0b31002

Upload app.py

Browse files

Files changed (1) hide show

app.py +9 -6

app.py CHANGED Viewed

@@ -35,6 +35,8 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
 device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 # Load Adun/typhoon_ocr-7B-v1.4
 MODEL_ID_M = "Adun/typhoon_ocr-7B-v1.4"
 processor_m = AutoProcessor.from_pretrained(MODEL_ID_M, trust_remote_code=True)
@@ -103,14 +105,14 @@ def downsample_video(video_path):
 @spaces.GPU
 def generate_image(model_name: str, text: str, image: Image.Image,
-                   max_new_tokens: int = 1024,
-                   temperature: float = 0.6,
                    top_p: float = 0.9,
                    top_k: int = 50,
                    repetition_penalty: float = 1.2):
     """Generate responses for image input using the selected model."""
     # Model selection
-    if model_name == "Adun/Typhoon-OCR-7B-1.4":
         processor = processor_m
         model = model_m
     # elif model_name == "MonkeyOCR-Recognition":
@@ -196,8 +198,9 @@ def generate_video(model_name: str, text: str, video_path: str,
                    top_k: int = 50,
                    repetition_penalty: float = 1.2):
     """Generate responses for video input using the selected model."""
     # Model selection
-    if model_name == "Adun/typhoon_ocr-7B-v1.4":
         processor = processor_m
         model = model_m
     # elif model_name == "MonkeyOCR-Recognition":
@@ -333,9 +336,9 @@ with gr.Blocks(css=css, theme="bethecloud/storj_theme") as demo:
         with gr.Column():
             output = gr.Textbox(label="Output", interactive=False, lines=3, scale=2)
             model_choice = gr.Radio(
-                choices=["Adun/typhoon_ocr-7B-v1.4", "Typhoon-OCR-7B"],
                 label="Select Model",
-                value="Adun/typhoon_ocr-7B-v1.4"
             )
             gr.Markdown("**Model Info 💻** | [Report Bug](https://huggingface.co/spaces/Adun/typhoon-ocr-finetuned-v1.x/discussions)")

 device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+model_name = "typhoon_ocr-7B-v1.4(finetuned)"
 # Load Adun/typhoon_ocr-7B-v1.4
 MODEL_ID_M = "Adun/typhoon_ocr-7B-v1.4"
 processor_m = AutoProcessor.from_pretrained(MODEL_ID_M, trust_remote_code=True)
 @spaces.GPU
 def generate_image(model_name: str, text: str, image: Image.Image,
+                   max_new_tokens: int = 2048,
+                   temperature: float = 0.1,
                    top_p: float = 0.9,
                    top_k: int = 50,
                    repetition_penalty: float = 1.2):
     """Generate responses for image input using the selected model."""
     # Model selection
+    if model_name == "typhoon_ocr-7B-v1.4(finetuned)":
         processor = processor_m
         model = model_m
     # elif model_name == "MonkeyOCR-Recognition":
                    top_k: int = 50,
                    repetition_penalty: float = 1.2):
     """Generate responses for video input using the selected model."""
     # Model selection
+    if model_name == "typhoon_ocr-7B-v1.4(finetuned)":
         processor = processor_m
         model = model_m
     # elif model_name == "MonkeyOCR-Recognition":
         with gr.Column():
             output = gr.Textbox(label="Output", interactive=False, lines=3, scale=2)
             model_choice = gr.Radio(
+                choices=["typhoon_ocr-7B-v1.4(finetuned)", "Typhoon-OCR-7B"],
                 label="Select Model",
+                value="typhoon_ocr-7B-v1.4(finetuned)"
             )
             gr.Markdown("**Model Info 💻** | [Report Bug](https://huggingface.co/spaces/Adun/typhoon-ocr-finetuned-v1.x/discussions)")