DocUA committed on
Commit
f7c3947
·
1 Parent(s): 03c4021

feat: remove temperature parameter from UI and hardcode inference temperature to 0.0

Browse files
Files changed (2) hide show
  1. LightOnOCR-1B-Demo +1 -1
  2. hf_space/app.py +9 -16
LightOnOCR-1B-Demo CHANGED
@@ -1 +1 @@
1
- Subproject commit 625560a9e67d828b7561e830fb258b221ce29ee7
 
1
+ Subproject commit 394149f9369a36c1654e32e50356409c68447727
hf_space/app.py CHANGED
@@ -55,14 +55,15 @@ def process_pdf(pdf_path, num_pages=1, scale=2.0):
55
  return images, total_pages
56
 
57
  @spaces.GPU(duration=120) # Increase duration for OCR
58
- def run_inference(image, temperature, max_tokens):
59
  """Run inference on GPU."""
60
  global BACKEND
61
  if BACKEND is None:
62
  load_backend()
63
- return BACKEND.process_image(image, temperature=temperature, max_tokens=max_tokens)
64
 
65
- def process_input(file_input, scale, temperature, max_tokens, num_pages):
 
66
  """Process uploaded file with OCR."""
67
  if file_input is None:
68
  yield "Idle", "Please upload an image or PDF first.", "", "", None
@@ -71,7 +72,8 @@ def process_input(file_input, scale, temperature, max_tokens, num_pages):
71
  images_to_process = []
72
  page_info = ""
73
  display_image = None
74
-
 
75
  file_path = Path(file_input) if isinstance(file_input, str) else Path(file_input.name)
76
  if not file_path.exists():
77
  yield "Error", f"File not accessible: {file_path}", "", "", None
@@ -107,8 +109,8 @@ def process_input(file_input, scale, temperature, max_tokens, num_pages):
107
  for i, img in enumerate(images_to_process):
108
  try:
109
  print(f"Processing page {i+1}/{len(images_to_process)}...")
110
- # Run inference on GPU
111
- text = run_inference(img, temperature=temperature, max_tokens=max_tokens)
112
  all_texts.append(text.strip())
113
 
114
  # Update progress
@@ -179,15 +181,6 @@ with gr.Blocks(title="📖 LightOnOCR-1B Demo", theme=gr.themes.Soft()) as demo:
179
  label="PDF Pages",
180
  info="Number of pages to process (max 10)"
181
  )
182
-
183
- temperature = gr.Slider(
184
- minimum=0.0,
185
- maximum=1.0,
186
- value=0.1,
187
- step=0.05,
188
- label="Temperature",
189
- info="0 = deterministic"
190
- )
191
 
192
  page_info = gr.Textbox(
193
  label="Processing Info",
@@ -221,7 +214,7 @@ with gr.Blocks(title="📖 LightOnOCR-1B Demo", theme=gr.themes.Soft()) as demo:
221
  # Event handlers
222
  submit_btn.click(
223
  fn=process_input,
224
- inputs=[file_input, scale_slider, temperature, max_tokens_slider, num_pages],
225
  outputs=[status_display, output_text, raw_output, page_info, rendered_image]
226
  )
227
 
 
55
  return images, total_pages
56
 
57
  @spaces.GPU(duration=120) # Increase duration for OCR
58
+ def run_inference(image, max_tokens):
59
  """Run inference on GPU."""
60
  global BACKEND
61
  if BACKEND is None:
62
  load_backend()
63
+ return BACKEND.process_image(image, temperature=0.0, max_tokens=max_tokens)
64
 
65
+
66
+ def process_input(file_input, scale, max_tokens, num_pages):
67
  """Process uploaded file with OCR."""
68
  if file_input is None:
69
  yield "Idle", "Please upload an image or PDF first.", "", "", None
 
72
  images_to_process = []
73
  page_info = ""
74
  display_image = None
75
+
76
+ # ... (rest of image loading logic same as before, simplified for diff clarity)
77
  file_path = Path(file_input) if isinstance(file_input, str) else Path(file_input.name)
78
  if not file_path.exists():
79
  yield "Error", f"File not accessible: {file_path}", "", "", None
 
109
  for i, img in enumerate(images_to_process):
110
  try:
111
  print(f"Processing page {i+1}/{len(images_to_process)}...")
112
+ # Run inference on GPU (hardcoded temp=0.0)
113
+ text = run_inference(img, max_tokens=max_tokens)
114
  all_texts.append(text.strip())
115
 
116
  # Update progress
 
181
  label="PDF Pages",
182
  info="Number of pages to process (max 10)"
183
  )
 
 
 
 
 
 
 
 
 
184
 
185
  page_info = gr.Textbox(
186
  label="Processing Info",
 
214
  # Event handlers
215
  submit_btn.click(
216
  fn=process_input,
217
+ inputs=[file_input, scale_slider, max_tokens_slider, num_pages],
218
  outputs=[status_display, output_text, raw_output, page_info, rendered_image]
219
  )
220