GiantPandas committed on
Commit
2502d01
·
verified ·
1 Parent(s): ac1f276

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +42 -24
app.py CHANGED
@@ -54,6 +54,27 @@ preset_prompts = [
54
  "Reformat this document as Markdown with clear sections and lists.",
55
  ]
56
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
 
58
  def send_pdf_to_parse(file_path, server_ip, port, route="/upload", api_key=None):
59
  url = f"{openai_api_base}{route}"
@@ -66,9 +87,6 @@ def send_pdf_to_parse(file_path, server_ip, port, route="/upload", api_key=None)
66
  response = requests.post(url, files=files, headers=headers)
67
  return response
68
 
69
-
70
-
71
-
72
  async def send_pdf_async_aiohttp(file_path, server_ip, route="/upload", Authorization=None):
73
  """使用aiohttp异步发送PDF"""
74
  url = f"{server_ip}{route}"
@@ -95,32 +113,16 @@ def extract_makrdown(text):
95
  return m.group(1).strip()
96
  else:
97
  return text
 
98
 
99
- openai_api_key = "EMPTY"
100
-
101
- openai_api_base = os.environ.get("openai_api_base")
102
-
103
- IP = os.environ.get("IP")
104
-
105
- PORT = os.environ.get("PORT")
106
-
107
- Authorization = os.environ.get("Authorization")
108
-
109
- client = AsyncOpenAI(
110
- api_key=openai_api_key,
111
- base_url=openai_api_base + "/v1",
112
- http_client=httpx.AsyncClient(verify=False)
113
- )
114
-
115
-
116
- async def request(messages):
117
 
118
  chat_completion_from_base64 = await client.chat.completions.create(
119
  messages=messages,
120
  extra_headers={
121
  "Authorization": f"Bearer {Authorization}"
122
  },
123
- model="Qwen2_5VL",
124
  max_completion_tokens=4096,
125
  stream=True,
126
  temperature=0.0,
@@ -204,7 +206,10 @@ def download_markdown_file(md_text):
204
  return str(filepath)
205
 
206
 
207
- async def doc_parser(doc_path, prompt):
 
 
 
208
 
209
  doc_path = Path(doc_path)
210
  if not doc_path.is_file():
@@ -231,7 +236,7 @@ async def doc_parser(doc_path, prompt):
231
  all_pages_raw = []
232
  for query in queries:
233
  pages = ""
234
- async for chunk in request(query):
235
  pages += chunk
236
  yield extract_makrdown(pages), pages
237
  all_pages.append(extract_makrdown(pages))
@@ -417,6 +422,15 @@ if __name__ == '__main__':
417
  ]
418
 
419
  with gr.Column(variant='panel', scale=5):
 
 
 
 
 
 
 
 
 
420
  with gr.Accordion("Examples", open=True):
421
  example_root = "examples"
422
  file_path = [
@@ -520,6 +534,10 @@ if __name__ == '__main__':
520
  fn=doc_parser,
521
  inputs=[file, prompts],
522
  outputs=[md, md_text]
 
 
 
 
523
  )
524
 
525
  clear_bu.add([file, md, md_text])
 
54
  "Reformat this document as Markdown with clear sections and lists.",
55
  ]
56
 
57
+ openai_api_key = "EMPTY"
58
+
59
+ AVAILABLE_MODELS = {
60
+ "infinity_parser1": {
61
+ "name": os.environ.get("infinity_parser1_name"),
62
+ "client": AsyncOpenAI(
63
+ api_key=openai_api_key,
64
+ base_url=os.environ.get("infinity_parser1_api") + "/v1",
65
+ ),
66
+ "Authorization": os.environ.get("infinity_parser1_Authorization")
67
+
68
+ },
69
+ "infinity_parser2": {
70
+ "name": os.environ.get("infinity_parser2_name"),
71
+ "client": AsyncOpenAI(
72
+ api_key=openai_api_key,
73
+ base_url=os.environ.get("infinity_parser2_api") + "/v1",
74
+ ),
75
+ "Authorization": os.environ.get("infinity_parser2_Authorization")
76
+ }
77
+ }
78
 
79
  def send_pdf_to_parse(file_path, server_ip, port, route="/upload", api_key=None):
80
  url = f"{openai_api_base}{route}"
 
87
  response = requests.post(url, files=files, headers=headers)
88
  return response
89
 
 
 
 
90
  async def send_pdf_async_aiohttp(file_path, server_ip, route="/upload", Authorization=None):
91
  """使用aiohttp异步发送PDF"""
92
  url = f"{server_ip}{route}"
 
113
  return m.group(1).strip()
114
  else:
115
  return text
116
+
117
 
118
+ async def request(messages, model_name, client, Authorization):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
119
 
120
  chat_completion_from_base64 = await client.chat.completions.create(
121
  messages=messages,
122
  extra_headers={
123
  "Authorization": f"Bearer {Authorization}"
124
  },
125
+ model=model_name,
126
  max_completion_tokens=4096,
127
  stream=True,
128
  temperature=0.0,
 
206
  return str(filepath)
207
 
208
 
209
+ async def doc_parser(doc_path, prompt, model_id):
210
+ model_name = AVAILABLE_MODELS[model_id]["name"]
211
+ client = AVAILABLE_MODELS[model_id]["client"]
212
+ Authorization = AVAILABLE_MODELS[model_id]["Authorization"]
213
 
214
  doc_path = Path(doc_path)
215
  if not doc_path.is_file():
 
236
  all_pages_raw = []
237
  for query in queries:
238
  pages = ""
239
+ async for chunk in request(query, model_name, client, Authorization):
240
  pages += chunk
241
  yield extract_makrdown(pages), pages
242
  all_pages.append(extract_makrdown(pages))
 
422
  ]
423
 
424
  with gr.Column(variant='panel', scale=5):
425
+
426
+ model_selector = gr.Dropdown(
427
+ choices=[(v["name"], k) for k, v in AVAILABLE_MODELS.items()],
428
+ value=list(AVAILABLE_MODELS.keys())[0], # 默认选择第一个模型
429
+ label="Model Selection",
430
+ info="Select the model to use for parsing",
431
+ interactive=True,
432
+ )
433
+
434
  with gr.Accordion("Examples", open=True):
435
  example_root = "examples"
436
  file_path = [
 
534
  fn=doc_parser,
535
  inputs=[file, prompts],
536
  outputs=[md, md_text]
537
+ ).then(
538
+ fn=doc_parser,
539
+ inputs=[file, prompts, model_selector],
540
+ outputs=[md, md_text]
541
  )
542
 
543
  clear_bu.add([file, md, md_text])