Spaces:

JunyiAcademy
/

question_image_to_text

Sleeping

App Files Community

youngtsai committed on May 17, 2024

Commit

ca6115f

1 Parent(s): a09f7b1

def text_to_json(text):

Browse files

Files changed (1) hide show

app.py +41 -63

app.py CHANGED Viewed

@@ -62,41 +62,22 @@ def process_image(image_url):
     print("======image_to_text=====")
     print(text)
     print("========================")
-    text_refine = text.replace("```json\n", "").replace("\n```", "")
-    question_json = json.loads(text_refine)
     return text, question_json
 def image_to_text(url):
     user_prompt = """
-        請解讀數學題目圖片，圖片請用 zh-TW 解讀
-        [數學用語、題目內的數字、選項上的數字、 數學符號、英文單字] 請一定要用 LATEX markdown 語法(前後用 $ 包起來)，LATEX 這很重要
-        輸出格式為 JSON 格式，包含以下欄位：
-        1. 題號：q_id (數字)
-        2. 題目：question
-        3. 選項：choice_1~choice_4
-        rule: only show the json text format of the response
-        restrictions:
-        - dont show the word:'json' in response
-        - dont show the word:'```' in response
-        EXAMPLE:
-        {{
-            "q_id" : 1,
-            "question": .......,
-            "choice_1": ....,
-            "choice_2": .... ,
-            "choice_3": ....,
-            "choice_4": ....
-        }}
     """
-    response_format = { "type": "json_object" }
     response = OPEN_AI_CLIENT.chat.completions.create(
-        model="gpt-4o",
-        messages=[
         {
           "role": "user",
           "content": [
@@ -111,45 +92,42 @@ def image_to_text(url):
               },
             },
           ],
-          "response_format": response_format
         }
       ],
-      max_tokens=4000,
     )
-    text = response.choices[0].message.content
-    return text
-# def text_to_json(text):
-#     system_prompt = """
-#     你是專業的轉譯器，看得懂題目，並保留 LATEX 語法($$)
-#     """
-#     user_prompt = """
-#       將以內容轉成 json，並保留 latex 語法($$)，請一定要用 LATEX markdown 語法(前後用 $ 包起來的形式)，包含 question 跟 choice 1~4
-#       {
-#       "q_id" : 1,
-#       "question": .......,
-#       "choice_1": ....,
-#       "choice_2": .... ,
-#       "choice_3": ....,
-#       "choice_4": ....
-#       }
-#       ---
-#     """
-#     user_prompt += text
-#     response_to_json = OPEN_AI_CLIENT.chat.completions.create(
-#       model="gpt-4o",
-#       response_format={ "type": "json_object" },
-#       messages=[
-#         {"role": "system", "content": system_prompt},
-#         {"role": "user", "content": user_prompt}
-#       ],
-#       max_tokens=1000,
-#     )
-#     result = response_to_json.choices[0].message.content
-#     return result
 def build_perseus_json(question_json):
     question = question_json['question']

     print("======image_to_text=====")
     print(text)
     print("========================")
+    question_json = json.loads(text_to_json(text))
     return text, question_json
 def image_to_text(url):
     user_prompt = """
+      請解讀數學題目圖片，圖片請用 zh-TW 解讀
+      [數學用語、題目內的數字、選項上的數字、 數學符號、英文單字] 請一定要用 LATEX markdown 語法(前後用 $ 包起來)，LATEX 這很重要
+      輸出為
+      1. 題號：
+      2. 題目：
+      3. 選項：
     """
     response = OPEN_AI_CLIENT.chat.completions.create(
+      model="gpt-4o",
+      messages=[
         {
           "role": "user",
           "content": [
               },
             },
           ],
         }
       ],
+      max_tokens=300,
+    )
+    return response.choices[0].message.content
+def text_to_json(text):  # Sends `text` to the chat model with a JSON-conversion prompt and returns the reply's message content unparsed (the caller runs json.loads on it).
+    system_prompt = """
+    你是專業的轉譯器，看得懂題目，並保留 LATEX 語法($$)
+    """  # system prompt (zh-TW), roughly: "you are a professional transcriber who understands the questions and preserves LaTeX syntax ($$)"
+    user_prompt = """
+      將以內容轉成 json，並保留 latex 語法($$)，請一定要用 LATEX markdown 語法(前後用 $ 包起來的形式)，包含 question 跟 choice 1~4
+      {
+      "q_id" : 1,
+      "question": .......,
+      "choice_1": ....,
+      "choice_2": .... ,
+      "choice_3": ....,
+      "choice_4": ....
+      }
+      ---
+    """  # user prompt (zh-TW): asks for JSON with q_id, question, choice_1..choice_4, keeping LaTeX wrapped in $...$. NOTE(review): "將以內容" looks like a typo for "將以下內容" ("the following content") - confirm before changing the prompt.
+    user_prompt += text  # the text to convert is appended after the "---" separator line of the prompt
+    response_to_json = OPEN_AI_CLIENT.chat.completions.create(  # OPEN_AI_CLIENT is defined outside this view
+      model="gpt-4o",
+      response_format={ "type": "json_object" },  # asks the API for a JSON-object reply rather than free text
+      messages=[
+        {"role": "system", "content": system_prompt},
+        {"role": "user", "content": user_prompt}
+      ],
+      max_tokens=1000,  # NOTE(review): a reply cut off at this cap would presumably not parse in the caller's json.loads - confirm 1000 is sufficient
     )
+    result = response_to_json.choices[0].message.content  # content of the first returned choice
+    return result
 def build_perseus_json(question_json):
     question = question_json['question']