Spaces:

ChingCL
/

20122013

Sleeping

App Files Community

ChingCL committed on Aug 16, 2024

Commit

4d3db91

verified ·

1 Parent(s): 8598697

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -30

app.py CHANGED Viewed

@@ -1,44 +1,28 @@
 import gradio as gr
 import pandas as pd
 import re
-# 第一個檢查：檢查$符號前後是否有空格
-def check_spacing_around_dollar(df):
-    errors = []
-    for i, row in df.iterrows():
-        for col in df.columns:
-            text = str(row[col])
-            matches = list(re.finditer(r'(\s?\$\S*?\s?|\s?\S*?\$)', text))
-            for match in matches:
-                if not (text[match.start() - 1] == ' ' and text[match.end()] == ' '):
-                    errors.append(f"行 {i+1} 列 '{col}': '{text}'")
-    return errors
-# 第二個檢查：檢查$符號之間是否有空格
-def check_spacing_between_dollars(df):
-    errors = []
-    for i, row in df.iterrows():
-        for col in df.columns:
-            text = str(row[col])
-            matches = list(re.finditer(r'\$\S+?(?=\$)', text))
-            for match in matches:
-                if text[match.end()] != ' ' and text[match.start() - 1] != ' ':
-                    errors.append(f"行 {i+1} 列 '{col}': '{text}'")
-    return errors
-# 第三個檢查：檢查數字前後是否有$
-def check_numbers_surrounded_by_dollar(df):
     errors = []
     for i, row in df.iterrows():
         for col in df.columns:
-            text = str(row[col])
-            matches = list(re.finditer(r'\b\d+\b', text))
             for match in matches:
-                if not (text[match.start() - 1] == '$' and text[match.end()] == '$'):
                     errors.append(f"行 {i+1} 列 '{col}': '{text}'")
     return errors
-# 處理檔案並執行檢查
 def process_file(file):
     if file.name.endswith('.csv'):
         df = pd.read_csv(file.name)
@@ -58,7 +42,6 @@ def process_file(file):
         "第三個檢查": errors3
     }
-# Gradio 介面
 iface = gr.Interface(
     fn=process_file,
     inputs=gr.File(label="上傳 CSV 或 XLSX 檔案"),

 import gradio as gr
 import pandas as pd
 import re
+import json
+def extract_text_from_json(text):
+    try:
+        data = json.loads(text)
+        if isinstance(data, dict) and 'question' in data:
+            return data['question']['content']
+    except json.JSONDecodeError:
+        return text
+    return text
+def check_spacing_around_dollar(df):
     errors = []
     for i, row in df.iterrows():
         for col in df.columns:
+            text = extract_text_from_json(str(row[col]))
+            matches = re.finditer(r'(\$\S+|\S+\$)', text)
             for match in matches:
+                if (match.start() > 0 and text[match.start() - 1] != ' ') or (match.end() < len(text) and text[match.end()] != ' '):
                     errors.append(f"行 {i+1} 列 '{col}': '{text}'")
     return errors
 def process_file(file):
     if file.name.endswith('.csv'):
         df = pd.read_csv(file.name)
         "第三個檢查": errors3
     }
 iface = gr.Interface(
     fn=process_file,
     inputs=gr.File(label="上傳 CSV 或 XLSX 檔案"),