Spaces:

chatbotMOAI
/

MOAI

Sleeping

wenbemi committed on Aug 21, 2025

Commit

80b6b64

verified ·

1 Parent(s): a225344

Update chat_a.py

Files changed (1) hide show

chat_a.py CHANGED Viewed

@@ -2,7 +2,7 @@
 # coding: utf-8
 # In[10]:
-import os, io, pandas as pd
 from huggingface_hub import hf_hub_download
 import pandas as pd
 import torch
@@ -33,17 +33,21 @@ def _read_csv_bytes(b: bytes) -> pd.DataFrame:
     except UnicodeDecodeError:
         return pd.read_csv(io.BytesIO(b), encoding="cp949")
-def load_csv_smart(local_path: str, hub_filename: str,
-                   repo_id: str = HF_DATASET_REPO, repo_type: str = "dataset",
-                   revision: str = HF_DATASET_REV) -> pd.DataFrame:
-    # 1) 로컬 우선
     if os.path.exists(local_path):
         with open(local_path, "rb") as f:
             data = f.read()
         if not _is_pointer_bytes(data):
-            return _read_csv_bytes(data)
-        # 포인터면 허브로 폴백
-    # 2) 허브 다운로드
     cached = hf_hub_download(repo_id=repo_id, filename=hub_filename,
                              repo_type=repo_type, revision=revision)
     try:

 # coding: utf-8
 # In[10]:
+import os, io
 from huggingface_hub import hf_hub_download
 import pandas as pd
 import torch
     except UnicodeDecodeError:
         return pd.read_csv(io.BytesIO(b), encoding="cp949")
+def load_csv_smart(local_path: str,
+                   hub_filename: str | None = None,
+                   repo_id: str = HF_DATASET_REPO,
+                   repo_type: str = "dataset",
+                   revision: str = HF_DATASET_REV):
+    if hub_filename is None:
+        hub_filename = os.path.basename(local_path)
     if os.path.exists(local_path):
         with open(local_path, "rb") as f:
             data = f.read()
         if not _is_pointer_bytes(data):
+            try:
+                return pd.read_csv(io.BytesIO(data), encoding="utf-8")
+            except UnicodeDecodeError:
+                return pd.read_csv(io.BytesIO(data), encoding="cp949")
     cached = hf_hub_download(repo_id=repo_id, filename=hub_filename,
                              repo_type=repo_type, revision=revision)
     try: