wayne0603 committed on
Commit
a67409b
·
verified ·
1 Parent(s): 0f0afda

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -3
app.py CHANGED
@@ -32,22 +32,27 @@ index = None
32
  docs = []
33
 
34
  # ===== 文件解析函数 =====
 
 
35
  def load_file(file_obj):
36
  global index, docs
37
  docs = []
38
  text_data = ""
39
 
40
- ext = os.path.splitext(file_obj.name)[1].lower()
 
 
41
 
42
  try:
43
  if ext == ".pdf":
44
- reader = PdfReader(file_obj.name)
45
  for page in reader.pages:
46
  page_text = page.extract_text()
47
  if page_text:
48
  text_data += page_text + "\n"
49
  elif ext == ".txt":
50
- text_data = file_obj.read().decode("utf-8", errors="ignore")
 
51
  else:
52
  return "仅支持 PDF 或 TXT 文件", None
53
  except Exception as e:
@@ -66,6 +71,7 @@ def load_file(file_obj):
66
  index.add(doc_embeddings)
67
 
68
  return f"已加载 {len(docs)} 个文本块", None
 
69
  # ===== RAG 查询函数 =====
70
  def rag_query(query):
71
  if index is None:
 
32
  docs = []
33
 
34
  # ===== 文件解析函数 =====
35
+
36
+
37
  def load_file(file_obj):
38
  global index, docs
39
  docs = []
40
  text_data = ""
41
 
42
+ # 获取文件路径
43
+ file_path = file_obj.name if hasattr(file_obj, "name") else file_obj
44
+ ext = os.path.splitext(file_path)[1].lower()
45
 
46
  try:
47
  if ext == ".pdf":
48
+ reader = PdfReader(file_path)
49
  for page in reader.pages:
50
  page_text = page.extract_text()
51
  if page_text:
52
  text_data += page_text + "\n"
53
  elif ext == ".txt":
54
+ with open(file_path, "r", encoding="utf-8", errors="ignore") as f:
55
+ text_data = f.read()
56
  else:
57
  return "仅支持 PDF 或 TXT 文件", None
58
  except Exception as e:
 
71
  index.add(doc_embeddings)
72
 
73
  return f"已加载 {len(docs)} 个文本块", None
74
+
75
  # ===== RAG 查询函数 =====
76
  def rag_query(query):
77
  if index is None: