Spaces:

Di12
/

sentiment_analysis

Sleeping

App Files Community

Di12 committed on Jul 2, 2025

Commit

6a3a140

verified ·

1 Parent(s): a2f3484

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -3

app.py CHANGED Viewed

@@ -12,6 +12,7 @@ import gradio as gr
 from huggingface_hub import hf_hub_download
 import io
 import matplotlib.pyplot as plt
 # Device configuration: consistent device for model and tensors
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
@@ -221,14 +222,17 @@ def process_input(text_input, file):
         comments = [p.strip() for p in parts if p and p.strip()]
     elif file:
-        # Đọc file CSV hoặc TXT
         if isinstance(file, str):
             # file path
             if file.lower().endswith('.csv'):
                 content = open(file, 'r', encoding='utf-8', errors='ignore').read()
                 lines = content.splitlines()
                 comments = [line.strip() for line in lines if line.strip()]
             else:
                 content = open(file, 'r', encoding='utf-8').read()
                 parts = re.split(r'[.?!]\s*|\n+', content)
@@ -283,7 +287,7 @@ with gr.Blocks() as demo:
     gr.Markdown("Nhập bình luận:")
     text_input = gr.Textbox(lines=6, placeholder="Nhập bình luận tại đây...", label="")
     gr.Markdown("Hoặc tải lên tệp .txt hoặc .csv chứa các bình luận:")
-    file_input = gr.File(label="Tải tệp", file_types=[".txt", ".csv"])
     predict_button = gr.Button("Dự đoán")
     output_table = gr.Dataframe(headers=["Comment", "Dự đoán", 'Khả năng tiêu cực', 'Khả năng bình thường', 'Khả năng tích cực'],
                                 interactive=False,

 from huggingface_hub import hf_hub_download
 import io
 import matplotlib.pyplot as plt
+from docx import Document
 # Device configuration: consistent device for model and tensors
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
         comments = [p.strip() for p in parts if p and p.strip()]
     elif file:
         if isinstance(file, str):
             # file path
             if file.lower().endswith('.csv'):
                 content = open(file, 'r', encoding='utf-8', errors='ignore').read()
                 lines = content.splitlines()
                 comments = [line.strip() for line in lines if line.strip()]
+            elif file.lower().endswith('.docx'):
+                doc = Document(file)
+                content = "\n".join([p.text for p in doc.paragraphs])
+                parts = re.split(r'[.?!]\s*|\n+', content)
+                comments = [p.strip() for p in parts if p.strip()]
             else:
                 content = open(file, 'r', encoding='utf-8').read()
                 parts = re.split(r'[.?!]\s*|\n+', content)
     gr.Markdown("Nhập bình luận:")
     text_input = gr.Textbox(lines=6, placeholder="Nhập bình luận tại đây...", label="")
     gr.Markdown("Hoặc tải lên tệp .txt hoặc .csv chứa các bình luận:")
+    file_input = gr.File(label="Tải tệp", file_types=[".txt", ".csv", ".docx"])
     predict_button = gr.Button("Dự đoán")
     output_table = gr.Dataframe(headers=["Comment", "Dự đoán", 'Khả năng tiêu cực', 'Khả năng bình thường', 'Khả năng tích cực'],
                                 interactive=False,