Spaces:

phongnt251199
/

SentimentModel

Running

App Files Files Community

T-Phong commited on 4 days ago

Commit

b0cb70a

1 Parent(s): 5d72cee

update log

Browse files

Files changed (2) hide show

app.py +23 -4
model.py +22 -4

app.py CHANGED Viewed

@@ -1,5 +1,11 @@
 from flask import Flask, request, jsonify
 from flask_cors import CORS
 from model import predict_sentiment_3sentiment, predict_sentiment_5sentiment
 import pandas as pd
@@ -18,22 +24,29 @@ def predict():
     """
     # Lấy dữ liệu JSON từ request
     json_data = request.get_json()
     # Kiểm tra xem key 'text' có tồn tại và không rỗng không
     if not json_data or 'text' not in json_data or not json_data.get('text', '').strip():
         return jsonify({"error": "Vui lòng cung cấp trường 'text' trong request body."}), 400
     # Kiểm tra xem key 'type' có tồn tại và không rỗng không
     if not json_data or 'type' not in json_data or not json_data.get('type', '').strip():
         return jsonify({"error": "Vui lòng cung cấp trường 'type' trong request body."}), 400
     # Lấy văn bản từ dữ liệu
     text_to_predict = json_data['text']
     sentiment_type = json_data['type']
     # Gọi hàm dự đoán từ model
-    if sentiment_type == "3sentiment":
-        sentiment, score = predict_sentiment_3sentiment(text_to_predict)
-    elif sentiment_type == "5sentiment":
-        sentiment, score = predict_sentiment_5sentiment(text_to_predict)
     # Tạo response
     response = {
@@ -57,22 +70,27 @@ def predict_batch():
     """
     # 1. Kiểm tra xem có file trong request không
     if 'file' not in request.files:
         return jsonify({"error": "Không tìm thấy file trong request (key phải là 'file')."}), 400
     # Dữ liệu form đi kèm với file sẽ nằm trong request.form
     sentiment_type = request.form.get('type')
     # Kiểm tra xem key 'type' có tồn tại và không rỗng không
     if not sentiment_type or sentiment_type.strip() not in ["3sentiment", "5sentiment"]:
         return jsonify({"error": "Vui lòng cung cấp trường 'type' (3sentiment hoặc 5sentiment) trong form data."}), 400
     file = request.files['file']
     # 2. Kiểm tra xem người dùng có chọn file không
     if file.filename == '':
         return jsonify({"error": "Chưa chọn file nào."}), 400
     # 3. Kiểm tra định dạng file
     if not file.filename.endswith(('.xlsx', '.xls')):
         return jsonify({"error": "Định dạng file không hợp lệ. Vui lòng sử dụng file .xlsx hoặc .xls."}), 400
     try:
@@ -96,6 +114,7 @@ def predict_batch():
         return jsonify(results)
     except Exception as e:
         return jsonify({"error": f"Đã xảy ra lỗi khi xử lý file: {str(e)}"}), 500
 if __name__ == "__main__":

 from flask import Flask, request, jsonify
 from flask_cors import CORS
+import logging
+# Cấu hình logging cho app
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
 from model import predict_sentiment_3sentiment, predict_sentiment_5sentiment
 import pandas as pd
     """
     # Lấy dữ liệu JSON từ request
     json_data = request.get_json()
+    logger.info(f"Received predict request: {json_data}")
     # Kiểm tra xem key 'text' có tồn tại và không rỗng không
     if not json_data or 'text' not in json_data or not json_data.get('text', '').strip():
+        logger.warning("Missing 'text' in request")
         return jsonify({"error": "Vui lòng cung cấp trường 'text' trong request body."}), 400
     # Kiểm tra xem key 'type' có tồn tại và không rỗng không
     if not json_data or 'type' not in json_data or not json_data.get('type', '').strip():
+        logger.warning("Missing 'type' in request")
         return jsonify({"error": "Vui lòng cung cấp trường 'type' trong request body."}), 400
     # Lấy văn bản từ dữ liệu
     text_to_predict = json_data['text']
     sentiment_type = json_data['type']
     # Gọi hàm dự đoán từ model
+    try:
+        if sentiment_type == "3sentiment":
+            sentiment, score = predict_sentiment_3sentiment(text_to_predict)
+        elif sentiment_type == "5sentiment":
+            sentiment, score = predict_sentiment_5sentiment(text_to_predict)
+    except Exception as e:
+        logger.error(f"Prediction error: {e}")
+        return jsonify({"error": str(e)}), 500
     # Tạo response
     response = {
     """
     # 1. Kiểm tra xem có file trong request không
     if 'file' not in request.files:
+        logger.warning("No file part in request")
         return jsonify({"error": "Không tìm thấy file trong request (key phải là 'file')."}), 400
     # Dữ liệu form đi kèm với file sẽ nằm trong request.form
     sentiment_type = request.form.get('type')
+    logger.info(f"Received batch predict request for type: {sentiment_type}")
     # Kiểm tra xem key 'type' có tồn tại và không rỗng không
     if not sentiment_type or sentiment_type.strip() not in ["3sentiment", "5sentiment"]:
+        logger.warning("Invalid or missing 'type'")
         return jsonify({"error": "Vui lòng cung cấp trường 'type' (3sentiment hoặc 5sentiment) trong form data."}), 400
     file = request.files['file']
     # 2. Kiểm tra xem người dùng có chọn file không
     if file.filename == '':
+        logger.warning("No selected file")
         return jsonify({"error": "Chưa chọn file nào."}), 400
     # 3. Kiểm tra định dạng file
     if not file.filename.endswith(('.xlsx', '.xls')):
+        logger.warning(f"Invalid file format: {file.filename}")
         return jsonify({"error": "Định dạng file không hợp lệ. Vui lòng sử dụng file .xlsx hoặc .xls."}), 400
     try:
         return jsonify(results)
     except Exception as e:
+        logger.error(f"Error processing batch file: {e}")
         return jsonify({"error": f"Đã xảy ra lỗi khi xử lý file: {str(e)}"}), 500
 if __name__ == "__main__":

model.py CHANGED Viewed

@@ -3,18 +3,36 @@
 import torch
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
 import torch.nn.functional as F
 model_name_3sentiment = "phongnt251199/phobert-sentiment-reviews-v5"
 model_name_5sentiment = "phongnt251199/phobert-sentiment-reviews-v4"
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 # Load tokenizer và model cho 3 nhãn
-tokenizer_3sentiment = AutoTokenizer.from_pretrained(model_name_3sentiment)
-model_3sentiment = AutoModelForSequenceClassification.from_pretrained(model_name_3sentiment, num_labels=3).to(device)
 # Load tokenizer và model như bình thườngclear
-tokenizer_5sentiment = AutoTokenizer.from_pretrained(model_name_5sentiment)
-model_5sentiment = AutoModelForSequenceClassification.from_pretrained(model_name_5sentiment, num_labels=5).to(device)
 def predict_sentiment_3sentiment(text):
     inputs = tokenizer_3sentiment(text, padding=True, truncation=True, max_length=256, return_tensors="pt").to(device)

 import torch
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
 import torch.nn.functional as F
+import logging
+# Cấu hình logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
 model_name_3sentiment = "phongnt251199/phobert-sentiment-reviews-v5"
 model_name_5sentiment = "phongnt251199/phobert-sentiment-reviews-v4"
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+logger.info(f"Device being used: {device}")
 # Load tokenizer và model cho 3 nhãn
+logger.info(f"Start loading model 3sentiment: {model_name_3sentiment}")
+try:
+    tokenizer_3sentiment = AutoTokenizer.from_pretrained(model_name_3sentiment)
+    model_3sentiment = AutoModelForSequenceClassification.from_pretrained(model_name_3sentiment, num_labels=3).to(device)
+    logger.info("Loaded model 3sentiment successfully")
+except Exception as e:
+    logger.error(f"Error loading model 3sentiment: {e}")
+    raise e
 # Load tokenizer và model như bình thườngclear
+logger.info(f"Start loading model 5sentiment: {model_name_5sentiment}")
+try:
+    tokenizer_5sentiment = AutoTokenizer.from_pretrained(model_name_5sentiment)
+    model_5sentiment = AutoModelForSequenceClassification.from_pretrained(model_name_5sentiment, num_labels=5).to(device)
+    logger.info("Loaded model 5sentiment successfully")
+except Exception as e:
+    logger.error(f"Error loading model 5sentiment: {e}")
+    raise e
 def predict_sentiment_3sentiment(text):
     inputs = tokenizer_3sentiment(text, padding=True, truncation=True, max_length=256, return_tensors="pt").to(device)