Spaces:

tudeplom
/

api-stt

Sleeping

App Files Files Community

tudeplom committed on Mar 28

Commit

981b713

verified ·

1 Parent(s): de1cb80

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -30

app.py CHANGED Viewed

@@ -6,25 +6,45 @@ from flask import Flask, request, jsonify
 from flask_cors import CORS
 from vosk import Model, KaldiRecognizer
 # Khởi tạo Flask app
 app = Flask(__name__)
 CORS(app)
-# Đường dẫn model Vosk
-MODEL_PATH = "model"
-if not os.path.exists(MODEL_PATH):
-    raise Exception("Model Vosk không tìm thấy! Đảm bảo đã tải về model đúng thư mục.")
-model = Model(MODEL_PATH)
-def process_audio(file_path):
-    """ Xử lý file audio và trả về văn bản nhận dạng """
     wf = wave.open(file_path, "rb")
-    if wf.getnchannels() != 1:
-        return {"error": "Chỉ hỗ trợ file WAV mono (1 kênh)"}
     rec = KaldiRecognizer(model, wf.getframerate())
     result_text = ""
     while True:
         data = wf.readframes(4000)
         if len(data) == 0:
@@ -33,27 +53,9 @@ def process_audio(file_path):
             result_text += json.loads(rec.Result())["text"] + " "
     wf.close()
-    os.remove(file_path)  # Xóa file sau khi xử lý
-    return {"text": result_text.strip()}
-@app.route("/")
-def home():
-    return "✅ Vosk STT API đang chạy! Gửi file âm thanh đến /stt để nhận dạng."
-@app.route("/stt", methods=["POST"])
-def stt():
-    if "audio" not in request.files:
-        return jsonify({"error": "Không tìm thấy file audio!"}), 400
-    audio_file = request.files["audio"]
-    if not audio_file.filename.endswith(".wav"):
-        return jsonify({"error": "Chỉ hỗ trợ file WAV!"}), 400
-    file_path = "temp.wav"
-    audio_file.save(file_path)
-    result = process_audio(file_path)
-    return jsonify(result)
 if __name__ == "__main__":
-    app.run(host="0.0.0.0", port=7860, debug=True)

 from flask_cors import CORS
 from vosk import Model, KaldiRecognizer
+# Thư mục chứa model
+MODEL_PATH = "model/vosk-model"
+# Kiểm tra model đã tải chưa
+if not os.path.exists(MODEL_PATH):
+    raise Exception(f"❌ Model Vosk không tìm thấy tại {MODEL_PATH}! Kiểm tra lại.")
+# Load model
+print("✅ Đang tải model Vosk...")
+model = Model(MODEL_PATH)
 # Khởi tạo Flask app
 app = Flask(__name__)
 CORS(app)
+@app.route("/")
+def home():
+    return "✅ Vosk STT API đang chạy!"
+@app.route("/stt", methods=["POST"])
+def stt():
+    if "audio" not in request.files:
+        return jsonify({"error": "Không tìm thấy file audio!"}), 400
+    audio_file = request.files["audio"]
+    file_path = "temp.wav"
+    audio_file.save(file_path)
+    # Mở file âm thanh
     wf = wave.open(file_path, "rb")
+    # Kiểm tra file có đúng định dạng WAV mono không
+    if wf.getnchannels() != 1 or wf.getsampwidth() != 2 or wf.getcomptype() != "NONE":
+        os.remove(file_path)
+        return jsonify({"error": "File audio phải là WAV mono PCM!"}), 400
     rec = KaldiRecognizer(model, wf.getframerate())
     result_text = ""
     while True:
         data = wf.readframes(4000)
         if len(data) == 0:
             result_text += json.loads(rec.Result())["text"] + " "
     wf.close()
+    os.remove(file_path)  # Xóa file tạm
+    return jsonify({"text": result_text.strip()})
 if __name__ == "__main__":
+    app.run(host="0.0.0.0", port=7860, debug=True)