| import os |
| import json |
| import wave |
| import numpy as np |
| import soundfile as sf |
| from vosk import Model, KaldiRecognizer |
| from flask import Flask |
| from flask_socketio import SocketIO, emit |
|
|
| |
| app = Flask(__name__) |
| socketio = SocketIO(app, cors_allowed_origins="*") |
|
|
| |
| MODEL_PATH = "model/vosk-model" |
| if not os.path.exists(MODEL_PATH): |
| raise Exception("❌ Model Vosk không tìm thấy!") |
| print("✅ Đang tải model Vosk...") |
| model = Model(MODEL_PATH) |
|
|
| |
| rec = KaldiRecognizer(model, 16000) |
|
|
| |
| @socketio.on("audio_chunk") |
| def handle_audio(audio_data): |
| print(f"📩 Nhận dữ liệu âm thanh: {len(audio_data)} bytes") |
|
|
| |
| audio_np = np.frombuffer(audio_data, dtype=np.int16) |
|
|
| |
| if rec.AcceptWaveform(audio_np.tobytes()): |
| result = json.loads(rec.Result()) |
| text = result.get("text", "") |
| print(f"📤 Kết quả nhận diện: {text}") |
| emit("stt_result", {"text": text}) |
|
|
| |
| if __name__ == "__main__": |
| socketio.run(app, host="0.0.0.0", port=5000, debug=True, allow_unsafe_werkzeug=True) |
|
|