datbkpro committed on
Commit
5b4cd8d
·
verified ·
1 Parent(s): 32592d6

Update config/settings.py

Browse files
Files changed (1) hide show
  1. config/settings.py +17 -18
config/settings.py CHANGED
@@ -4,38 +4,37 @@ from dotenv import load_dotenv
4
  load_dotenv()
5
 
6
  class Settings:
7
- # Ưu tiên lấy từ environment variables (cho Hugging Face)
8
- GROQ_API_KEY = os.getenv("GROQ_API_KEY") or os.getenv("X_GROQ_API_KEY")
9
 
10
- # Kiểm tra API Key
11
- if not GROQ_API_KEY:
12
- print("❌ CẢNH BÁO: Không tìm thấy GROQ_API_KEY")
13
- print("💡 Trên Hugging Face Spaces, hãy thêm biến môi trường:")
14
- print(" - Tên: GROQ_API_KEY")
15
- print(" - Value: gsk_xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx")
16
 
17
- # Multilingual Model Settings
18
- VIETNAMESE_EMBEDDING_MODEL = 'keepitreal/vietnamese-sbert'
19
- VIETNAMESE_LLM_MODEL = "llama-3.1-8b-instant"
20
 
21
- MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2'
22
- MULTILINGUAL_LLM_MODEL = "llama-3.1-8b-instant"
 
 
 
 
23
 
24
  WHISPER_MODEL = "whisper-large-v3-turbo"
25
 
26
  # TTS Settings
27
  MAX_CHUNK_LENGTH = 200
28
  SUPPORTED_LANGUAGES = {
29
- 'vi': 'vi', 'en': 'en', 'fr': 'fr', 'es': 'es',
30
- 'de': 'de', 'ja': 'ja', 'ko': 'ko', 'zh': 'zh'
31
  }
32
 
33
  # RAG Settings
34
- EMBEDDING_DIMENSION = 384
35
  TOP_K_RESULTS = 3
36
 
37
- # SpeechBrain VAD Settings
38
- VAD_MODEL = "speechbrain/vad-crdnn-libriparty"
39
  VAD_THRESHOLD = 0.5
40
  VAD_MIN_SILENCE_DURATION = 0.5
41
  VAD_SPEECH_PAD_DURATION = 0.1
 
4
  load_dotenv()
5
 
6
  class Settings:
7
+ GROQ_API_KEY = os.getenv("GROQ_API_KEY")
 
8
 
9
+ # Multilingual Model Settings - SỬA: Dùng models nhẹ và phổ biến
10
+ VIETNAMESE_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2' # Model nhẹ, hỗ trợ nhiều ngôn ngữ
11
+ VIETNAMESE_LLM_MODEL = "llama-3.1-8b-instant" # Model Groq
 
 
 
12
 
13
+ MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2' # Dùng model chung
14
+ MULTILINGUAL_LLM_MODEL = "llama-3.1-8b-instant" # Model Groq
 
15
 
16
+ # Fallback models
17
+ FALLBACK_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
18
+
19
+ # Default models
20
+ DEFAULT_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
21
+ DEFAULT_LLM_MODEL = "llama-3.1-8b-instant"
22
 
23
  WHISPER_MODEL = "whisper-large-v3-turbo"
24
 
25
  # TTS Settings
26
  MAX_CHUNK_LENGTH = 200
27
  SUPPORTED_LANGUAGES = {
28
+ 'vi': 'Vietnamese', 'en': 'English', 'fr': 'French', 'es': 'Spanish',
29
+ 'de': 'German', 'ja': 'Japanese', 'ko': 'Korean', 'zh': 'Chinese'
30
  }
31
 
32
  # RAG Settings
33
+ EMBEDDING_DIMENSION = 384 # Dimension của all-MiniLM-L6-v2
34
  TOP_K_RESULTS = 3
35
 
36
+ # SpeechBrain VAD Settings - TẠM TẮT để tránh lỗi
37
+ VAD_MODEL = None # Tạm tắt VAD
38
  VAD_THRESHOLD = 0.5
39
  VAD_MIN_SILENCE_DURATION = 0.5
40
  VAD_SPEECH_PAD_DURATION = 0.1