datbkpro committed on
Commit
8289f9b
·
verified ·
1 Parent(s): 66805ac

Update config/settings.py

Browse files
Files changed (1) hide show
  1. config/settings.py +17 -14
config/settings.py CHANGED
@@ -3,8 +3,6 @@ from dotenv import load_dotenv
3
 
4
  load_dotenv()
5
 
6
-
7
-
8
  class Settings:
9
  GROQ_API_KEY = os.getenv("GROQ_API_KEY")
10
 
@@ -12,16 +10,17 @@ class Settings:
12
  VIETNAMESE_EMBEDDING_MODEL = 'keepitreal/vietnamese-sbert'
13
  VIETNAMESE_LLM_MODEL = "llama-3.1-8b-instant"
14
 
15
- MULTILINGUAL_EMBEDDING_MODEL = 'Qwen/Qwen3-Embedding-0.6B'
16
  MULTILINGUAL_LLM_MODEL = "llama-3.1-8b-instant"
17
 
18
  # Fallback models in case primary models fail
19
  FALLBACK_MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
20
 
21
  # Default models (fallback)
22
- DEFAULT_EMBEDDING_MODEL = 'dangvantuan/vietnamese-embedding'
23
- DEFAULT_LLM_MODEL = "Vietnamese_LLaMA2_13B_8K_SFT_General_Domain_Knowledge"
24
 
 
25
  WHISPER_MODEL = "whisper-large-v3"
26
 
27
  # TTS Settings
@@ -31,17 +30,21 @@ class Settings:
31
  'de': 'de', 'ja': 'ja', 'ko': 'ko', 'zh': 'zh'
32
  }
33
 
34
- # RAG Settings
35
- EMBEDDING_DIMENSION = 768 # For Vietnamese model
36
- MULTILINGUAL_EMBEDDING_DIMENSION = 4096 # For Nemotron model
37
-
38
  TOP_K_RESULTS = 3
39
 
40
- # SpeechBrain VAD Settings
41
- VAD_MODEL = "speechbrain/vad-crdnn-libriparty"
42
- VAD_THRESHOLD = 0.5
43
- VAD_MIN_SILENCE_DURATION = 0.8
44
- VAD_SPEECH_PAD_DURATION = 0.2
45
  SAMPLE_RATE = 16000
 
 
 
 
 
 
 
 
 
 
46
 
47
  settings = Settings()
 
3
 
4
  load_dotenv()
5
 
 
 
6
  class Settings:
7
  GROQ_API_KEY = os.getenv("GROQ_API_KEY")
8
 
 
10
  VIETNAMESE_EMBEDDING_MODEL = 'keepitreal/vietnamese-sbert'
11
  VIETNAMESE_LLM_MODEL = "llama-3.1-8b-instant"
12
 
13
+ MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2' # Sử dụng model nhẹ hơn
14
  MULTILINGUAL_LLM_MODEL = "llama-3.1-8b-instant"
15
 
16
  # Fallback models in case primary models fail
17
  FALLBACK_MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
18
 
19
  # Default models (fallback)
20
+ DEFAULT_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
21
+ DEFAULT_LLM_MODEL = "llama-3.1-8b-instant"
22
 
23
+ # Whisper Settings - CẬP NHẬT
24
  WHISPER_MODEL = "whisper-large-v3"
25
 
26
  # TTS Settings
 
30
  'de': 'de', 'ja': 'ja', 'ko': 'ko', 'zh': 'zh'
31
  }
32
 
33
+ # RAG Settings - CẬP NHẬT
34
+ EMBEDDING_DIMENSION = 384 # For all-MiniLM-L6-v2
 
 
35
  TOP_K_RESULTS = 3
36
 
37
+ # Audio Processing Settings - CẬP NHẬT QUAN TRỌNG
 
 
 
 
38
  SAMPLE_RATE = 16000
39
+ AUDIO_CHUNK_SIZE = 1024
40
+ AUDIO_SILENCE_THRESHOLD = 0.005 # Ngưỡng âm lượng thấp hơn
41
+ MIN_AUDIO_DURATION = 0.5 # Giây - âm thanh tối thiểu
42
+ MAX_AUDIO_DURATION = 10.0 # Giây - âm thanh tối đa
43
+
44
+ # SpeechBrain VAD Settings - CẬP NHẬT
45
+ VAD_MODEL = "speechbrain/vad-crdnn-libriparty"
46
+ VAD_THRESHOLD = 0.3 # Giảm threshold để nhạy hơn
47
+ VAD_MIN_SILENCE_DURATION = 1.0 # Tăng thời gian silence
48
+ VAD_SPEECH_PAD_DURATION = 0.3 # Tăng padding
49
 
50
  settings = Settings()