datbkpro committed on
Commit
be8cb43
·
verified ·
1 Parent(s): ebe59f5

Update config/settings.py

Browse files
Files changed (1) hide show
  1. config/settings.py +2 -52
config/settings.py CHANGED
@@ -1,53 +1,4 @@
1
- # import os
2
- # from dotenv import load_dotenv
3
 
4
- # load_dotenv()
5
-
6
- # class Settings:
7
- # GROQ_API_KEY = os.getenv("GROQ_API_KEY")
8
-
9
- # # Multilingual Model Settings
10
- # VIETNAMESE_EMBEDDING_MODEL = 'keepitreal/vietnamese-sbert'
11
- # VIETNAMESE_LLM_MODEL = "llama-3.1-8b-instant"
12
-
13
- # MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2' # Sử dụng model nhẹ hơn
14
- # MULTILINGUAL_LLM_MODEL = "llama-3.1-8b-instant"
15
-
16
- # # Fallback models in case primary models fail
17
- # FALLBACK_MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
18
-
19
- # # Default models (fallback)
20
- # DEFAULT_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
21
- # DEFAULT_LLM_MODEL = "llama-3.1-8b-instant"
22
-
23
- # # Whisper Settings - CẬP NHẬT
24
- # WHISPER_MODEL = "whisper-large-v3"
25
-
26
- # # TTS Settings
27
- # MAX_CHUNK_LENGTH = 200
28
- # SUPPORTED_LANGUAGES = {
29
- # 'vi': 'vi', 'en': 'en', 'fr': 'fr', 'es': 'es',
30
- # 'de': 'de', 'ja': 'ja', 'ko': 'ko', 'zh': 'zh'
31
- # }
32
-
33
- # # RAG Settings - CẬP NHẬT
34
- # EMBEDDING_DIMENSION = 768 # For all-MiniLM-L6-v2
35
- # TOP_K_RESULTS = 5
36
-
37
- # # Audio Processing Settings - CẬP NHẬT QUAN TRỌNG
38
- # SAMPLE_RATE = 16000
39
- # AUDIO_CHUNK_SIZE = 1024
40
- # AUDIO_SILENCE_THRESHOLD = 0.005 # Ngưỡng âm lượng thấp hơn
41
- # MIN_AUDIO_DURATION = 0.5 # Giây - âm thanh tối thiểu
42
- # MAX_AUDIO_DURATION = 10.0 # Giây - âm thanh tối đa
43
-
44
- # # SpeechBrain VAD Settings - CẬP NHẬT
45
- # VAD_MODEL = "snakers4/silero-vad"
46
- # VAD_THRESHOLD = 0.2 # Giảm threshold để nhạy hơn
47
- # VAD_MIN_SILENCE_DURATION = 3 # Tăng thời gian silence
48
- # VAD_SPEECH_PAD_DURATION = 0.3 # Tăng padding
49
-
50
- # settings = Settings()
51
  import os
52
  from dotenv import load_dotenv
53
 
@@ -69,10 +20,9 @@ class Settings:
69
  # Default models
70
  DEFAULT_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
71
  DEFAULT_LLM_MODEL = "llama-3.1-8b-instant"
72
-
73
- # OCR Settings - SỬA LỖI NGÔN NGỮ
74
  OCR_MODEL = "kha-white/manga-ocr-base"
75
- EASYOCR_LANGUAGES = ['vi', 'en'] # SỬA 'zh' thành 'ch_sim'
76
 
77
  # Whisper Settings
78
  WHISPER_MODEL = "whisper-large-v3"
 
 
 
1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  import os
3
  from dotenv import load_dotenv
4
 
 
20
  # Default models
21
  DEFAULT_EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
22
  DEFAULT_LLM_MODEL = "llama-3.1-8b-instant"
23
+
 
24
  OCR_MODEL = "kha-white/manga-ocr-base"
25
+ EASYOCR_LANGUAGES = ['vi', 'en']
26
 
27
  # Whisper Settings
28
  WHISPER_MODEL = "whisper-large-v3"