Pullo-Africa-Protagonist committed on
Commit
b78d5ae
·
verified ·
1 Parent(s): 0b3529e

Create config.json

Browse files
Files changed (1) hide show
  1. config.json +55 -0
config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
{
  "architectures": [
    "LlamaForCausalLM"
  ],

  "chat_type": "text",

  "wav_config_path": "./WavTokenizer/configs/wavtokenizer_smalldata_frame75_3s_nq1_code4096_dim512_kmeans200_attn.yaml",
  "wav_model_path": "./CHECKPOINTS/wavtokenizer_large_speech_320_24k.ckpt",
  "encoder_model_path": "charsiu/g2p_multilingual_byT5_tiny_16_layers_100",
  "tokenizer_path": "google/byt5-small",
  "llmvox_checkpoint_path": "./CHECKPOINTS/ckpt_krio_tiny.pt",

  "llm_checkpoint": "meta-llama/Llama-3.1-8B-Instruct",
  "llm_device": "cuda:0",
  "llm_max_tokens": 1000,
  "llm_temperature": 0.7,
  "llm_top_p": 0.95,
  "llm_top_k": 40,

  "tts_device_1": 1,
  "tts_device_2": 2,

  "system_prompt": "You are a friendly voicebot that answers questions in a concise way and do not use abbreviation.Give short responses",
  "initial_dump_size_1": 10,
  "initial_dump_size_2": 160,
  "max_dump_size": 1280,
  "max_audio_length": 8000,

  "eos_token": "<|eot_id|>",
  "pad_token_id": 384,
  "eoa_token_id": 453,

  "api_host": "0.0.0.0",
  "api_port": 5003,

  "asr_model": "small",
  "asr_device": "cuda:2",
  "asr_sample_rate": 16000.0,
  "asr_max_audio_length": 60,
  "asr_default_language": "english",
  "asr_enable_translation": false
}