herimor committed on
Commit
a488840
·
1 Parent(s): fb729b5

Update package and model

Browse files
Files changed (4) hide show
  1. README.md +1 -0
  2. app.py +1 -1
  3. configs/generator.json +1 -1
  4. requirements.txt +1 -3
README.md CHANGED
@@ -16,6 +16,7 @@ tags:
16
  - text-to-speech
17
  - speech-synthesis
18
  preload_from_hub:
 
19
  - kyutai/moshiko-pytorch-bf16 tokenizer-e351c8d8-checkpoint125.safetensors
20
  - sarulab-speech/sidon-v0.1 decoder_cuda.pt
21
  - sarulab-speech/sidon-v0.1 feature_extractor_cuda.pt
 
16
  - text-to-speech
17
  - speech-synthesis
18
  preload_from_hub:
19
+ - herimor/voxtream2 model.safetensors,config.json,phoneme_to_token.json
20
  - kyutai/moshiko-pytorch-bf16 tokenizer-e351c8d8-checkpoint125.safetensors
21
  - sarulab-speech/sidon-v0.1 decoder_cuda.pt
22
  - sarulab-speech/sidon-v0.1 feature_extractor_cuda.pt
app.py CHANGED
@@ -74,7 +74,7 @@ def demo_app(config: SpeechGeneratorConfig, demo_examples, synthesize_fn):
74
  with gr.Blocks(css=CUSTOM_CSS, title="VoXtream2") as demo:
75
  gr.Markdown("# VoXtream2 TTS demo")
76
  gr.Markdown(
77
- "⚠️ First 3-5 runs may have higher latency due to model loading and warmup."
78
  )
79
 
80
  with gr.Row(equal_height=True, elem_id="cols"):
 
74
  with gr.Blocks(css=CUSTOM_CSS, title="VoXtream2") as demo:
75
  gr.Markdown("# VoXtream2 TTS demo")
76
  gr.Markdown(
77
+ "⚠️ The initial latency can be high due to deployment on ZeroGPU. For faster inference, please try local deployment. For more details, please visit [VoXtream GitHub repo](https://github.com/herimor/voxtream)"
78
  )
79
 
80
  with gr.Row(equal_height=True, elem_id="cols"):
configs/generator.json CHANGED
@@ -11,7 +11,7 @@
11
  "topk": 5,
12
  "top_p": 0.9,
13
  "max_audio_length_ms": 60000,
14
- "model_repo": "herimor/debug",
15
  "model_name": "model.safetensors",
16
  "model_config_name": "config.json",
17
  "mimi_sr": 24000,
 
11
  "topk": 5,
12
  "top_p": 0.9,
13
  "max_audio_length_ms": 60000,
14
+ "model_repo": "herimor/voxtream2",
15
  "model_name": "model.safetensors",
16
  "model_config_name": "config.json",
17
  "mimi_sr": 24000,
requirements.txt CHANGED
@@ -1,5 +1,3 @@
1
- --extra-index-url https://test.pypi.org/simple/
2
-
3
- voxtream==0.2.2
4
  gradio_client==1.3.0
5
  pydantic==2.10.6
 
1
+ voxtream==0.2.0
 
 
2
  gradio_client==1.3.0
3
  pydantic==2.10.6