mnhatdaous committed on
Commit
e76369a
·
1 Parent(s): 248479c

Update Gradio demo with training instructions and status

Browse files
Files changed (1) hide show
  1. app.py +41 -2
app.py CHANGED
@@ -40,7 +40,26 @@ def create_demo():
40
 
41
  An unofficial implementation based on improvements of CosyVoice with learnable encoder and DAC-VAE.
42
 
43
- > **Note**: This is a demo interface. To use the actual model, you need to train it first using the provided training pipeline.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  """
45
  )
46
 
@@ -70,7 +89,27 @@ def create_demo():
70
  type="numpy"
71
  )
72
 
73
- with gr.Accordion("📋 Project Information", open=False):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  gr.Markdown(
75
  """
76
  ### Key Features
 
40
 
41
  An unofficial implementation based on improvements of CosyVoice with learnable encoder and DAC-VAE.
42
 
43
+ > **⚠️ This is a demo interface with placeholder audio. To use the actual model, you need to train it first!**
44
+
45
+ ## 🚀 How to Train Your Own Model:
46
+
47
+ 1. **Follow the [Training Guide](https://github.com/primepake/learnable-speech/blob/main/TRAINING_GUIDE.md)**
48
+ 2. **Use the provided training scripts** in the `scripts/` directory
49
+ 3. **Upload your trained models** to Hugging Face Hub
50
+ 4. **Replace the placeholder code** in this Space with your models
51
+
52
+ ### Quick Start:
53
+ ```bash
54
+ # 1. Prepare your dataset
55
+ ./scripts/prepare_data.sh
56
+
57
+ # 2. Train the model
58
+ ./scripts/train_full_pipeline.sh
59
+
60
+ # 3. Upload to Hugging Face
61
+ python scripts/upload_to_hf.py --username your_username
62
+ ```
63
  """
64
  )
65
 
 
89
  type="numpy"
90
  )
91
 
92
+ with gr.Accordion("🎯 Training Status & Next Steps", open=True):
93
+ gr.Markdown(
94
+ """
95
+ ### 📋 Current Status:
96
+ - ✅ **Demo Interface**: Ready
97
+ - ❌ **Trained Models**: Not available (placeholder audio only)
98
+ - ❌ **Model Inference**: Not implemented yet
99
+
100
+ ### 🔧 To Enable Real Speech Synthesis:
101
+ 1. **Train the models** using the provided pipeline
102
+ 2. **Upload trained checkpoints** to Hugging Face Hub
103
+ 3. **Update the inference code** in `synthesize_speech()` function
104
+ 4. **Test with real model outputs**
105
+
106
+ ### 📚 Resources:
107
+ - [📖 Complete Training Guide](https://github.com/primepake/learnable-speech/blob/main/TRAINING_GUIDE.md)
108
+ - [🛠️ Training Scripts](https://github.com/primepake/learnable-speech/tree/main/scripts)
109
+ - [📄 Research Paper](https://arxiv.org/pdf/2505.07916)
110
+ - [💻 GitHub Repository](https://github.com/primepake/learnable-speech)
111
+ """
112
+ )
113
  gr.Markdown(
114
  """
115
  ### Key Features