harsh2ai
committed on
Commit
·
defdb4d
1
Parent(s):
264bf88
Simplify UI: Remove About tab, add links to main section
Browse files
app.py
CHANGED
|
@@ -162,6 +162,16 @@ def create_interface():
|
|
| 162 |
- π **Private Infrastructure**: Secure and controlled deployment
|
| 163 |
""")
|
| 164 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 165 |
# API Status indicator
|
| 166 |
with gr.Row():
|
| 167 |
with gr.Column(scale=4):
|
|
@@ -205,70 +215,6 @@ def create_interface():
|
|
| 205 |
- Speak naturally at a moderate pace
|
| 206 |
- For file upload, ensure audio quality is good (16kHz or higher recommended)
|
| 207 |
- Model handles code-switching between English and Hindi
|
| 208 |
-
|
| 209 |
-
### 🔧 Backend Configuration
|
| 210 |
-
This Space connects to a private API endpoint for transcription.
|
| 211 |
-
The API endpoint can be configured via the `STT_API_ENDPOINT` secret in Space Settings.
|
| 212 |
-
""")
|
| 213 |
-
|
| 214 |
-
with gr.Tab("ℹ️ About"):
|
| 215 |
-
gr.Markdown("""
|
| 216 |
-
## About Ringg STT V0
|
| 217 |
-
|
| 218 |
-
Ringg STT V0 is a state-of-the-art speech-to-text system for English and Hindi languages.
|
| 219 |
-
|
| 220 |
-
### 🎯 Model Details
|
| 221 |
-
- **Model**: Ringg STT V0
|
| 222 |
-
- **Languages**: English (EN) & Hindi (HI)
|
| 223 |
-
- **Sample Rate**: 16kHz
|
| 224 |
-
- **Performance**: 2nd place among top bilingual ASR models
|
| 225 |
-
- **Framework**: PyTorch-based deep learning
|
| 226 |
-
|
| 227 |
-
### ποΈ Architecture
|
| 228 |
-
|
| 229 |
-
This Space uses a **frontend-backend architecture**:
|
| 230 |
-
|
| 231 |
-
```
|
| 232 |
-
User → HF Space (Frontend) → API Endpoint → Private Server (Model) → Response
|
| 233 |
-
```
|
| 234 |
-
|
| 235 |
-
- **Frontend**: This Hugging Face Space (Gradio UI)
|
| 236 |
-
- **Backend**: Private inference server with the actual model
|
| 237 |
-
- **Connection**: Secure API calls via ngrok/tunnel
|
| 238 |
-
|
| 239 |
-
### π Key Features
|
| 240 |
-
- **Bilingual Recognition**: Native support for English and Hindi
|
| 241 |
-
- **Real-time Streaming**: Low-latency transcription
|
| 242 |
-
- **High Accuracy**: Optimized for conversational speech
|
| 243 |
-
- **Flexible Input**: Supports microphone streaming and file upload
|
| 244 |
-
- **Private Infrastructure**: Model runs on your own infrastructure
|
| 245 |
-
|
| 246 |
-
### π Use Cases
|
| 247 |
-
- Voice assistants and chatbots
|
| 248 |
-
- Meeting transcription
|
| 249 |
-
- Content creation and subtitling
|
| 250 |
-
- Accessibility applications
|
| 251 |
-
- Voice search and commands
|
| 252 |
-
|
| 253 |
-
### 🔧 Technical Specifications
|
| 254 |
-
- **Audio Processing**: 16kHz mono, PCM16
|
| 255 |
-
- **Latency**: ~2-3 seconds for streaming
|
| 256 |
-
- **API Protocol**: REST API with base64-encoded audio
|
| 257 |
-
- **Supported Formats**: WAV, MP3, FLAC, M4A, OGG, OPUS
|
| 258 |
-
|
| 259 |
-
### π Limitations
|
| 260 |
-
- Requires active backend API endpoint
|
| 261 |
-
- Works best with clear audio and minimal background noise
|
| 262 |
-
- Accuracy may vary with accents and dialects
|
| 263 |
-
- API latency depends on network and backend performance
|
| 264 |
-
|
| 265 |
-
### π Links
|
| 266 |
-
- **Organization**: [RinggAI on Hugging Face](https://huggingface.co/RinggAI)
|
| 267 |
-
- **TTS Space**: [Ringg TTS V0](https://huggingface.co/spaces/RinggAI/Ringg-TTS-v0.0)
|
| 268 |
-
|
| 269 |
-
---
|
| 270 |
-
|
| 271 |
-
Made with ❤️ by RinggAI Team
|
| 272 |
""")
|
| 273 |
|
| 274 |
return demo
|
|
|
|
| 162 |
- π **Private Infrastructure**: Secure and controlled deployment
|
| 163 |
""")
|
| 164 |
|
| 165 |
+
gr.Markdown("""
|
| 166 |
+
### π Links
|
| 167 |
+
- **Organization**: [RinggAI on Hugging Face](https://huggingface.co/RinggAI)
|
| 168 |
+
- **TTS Space**: [Ringg TTS V0](https://huggingface.co/spaces/RinggAI/Ringg-TTS-v0.0)
|
| 169 |
+
|
| 170 |
+
---
|
| 171 |
+
|
| 172 |
+
Made with ❤️ by RinggAI Team
|
| 173 |
+
""")
|
| 174 |
+
|
| 175 |
# API Status indicator
|
| 176 |
with gr.Row():
|
| 177 |
with gr.Column(scale=4):
|
|
|
|
| 215 |
- Speak naturally at a moderate pace
|
| 216 |
- For file upload, ensure audio quality is good (16kHz or higher recommended)
|
| 217 |
- Model handles code-switching between English and Hindi
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 218 |
""")
|
| 219 |
|
| 220 |
return demo
|