Text-to-Speech
Safetensors
English
Chinese
Files changed (1) hide show
  1. SparkAudio_Spark-TTS-0.5B.json +49 -0
SparkAudio_Spark-TTS-0.5B.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bomFormat": "CycloneDX",
3
+ "specVersion": "1.6",
4
+ "serialNumber": "urn:uuid:dd938abe-dbb2-4838-8459-edc51f28df1b",
5
+ "version": 1,
6
+ "metadata": {
7
+ "timestamp": "2025-07-14T14:13:20.770453+00:00",
8
+ "component": {
9
+ "type": "machine-learning-model",
10
+ "bom-ref": "SparkAudio/Spark-TTS-0.5B-bf10ddd8-615d-53b3-b697-f3e446f4c11b",
11
+ "name": "SparkAudio/Spark-TTS-0.5B",
12
+ "externalReferences": [
13
+ {
14
+ "url": "https://huggingface.co/SparkAudio/Spark-TTS-0.5B",
15
+ "type": "documentation"
16
+ }
17
+ ],
18
+ "modelCard": {
19
+ "modelParameters": {
20
+ "task": "text-to-speech"
21
+ }
22
+ },
23
+ "authors": [
24
+ {
25
+ "name": "SparkAudio"
26
+ }
27
+ ],
28
+ "licenses": [
29
+ {
30
+ "license": {
31
+ "id": "CC-BY-NC-SA-4.0",
32
+ "url": "https://spdx.org/licenses/CC-BY-NC-SA-4.0.html"
33
+ }
34
+ }
35
+ ],
36
+ "description": "Spark-TTS is an advanced text-to-speech system that uses the power of large language models (LLM) for highly accurate and natural-sounding voice synthesis. It is designed to be efficient, flexible, and powerful for both research and production use.",
37
+ "tags": [
38
+ "safetensors",
39
+ "text-to-speech",
40
+ "en",
41
+ "zh",
42
+ "arxiv:2503.01710",
43
+ "doi:10.57967/hf/4650",
44
+ "license:cc-by-nc-sa-4.0",
45
+ "region:us"
46
+ ]
47
+ }
48
+ }
49
+ }