Text-to-Speech
F5-TTS
File size: 4,528 Bytes
31d31e0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
{
    "bomFormat": "CycloneDX",
    "specVersion": "1.6",
    "serialNumber": "urn:uuid:af7257f9-86de-47be-b728-482271c21016",
    "version": 1,
    "metadata": {
        "timestamp": "2025-06-05T09:35:47.771137+00:00",
        "component": {
            "type": "machine-learning-model",
            "bom-ref": "SWivid/F5-TTS-1eaa5074-7711-55bb-b142-7f1391dec9d2",
            "name": "SWivid/F5-TTS",
            "externalReferences": [
                {
                    "url": "https://huggingface.co/SWivid/F5-TTS",
                    "type": "documentation"
                }
            ],
            "modelCard": {
                "modelParameters": {
                    "task": "text-to-speech",
                    "datasets": [
                        {
                            "ref": "amphion/Emilia-Dataset-a72e5559-5c47-57e2-9bae-a062ac838d0b"
                        }
                    ]
                },
                "properties": [
                    {
                        "name": "library_name",
                        "value": "f5-tts"
                    }
                ]
            },
            "authors": [
                {
                    "name": "SWivid"
                }
            ],
            "licenses": [
                {
                    "license": {
                        "id": "CC-BY-NC-4.0",
                        "url": "https://spdx.org/licenses/CC-BY-NC-4.0.html"
                    }
                }
            ],
            "tags": [
                "f5-tts",
                "text-to-speech",
                "dataset:amphion/Emilia-Dataset",
                "arxiv:2410.06885",
                "license:cc-by-nc-4.0",
                "region:us"
            ]
        }
    },
    "components": [
        {
            "type": "data",
            "bom-ref": "amphion/Emilia-Dataset-a72e5559-5c47-57e2-9bae-a062ac838d0b",
            "name": "amphion/Emilia-Dataset",
            "data": [
                {
                    "type": "dataset",
                    "name": "amphion/Emilia-Dataset",
                    "contents": {
                        "url": "https://huggingface.co/datasets/amphion/Emilia-Dataset",
                        "properties": [
                            {
                                "name": "task_categories",
                                "value": "text-to-speech, automatic-speech-recognition"
                            },
                            {
                                "name": "language",
                                "value": "zh, en, ja, fr, de, ko"
                            },
                            {
                                "name": "size_categories",
                                "value": "10M<n<100M"
                            },
                            {
                                "name": "pretty_name",
                                "value": "Emilia"
                            },
                            {
                                "name": "license",
                                "value": "cc-by-4.0"
                            }
                        ]
                    },
                    "governance": {
                        "owners": [
                            {
                                "organization": {
                                    "name": "amphion",
                                    "url": "https://huggingface.co/amphion"
                                }
                            }
                        ]
                    },
                    "description": "Emilia: An Extensive, Multilingual, and Diverse Speech Dataset for Large-Scale Speech Generation\n\nThis is the official repository \ud83d\udc51 for the Emilia dataset and the source code for the Emilia-Pipe speech data preprocessing pipeline.\n\nNews \ud83d\udd25\n\n2025/02/26: The Emilia-Large dataset, featuring over 200,000 hours of data, is now available!!! Emilia-Large combines the original 101k-hour Emilia dataset (licensed under CC BY-NC 4.0) with the brand-new 114k-hour Emilia-YODAS\u2026 See the full description on the dataset page: https://huggingface.co/datasets/amphion/Emilia-Dataset."
                }
            ]
        }
    ]
}