xjsc0 committed on
Commit
4ef36ed
·
1 Parent(s): 31055ef
Files changed (1) hide show
  1. requirements.txt +110 -183
requirements.txt CHANGED
@@ -1,199 +1,126 @@
1
- absl-py==2.3.1
 
 
 
 
 
2
  accelerate==1.12.0
3
- aiofiles==24.1.0
4
- aiohappyeyeballs==2.6.1
5
- aiohttp==3.12.15
6
- aiosignal==1.4.0
7
- alias-free-torch==0.0.6
8
- annotated-types==0.7.0
9
- antlr4-python3-runtime==4.9.3
10
- anyio==4.11.0
11
- argbind==0.3.9
12
- argparse==1.4.0
13
- async-timeout==5.0.1
14
- attrs==25.3.0
15
- audiobox-aesthetics==0.0.4
16
- audioread==3.0.1
17
- av==16.0.1
18
- beartype==0.22.2
19
  bitsandbytes==0.48.1
20
- brotli==1.1.0
21
- certifi==2025.8.3
22
- cffi==2.0.0
23
- chardet==5.2.0
24
- charset-normalizer==3.4.3
25
- click==8.3.0
26
- cloudpickle==3.1.1
27
- colorama==0.4.6
28
- coloredlogs==15.0.1
29
- configparser==7.2.0
30
- cryptography==46.0.3
31
- datasets==2.21.0
32
- decorator==5.2.1
33
- deprecated==1.2.18
34
  diffusers==0.36.0
35
- dill==0.3.8
36
- distro==1.9.0
37
- dlinfo==2.0.0
38
- docstring-parser==0.17.0
39
- easydict==1.13
40
- einops==0.8.1
41
- einops-exts==0.0.4
42
- einx==0.3.0
43
- ema-pytorch==0.7.7
44
  encodec==0.1.1
45
- exceptiongroup==1.3.0
46
- fastapi==0.118.0
47
- ffmpy==0.6.1
48
- filelock==3.19.1
49
- fire==0.7.1
50
- flatten-dict==0.4.2
51
- frozendict==2.4.6
52
- frozenlist==1.7.0
53
- fsspec==2024.6.1
54
- ftfy==6.3.1
55
- future==1.0.0
56
- gin-config==0.5.0
57
- grpcio==1.75.1
58
- h11==0.16.0
59
- hf-xet==1.1.10
60
- httpcore==1.0.9
61
- httpx==0.28.1
62
- huggingface-hub==0.35.3
63
- humanfriendly==10.0
64
- hydra-core==1.3.2
65
- idna==3.10
66
- importlib-metadata==8.7.1
67
- importlib-resources==6.5.2
68
- jinja2==3.1.6
69
- jiter==0.12.0
70
- joblib==1.5.2
71
- jsonmerge==1.9.2
72
- jsonschema==4.25.1
73
- jsonschema-specifications==2025.9.1
74
  julius==0.2.7
75
- k-diffusion==0.1.1
76
  lameenc==1.8.1
77
- lazy-loader==0.4
78
- librosa==0.10.2.post1
79
- lightning==2.6.1
80
- lightning-utilities==0.15.2
81
- llvmlite==0.45.1
82
- loguru==0.7.3
83
- loralib==0.1.2
84
- markdown==3.9
85
- markdown-it-py==4.0.0
86
- markdown2==2.5.4
87
- markupsafe==3.0.3
88
- mdurl==0.1.2
 
 
 
 
 
89
  midi2audio==0.1.1
90
  mido==1.3.3
91
- ml-collections==1.1.0
 
 
 
 
 
 
 
 
 
 
 
 
 
92
  modelscope==1.32.0
93
- more-itertools==10.8.0
94
- mpmath==1.3.0
95
- msgpack==1.1.1
96
- multidict==6.6.4
97
- multiprocess==0.70.16
98
- munch==4.0.0
99
- muq==0.1.0
100
- music21==9.9.1
101
- mutagen==1.47.0
102
- networkx==3.4.2
103
- nnaudio==0.3.3
104
- numba==0.62.1
105
- numpy
 
 
 
 
 
 
 
 
 
106
  omegaconf==2.3.0
107
- orjson==3.11.3
108
- packaging==25.0
109
- pandas==2.2.3
110
- peft==0.11.1
111
- platformdirs==4.4.0
112
- pooch==1.8.2
113
  prefigure==0.0.10
114
- pretty-midi==0.2.11
115
- propcache==0.3.2
116
- psutil==7.1.0
117
- pycparser==2.23
118
- pydub==0.25.1
119
- pylance==0.23.2
120
- pyloudnorm==0.1.1
121
- pylrc==0.1.2
122
- pyparsing==3.2.5
123
- python-dateutil==2.9.0.post0
124
- python-multipart==0.0.20
125
- pytorch-lightning==2.5.5
126
- pytz==2025.2
127
  pyyaml==6.0.3
128
- qwen-omni-utils==0.0.8
129
- rapidfuzz==2.13.7
130
- referencing==0.36.2
131
- regex==2025.9.18
132
- requests==2.32.5
133
- resampy==0.4.3
134
- retrying==1.4.2
135
- rfc3986==1.5.0
136
- rich==14.1.0
137
- rotary-embedding-torch==0.8.9
138
- rpds-py==0.27.1
139
- ruamel-yaml==0.19.1
140
- safetensors==0.6.2
141
- scikit-learn==1.7.2
142
- scipy==1.15.3
143
- segments==2.3.0
144
- semantic-version==2.10.0
145
- sentencepiece==0.2.1
146
- setuptools==80.9.0
147
- shellingham==1.5.4
148
- six==1.17.0
149
- sniffio==1.3.1
150
- soundfile==0.13.1
151
- sox==1.5.0
152
- soxr==1.0.0
153
- starlette==0.48.0
154
- sympy==1.13.1
155
  tensorboard==2.20.0
156
- tensorboard-data-server==0.7.2
157
  tensorboardx==2.6.4
158
- termcolor==3.1.0
159
- threadpoolctl==3.6.0
160
- tokenizers==0.22.2
161
- tomlkit==0.13.3
162
- torch==2.6.0
163
- torch-complex==0.4.4
164
- torchaudio==2.6.0
165
- torchcodec==0.10.0
166
- torchcrepe==0.0.24
167
- torchdiffeq==0.2.5
168
- torchmetrics==1.8.2
169
- torchsde==0.2.6
170
  tqdm==4.67.1
171
- trampoline==0.1.2
172
- transformers==4.57.6
173
- triton==3.2.0
174
- typeguard==4.4.4
175
- typer==0.19.2
176
- typing-extensions==4.15.0
177
- typing-inspection==0.4.2
178
- tzdata==2025.2
179
  unidecode==1.3.8
180
- urllib3==2.5.0
181
- uvicorn==0.37.0
182
- vector-quantize-pytorch==1.23.2
183
- vocos==0.1.0
184
- wandb==0.22.1
185
- websockets==15.0.1
186
- wrapt==1.17.3
187
- x-transformers==2.1.2
188
- xxhash==3.6.0
189
- yarl==1.20.1
190
- zhconv==1.4.3
191
- zhon==2.1.1
192
- zipp==3.23.0
193
- jieba
194
- pypinyin
195
- descript-audio-codec
196
- cn2an
197
- onnxruntime
198
- phonemizer
199
- py3langid
 
1
+ # ============ Core ML / PyTorch ============
2
+ torch==2.6.0
3
+ torchaudio==2.6.0
4
+ torchvision==0.21.0
5
+ lightning==2.6.1
6
+ pytorch-lightning==2.5.5
7
  accelerate==1.12.0
8
+ transformers==4.57.6
9
+ tokenizers==0.22.2
10
+ safetensors==0.6.2
11
+ peft==0.11.1
 
 
 
 
 
 
 
 
 
 
 
 
12
  bitsandbytes==0.48.1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  diffusers==0.36.0
14
+ datasets==2.21.0
15
+ sentencepiece==0.2.1
16
+
17
+ # ============ Audio Processing ============
18
+ librosa==0.10.2.post1
19
+ soundfile==0.13.1
20
+ torchcrepe==0.0.24
 
 
21
  encodec==0.1.1
22
+ descript-audio-codec==1.0.0
23
+ descript-audiotools==0.7.2
24
+ vocos==0.1.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  julius==0.2.7
 
26
  lameenc==1.8.1
27
+ pyloudnorm==0.1.1
28
+ pydub==0.25.1
29
+ sox==1.5.0
30
+ soxr==1.0.0
31
+ nnaudio==0.3.3
32
+ av==16.0.1
33
+ audioread==3.0.1
34
+ resampy==0.4.3
35
+ pystoi==0.4.1
36
+ torch-stoi==0.2.3
37
+ torch-complex==0.4.4
38
+ audiobox-aesthetics==0.0.4
39
+ torchcodec==0.10.0
40
+
41
+ # ============ Music / MIDI ============
42
+ music21==9.9.1
43
+ pretty-midi==0.2.11
44
  midi2audio==0.1.1
45
  mido==1.3.3
46
+ pylrc==0.1.2
47
+
48
+ # ============ Chinese NLP / TTS ============
49
+ pypinyin==0.55.0
50
+ cn2an==0.5.23
51
+ phonemizer==3.3.0
52
+ jieba==0.42.1
53
+ zhconv==1.4.3
54
+ zhon==2.1.1
55
+ py3langid==0.3.0
56
+ segments==2.3.0
57
+
58
+ # ============ Model Hubs ============
59
+ huggingface-hub==0.35.3
60
  modelscope==1.32.0
61
+
62
+ # ============ Neural Net Utilities ============
63
+ einops==0.8.1
64
+ einops-exts==0.0.4
65
+ einx==0.3.0
66
+ ema-pytorch==0.7.7
67
+ rotary-embedding-torch==0.8.9
68
+ vector-quantize-pytorch==1.23.2
69
+ x-transformers==2.1.2
70
+ x-clip==0.14.4
71
+ alias-free-torch==0.0.6
72
+ loralib==0.1.2
73
+ k-diffusion==0.1.1
74
+ torchdiffeq==0.2.5
75
+ torchsde==0.2.6
76
+ kornia==0.8.2
77
+ dctorch==0.1.2
78
+ clean-fid==0.1.35
79
+ clip-anytorch==2.6.0
80
+
81
+ # ============ Config / CLI ============
82
+ hydra-core==1.3.2
83
  omegaconf==2.3.0
84
+ fire==0.7.1
85
+ argbind==0.3.9
 
 
 
 
86
  prefigure==0.0.10
87
+ gin-config==0.5.0
88
+ ml-collections==1.1.0
89
+ easydict==1.13
 
 
 
 
 
 
 
 
 
 
90
  pyyaml==6.0.3
91
+
92
+ # ============ Web / API (Gradio) ============
93
+ gradio==6.9.0
94
+
95
+ # ============ Monitoring / Logging ============
96
+ wandb==0.22.1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
97
  tensorboard==2.20.0
 
98
  tensorboardx==2.6.4
99
+ loguru==0.7.3
100
+
101
+ # ============ Data / Science ============
102
+ numpy==2.2.6
103
+ scipy==1.15.3
104
+ pandas==2.2.3
105
+ scikit-learn==1.7.2
106
+ scikit-image==0.25.2
107
+ matplotlib==3.10.8
108
+ pillow==12.1.1
109
+
110
+ # ============ Misc Utilities ============
111
  tqdm==4.67.1
112
+ regex==2025.9.18
113
+ ftfy==6.3.1
 
 
 
 
 
 
114
  unidecode==1.3.8
115
+ rapidfuzz==2.13.7
116
+ mutagen==1.47.0
117
+ numba==0.62.1
118
+ onnxruntime==1.23.2
119
+ protobuf==3.19.6
120
+ qwen-omni-utils==0.0.8
121
+ muq==0.1.0
122
+ pylance==0.23.2
123
+ proces==0.1.7
124
+ groovy==0.1.2
125
+ randomname==0.2.1
126
+ submitit==1.5.4