Add files using upload-large-folder tool
Browse files
- .gitattributes +6 -34
- LICENSE +21 -0
- NOTICE +17 -0
- README.md +47 -3
- dacvae_decode_12s.onnx +3 -0
- dacvae_decode_12s.onnx.data +3 -0
- dacvae_decode_16s.onnx +3 -0
- dacvae_decode_16s.onnx.data +3 -0
- dacvae_decode_1s.onnx +3 -0
- dacvae_decode_1s.onnx.data +3 -0
- dacvae_decode_24s.onnx +3 -0
- dacvae_decode_24s.onnx.data +3 -0
- dacvae_decode_2s.onnx +3 -0
- dacvae_decode_2s.onnx.data +3 -0
- dacvae_decode_30s.onnx +3 -0
- dacvae_decode_30s.onnx.data +3 -0
- dacvae_decode_4s.onnx +3 -0
- dacvae_decode_4s.onnx.data +3 -0
- dacvae_decode_8s.onnx +3 -0
- dacvae_decode_8s.onnx.data +3 -0
- manifest.json +158 -0
- migraphx/dacvae_decode_24s.mxr +3 -0
- migraphx/dacvae_decode_2s.mxr +3 -0
- migraphx/dacvae_decode_30s.mxr +3 -0
- migraphx/dacvae_decode_4s.mxr +3 -0
- migraphx/dacvae_decode_8s.mxr +3 -0
- migraphx/rfdit_context_fp32_30s.mxr +3 -0
- migraphx/rfdit_step_fp32_1s.mxr +3 -0
- migraphx/rfdit_step_fp32_24s.mxr +3 -0
- migraphx/rfdit_step_fp32_2s.mxr +3 -0
- migraphx/rfdit_step_fp32_30s.mxr +3 -0
- rfdit_context_fp32_30s.onnx +3 -0
- rfdit_context_fp32_30s.onnx.data +3 -0
- rfdit_step_fp32_12s.onnx +3 -0
- rfdit_step_fp32_12s.onnx.data +3 -0
- rfdit_step_fp32_16s.onnx +3 -0
- rfdit_step_fp32_16s.onnx.data +3 -0
- rfdit_step_fp32_1s.onnx +3 -0
- rfdit_step_fp32_1s.onnx.data +3 -0
- rfdit_step_fp32_24s.onnx +3 -0
- rfdit_step_fp32_24s.onnx.data +3 -0
- rfdit_step_fp32_2s.onnx +3 -0
- rfdit_step_fp32_2s.onnx.data +3 -0
- rfdit_step_fp32_30s.onnx +3 -0
- rfdit_step_fp32_30s.onnx.data +3 -0
- rfdit_step_fp32_4s.onnx +3 -0
- rfdit_step_fp32_4s.onnx.data +3 -0
- rfdit_step_fp32_8s.onnx +3 -0
- rfdit_step_fp32_8s.onnx.data +3 -0
- tokenizer/llm-jp-3-150m/tokenizer.json +0 -0
.gitattributes
CHANGED
|
@@ -1,35 +1,7 @@
|
|
| 1 |
-
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
-
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
-
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
-
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
-
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
-
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
-
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
-
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
-
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
-
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
-
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
-
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
-
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
-
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
-
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
-
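*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
-
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
-
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
-
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
-
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
-
*.pt filter=lfs diff=lfs merge=lfs -text
|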
| 23 |
-
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
-
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
-
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
-
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
-
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
-
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
-
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
-
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
-
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
-
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
-
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
-
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
-
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.data filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.mxr filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.json text
|
| 5 |
+
README.md text
|
| 6 |
+
LICENSE text
|
| 7 |
+
NOTICE text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
LICENSE
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MIT License
|
| 2 |
+
|
| 3 |
+
Copyright (c) 2026 Aratako
|
| 4 |
+
|
| 5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
| 6 |
+
of this software and associated documentation files (the "Software"), to deal
|
| 7 |
+
in the Software without restriction, including without limitation the rights
|
| 8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
| 9 |
+
copies of the Software, and to permit persons to whom the Software is
|
| 10 |
+
furnished to do so, subject to the following conditions:
|
| 11 |
+
|
| 12 |
+
The above copyright notice and this permission notice shall be included in all
|
| 13 |
+
copies or substantial portions of the Software.
|
| 14 |
+
|
| 15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
| 16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
| 17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
| 18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
| 19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
| 20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
| 21 |
+
SOFTWARE.
|
NOTICE
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Notices
|
| 2 |
+
|
| 3 |
+
This repository contains exported ONNX and MIGraphX artifacts derived from:
|
| 4 |
+
|
| 5 |
+
- Aratako/Irodori-TTS-500M-v2-VoiceDesign
|
| 6 |
+
License: MIT
|
| 7 |
+
https://huggingface.co/Aratako/Irodori-TTS-500M-v2-VoiceDesign
|
| 8 |
+
|
| 9 |
+
- Aratako/Semantic-DACVAE-Japanese-32dim
|
| 10 |
+
License: MIT
|
| 11 |
+
https://huggingface.co/Aratako/Semantic-DACVAE-Japanese-32dim
|
| 12 |
+
|
| 13 |
+
This repository includes tokenizer files from:
|
| 14 |
+
|
| 15 |
+
- llm-jp/llm-jp-3-150m
|
| 16 |
+
License: Apache License 2.0
|
| 17 |
+
https://huggingface.co/llm-jp/llm-jp-3-150m
|
README.md
CHANGED
|
@@ -1,3 +1,47 @@
|
|
| 1 |
-
---
|
| 2 |
-
license: mit
|
| 3 |
-
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: mit
|
| 3 |
+
pipeline_tag: text-to-speech
|
| 4 |
+
tags:
|
| 5 |
+
- irodori-tts
|
| 6 |
+
- text-to-speech
|
| 7 |
+
- japanese
|
| 8 |
+
- onnx
|
| 9 |
+
- migraphx
|
| 10 |
+
- rocm
|
| 11 |
+
- voice-design
|
| 12 |
+
---
|
| 13 |
+
|
| 14 |
+
# irodori_tts_cpp_artifacts
|
| 15 |
+
|
| 16 |
+
Exported ONNX and MIGraphX artifacts for running `Aratako/Irodori-TTS-500M-v2-VoiceDesign` with the native `irodori_tts_cpp` runtime.
|
| 17 |
+
|
| 18 |
+
This repository contains only the inference artifacts required by the C++ runtime:
|
| 19 |
+
|
| 20 |
+
- `manifest.json`
|
| 21 |
+
- local tokenizer JSON (`tokenizer/llm-jp-3-150m/tokenizer.json`)
|
| 22 |
+
- RF-DiT context ONNX / external data / MIGraphX cache
|
| 23 |
+
- RF-DiT step ONNX / external data / MIGraphX cache for 1, 2, 4, 8, 12, 16, 24, and 30 second buckets
|
| 24 |
+
- DACVAE decode ONNX / external data / MIGraphX cache for 1, 2, 4, 8, 12, 16, 24, and 30 second buckets
|
| 25 |
+
|
| 26 |
+
The runtime request path uses the precompiled `.mxr` files. The `.onnx` and `.onnx.data` files are included as the source artifacts from which the MIGraphX cache is generated.
|
| 27 |
+
|
| 28 |
+
## Download
|
| 29 |
+
|
| 30 |
+
```bash
|
| 31 |
+
huggingface-cli download yoshou/irodori_tts_cpp_artifacts \
|
| 32 |
+
--local-dir artifacts/irodori-500m-v2-voicedesign-test
|
| 33 |
+
```
|
| 34 |
+
|
| 35 |
+
## License
|
| 36 |
+
|
| 37 |
+
The exported Irodori-TTS VoiceDesign artifacts are distributed under the MIT License, following the upstream model license.
|
| 38 |
+
|
| 39 |
+
This repository also includes tokenizer files derived from `llm-jp/llm-jp-3-150m`, which is licensed under the Apache License 2.0. See `NOTICE` for attribution details.
|
| 40 |
+
|
| 41 |
+
Users must also follow the ethical restrictions described in the upstream Irodori-TTS VoiceDesign model card, including no impersonation and no misleading synthetic speech.
|
| 42 |
+
|
| 43 |
+
## Upstream
|
| 44 |
+
|
| 45 |
+
- https://huggingface.co/Aratako/Irodori-TTS-500M-v2-VoiceDesign
|
| 46 |
+
- https://github.com/Aratako/Irodori-TTS
|
| 47 |
+
- https://huggingface.co/llm-jp/llm-jp-3-150m
|
dacvae_decode_12s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2277424ab65a8c44849dadef3df03e03524263b511e31c7916b7853eae42ffe5
|
| 3 |
+
size 584726
|
dacvae_decode_12s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6d16ab4fc33fb77504dfdccc5429f8796aefb30e1442d2d075d3afaf7909154
|
| 3 |
+
size 261357568
|
dacvae_decode_16s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0793b233b4e89764ee8ad0f5d0066fceabfd8837f615db5462222869878415b9
|
| 3 |
+
size 584726
|
dacvae_decode_16s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6d16ab4fc33fb77504dfdccc5429f8796aefb30e1442d2d075d3afaf7909154
|
| 3 |
+
size 261357568
|
dacvae_decode_1s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f439006695262ca8c37c5b8344a486ed0c46a3b41629a59384972d98a572fe4
|
| 3 |
+
size 573944
|
dacvae_decode_1s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8ae26c9f84714fd443db894d835bdab675edea12963071f5c5c1b503b3e02de
|
| 3 |
+
size 267976704
|
dacvae_decode_24s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2214774fe9492c19532a24154205e13380ac9b34d18e5055d2ffac21cea51ecb
|
| 3 |
+
size 584726
|
dacvae_decode_24s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6d16ab4fc33fb77504dfdccc5429f8796aefb30e1442d2d075d3afaf7909154
|
| 3 |
+
size 261357568
|
dacvae_decode_2s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64d6cf4c76f3710ff352143f5e8eff65686418aada6f9970ba09604c6e33b60b
|
| 3 |
+
size 574594
|
dacvae_decode_2s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:955930a3b877d80cc8bf3757405fcd2493395c00acf8dda78bda59073f7502dd
|
| 3 |
+
size 261685248
|
dacvae_decode_30s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8cc21c3e21525ce84001ec94d880e2775317380ceff3495f0576ede7a0cbb11e
|
| 3 |
+
size 584726
|
dacvae_decode_30s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6d16ab4fc33fb77504dfdccc5429f8796aefb30e1442d2d075d3afaf7909154
|
| 3 |
+
size 261357568
|
dacvae_decode_4s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4838c40e999881ea72a5b0183d1bbbfcd91035a9aa6aa5dc2858b70c3919fe40
|
| 3 |
+
size 574594
|
dacvae_decode_4s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68a2bcb78b347f3b3690c4f7f47bb2b6eaa37b300c4c91fd34627b7ccfbc92f2
|
| 3 |
+
size 261947392
|
dacvae_decode_8s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0597c7296cae06f252b9ef0f8b9831313fe037dbe6445182d13f820155754ed
|
| 3 |
+
size 584628
|
dacvae_decode_8s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6d16ab4fc33fb77504dfdccc5429f8796aefb30e1442d2d075d3afaf7909154
|
| 3 |
+
size 261357568
|
manifest.json
ADDED
|
@@ -0,0 +1,158 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint": "/home/ubuntu/.cache/huggingface/hub/models--Aratako--Irodori-TTS-500M-v2-VoiceDesign/snapshots/456e55708e7183f5c7faa1448209d54aa8991451/model.safetensors",
|
| 4 |
+
"opset_version": 18,
|
| 5 |
+
"model": {
|
| 6 |
+
"latent_dim": 32,
|
| 7 |
+
"latent_patch_size": 1,
|
| 8 |
+
"patched_latent_dim": 32,
|
| 9 |
+
"use_speaker_condition": false,
|
| 10 |
+
"use_caption_condition": true
|
| 11 |
+
},
|
| 12 |
+
"tokenizers": {
|
| 13 |
+
"text_repo": "llm-jp/llm-jp-3-150m",
|
| 14 |
+
"text_add_bos": true,
|
| 15 |
+
"caption_repo": "llm-jp/llm-jp-3-150m",
|
| 16 |
+
"caption_add_bos": true
|
| 17 |
+
},
|
| 18 |
+
"rfdit": {
|
| 19 |
+
"context_path": "rfdit_context_fp32_30s.onnx",
|
| 20 |
+
"step_path": "rfdit_step_fp32_30s.onnx",
|
| 21 |
+
"text_len": 256,
|
| 22 |
+
"caption_len": 512,
|
| 23 |
+
"ref_steps": 64,
|
| 24 |
+
"ref_dim": 32,
|
| 25 |
+
"max_patched_steps": 750,
|
| 26 |
+
"has_speaker": false,
|
| 27 |
+
"has_caption": true,
|
| 28 |
+
"step_buckets": {
|
| 29 |
+
"1": {
|
| 30 |
+
"step_path": "rfdit_step_fp32_1s.onnx",
|
| 31 |
+
"seconds": 1.0,
|
| 32 |
+
"latent_steps": 25,
|
| 33 |
+
"max_patched_steps": 25,
|
| 34 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_1s.mxr"
|
| 35 |
+
},
|
| 36 |
+
"2": {
|
| 37 |
+
"step_path": "rfdit_step_fp32_2s.onnx",
|
| 38 |
+
"seconds": 2.0,
|
| 39 |
+
"latent_steps": 50,
|
| 40 |
+
"max_patched_steps": 50,
|
| 41 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_2s.mxr"
|
| 42 |
+
},
|
| 43 |
+
"4": {
|
| 44 |
+
"step_path": "rfdit_step_fp32_4s.onnx",
|
| 45 |
+
"seconds": 4.0,
|
| 46 |
+
"latent_steps": 100,
|
| 47 |
+
"max_patched_steps": 100,
|
| 48 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_4s.mxr"
|
| 49 |
+
},
|
| 50 |
+
"8": {
|
| 51 |
+
"step_path": "rfdit_step_fp32_8s.onnx",
|
| 52 |
+
"seconds": 8.0,
|
| 53 |
+
"latent_steps": 200,
|
| 54 |
+
"max_patched_steps": 200,
|
| 55 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_8s.mxr"
|
| 56 |
+
},
|
| 57 |
+
"12": {
|
| 58 |
+
"step_path": "rfdit_step_fp32_12s.onnx",
|
| 59 |
+
"seconds": 12.0,
|
| 60 |
+
"latent_steps": 300,
|
| 61 |
+
"max_patched_steps": 300,
|
| 62 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_12s.mxr"
|
| 63 |
+
},
|
| 64 |
+
"16": {
|
| 65 |
+
"step_path": "rfdit_step_fp32_16s.onnx",
|
| 66 |
+
"seconds": 16.0,
|
| 67 |
+
"latent_steps": 400,
|
| 68 |
+
"max_patched_steps": 400,
|
| 69 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_16s.mxr"
|
| 70 |
+
},
|
| 71 |
+
"24": {
|
| 72 |
+
"step_path": "rfdit_step_fp32_24s.onnx",
|
| 73 |
+
"seconds": 24.0,
|
| 74 |
+
"latent_steps": 600,
|
| 75 |
+
"max_patched_steps": 600,
|
| 76 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_24s.mxr"
|
| 77 |
+
},
|
| 78 |
+
"30": {
|
| 79 |
+
"step_path": "rfdit_step_fp32_30s.onnx",
|
| 80 |
+
"seconds": 30.0,
|
| 81 |
+
"latent_steps": 750,
|
| 82 |
+
"max_patched_steps": 750,
|
| 83 |
+
"step_migraphx_path": "migraphx/rfdit_step_fp32_30s.mxr"
|
| 84 |
+
}
|
| 85 |
+
},
|
| 86 |
+
"context_migraphx_path": "migraphx/rfdit_context_fp32_30s.mxr"
|
| 87 |
+
},
|
| 88 |
+
"dacvae": {
|
| 89 |
+
"sample_rate": 48000,
|
| 90 |
+
"hop_length": 1920,
|
| 91 |
+
"buckets": {
|
| 92 |
+
"1": {
|
| 93 |
+
"path": "dacvae_decode_1s.onnx",
|
| 94 |
+
"seconds": 1.0,
|
| 95 |
+
"latent_steps": 25,
|
| 96 |
+
"patched_steps": 25,
|
| 97 |
+
"samples": 48000,
|
| 98 |
+
"migraphx_path": "migraphx/dacvae_decode_1s.mxr"
|
| 99 |
+
},
|
| 100 |
+
"2": {
|
| 101 |
+
"path": "dacvae_decode_2s.onnx",
|
| 102 |
+
"seconds": 2.0,
|
| 103 |
+
"latent_steps": 50,
|
| 104 |
+
"patched_steps": 50,
|
| 105 |
+
"samples": 96000,
|
| 106 |
+
"migraphx_path": "migraphx/dacvae_decode_2s.mxr"
|
| 107 |
+
},
|
| 108 |
+
"4": {
|
| 109 |
+
"path": "dacvae_decode_4s.onnx",
|
| 110 |
+
"seconds": 4.0,
|
| 111 |
+
"latent_steps": 100,
|
| 112 |
+
"patched_steps": 100,
|
| 113 |
+
"samples": 192000,
|
| 114 |
+
"migraphx_path": "migraphx/dacvae_decode_4s.mxr"
|
| 115 |
+
},
|
| 116 |
+
"8": {
|
| 117 |
+
"path": "dacvae_decode_8s.onnx",
|
| 118 |
+
"seconds": 8.0,
|
| 119 |
+
"latent_steps": 200,
|
| 120 |
+
"patched_steps": 200,
|
| 121 |
+
"samples": 384000,
|
| 122 |
+
"migraphx_path": "migraphx/dacvae_decode_8s.mxr"
|
| 123 |
+
},
|
| 124 |
+
"12": {
|
| 125 |
+
"path": "dacvae_decode_12s.onnx",
|
| 126 |
+
"seconds": 12.0,
|
| 127 |
+
"latent_steps": 300,
|
| 128 |
+
"patched_steps": 300,
|
| 129 |
+
"samples": 576000,
|
| 130 |
+
"migraphx_path": "migraphx/dacvae_decode_12s.mxr"
|
| 131 |
+
},
|
| 132 |
+
"16": {
|
| 133 |
+
"path": "dacvae_decode_16s.onnx",
|
| 134 |
+
"seconds": 16.0,
|
| 135 |
+
"latent_steps": 400,
|
| 136 |
+
"patched_steps": 400,
|
| 137 |
+
"samples": 768000,
|
| 138 |
+
"migraphx_path": "migraphx/dacvae_decode_16s.mxr"
|
| 139 |
+
},
|
| 140 |
+
"24": {
|
| 141 |
+
"path": "dacvae_decode_24s.onnx",
|
| 142 |
+
"seconds": 24.0,
|
| 143 |
+
"latent_steps": 600,
|
| 144 |
+
"patched_steps": 600,
|
| 145 |
+
"samples": 1152000,
|
| 146 |
+
"migraphx_path": "migraphx/dacvae_decode_24s.mxr"
|
| 147 |
+
},
|
| 148 |
+
"30": {
|
| 149 |
+
"path": "dacvae_decode_30s.onnx",
|
| 150 |
+
"seconds": 30.0,
|
| 151 |
+
"latent_steps": 750,
|
| 152 |
+
"patched_steps": 750,
|
| 153 |
+
"samples": 1440000,
|
| 154 |
+
"migraphx_path": "migraphx/dacvae_decode_30s.mxr"
|
| 155 |
+
}
|
| 156 |
+
}
|
| 157 |
+
}
|
| 158 |
+
}
|
migraphx/dacvae_decode_24s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a090aaf6fd9acbef0722c50720382e384eaa48c5852837ef2805925cd16f80b
|
| 3 |
+
size 269536735
|
migraphx/dacvae_decode_2s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4683c1a8d21f8087a54646b18e0e08d98dfaaf9a73395888ae407b86f8fa7824
|
| 3 |
+
size 262704001
|
migraphx/dacvae_decode_30s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acb446b45c52c306890db5517c0e21d46ccdffd44713ccb78af94185d9862891
|
| 3 |
+
size 271418399
|
migraphx/dacvae_decode_4s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c896707868ebe6609baa7d177ee5941301441c63adb40f4295d3ef776cedd42
|
| 3 |
+
size 263365819
|
migraphx/dacvae_decode_8s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30fe8f7c335a85422172b8f26ed7d9022c079b77719c909f6d5c911c18f0e7c3
|
| 3 |
+
size 264657688
|
migraphx/rfdit_context_fp32_30s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:685199e2b208bbe346c71b7a43338a5101ff52ef11aa24c5433426f70a198f7e
|
| 3 |
+
size 680447917
|
migraphx/rfdit_step_fp32_1s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fba4bd1801cf24bf06f4b7b243ce44fe08ec2be5a8a83769a0ed7b02cebab024
|
| 3 |
+
size 1372331871
|
migraphx/rfdit_step_fp32_24s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:145b21065042c83acad8f7391ac6969d238b619a0700115061c4d063b76e3359
|
| 3 |
+
size 1373225385
|
migraphx/rfdit_step_fp32_2s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8beb2050f3f820d0be8636c9565089e35f4b28f9d8e58d550b9a99f05f61d06
|
| 3 |
+
size 1372165100
|
migraphx/rfdit_step_fp32_30s.mxr
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb87cd96412515a2afc75aaf7a5759a8509bebabe2506014a19f4b1ad3eda0bf
|
| 3 |
+
size 1372972583
|
rfdit_context_fp32_30s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d028976b958adeee2bfece9836542089d72b59c64f61dab1f8b2c62ff2329aef
|
| 3 |
+
size 3051434
|
rfdit_context_fp32_30s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef213503d615f1075107c9b9b2771bc5d06ed7505dab5afc7cddc2154e1da42e
|
| 3 |
+
size 678211584
|
rfdit_step_fp32_12s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:34abe6281b839874ba8e734f42cae24512c93916e0ef978d551f6493c1f7ffcd
|
| 3 |
+
size 2584321
|
rfdit_step_fp32_12s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c00d3b370d8858659620611c86c1db80e0d62c6f32c85661b4b51fe5a9e6d31d
|
| 3 |
+
size 1369833472
|
rfdit_step_fp32_16s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:230f6de542767a18332a20198e96c425ece31142f8aa4a02b1256aaaa085cd67
|
| 3 |
+
size 2584321
|
rfdit_step_fp32_16s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:935e447d8f54ab0406349024d73792e1c830168730d0ac14cb4f17888f82ea6f
|
| 3 |
+
size 1369833472
|
rfdit_step_fp32_1s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0333c06a735242f1ec2da9db8061fc209891bd38e4e04b56d8f88cdc17c90a6f
|
| 3 |
+
size 2576960
|
rfdit_step_fp32_1s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:167048cbc8ac56381c16569756632fee6c5d4294c12ba30d7ffca21526b92ccc
|
| 3 |
+
size 1369767936
|
rfdit_step_fp32_24s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f3eb9f311729a1fa0016c694ed49fc07687ce2b57f1fd483f5b358246eb51c3
|
| 3 |
+
size 2584321
|
rfdit_step_fp32_24s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6aaea3ed92d0073e69621750d1cc78aa238782c135f95746a3844e842054bd1d
|
| 3 |
+
size 1369833472
|
rfdit_step_fp32_2s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:791b0f85eae72855d0c432afc822679a67bc95b6dceba43e8eb1a0be5bc9a290
|
| 3 |
+
size 2610261
|
rfdit_step_fp32_2s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da74b749d04502615ce51efd8a7d7b0c5c25c0ceda570cd96d88d3497bc1dd4e
|
| 3 |
+
size 1370095616
|
rfdit_step_fp32_30s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fea59bfe3f82714144be154d5b9f7bc3aff56897721cf0a1c935ae3ef0126729
|
| 3 |
+
size 2584321
|
rfdit_step_fp32_30s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcca50ec4d088135677feb491dffe417d99469e22b7ef493dd5a20c957ff20cd
|
| 3 |
+
size 1369899008
|
rfdit_step_fp32_4s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ad1065ffa3d21f1d31fe2fd6ca6a415694790b8e03ea413fe2214049e9a1ee39
|
| 3 |
+
size 2610423
|
rfdit_step_fp32_4s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4a32061e2b0b6b22acac97e37425657785cce3e0d6a53eb77a8a86187f42ca2
|
| 3 |
+
size 1370423296
|
rfdit_step_fp32_8s.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9d4b2e36b6826fd2b1571bf264a335ded7403b444cbdd5166c1f90be767a810
|
| 3 |
+
size 2580842
|
rfdit_step_fp32_8s.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fef4078abae1973e0b626ca8c953d5ef61778f3df585f9c644d399ba0bc594c9
|
| 3 |
+
size 1369833472
|
tokenizer/llm-jp-3-150m/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|