dia, dia-gguf, mmwillet2 (TTS.cpp)
Browse files- .gitattributes +17 -0
- dia-gguf/.gitattributes +42 -0
- dia-gguf/README.md +30 -0
- dia-gguf/audio1.wav +3 -0
- dia-gguf/audio2.wav +3 -0
- dia-gguf/dia-1.6b-f16.gguf +3 -0
- dia-gguf/dia-1.6b-f32.gguf +3 -0
- dia-gguf/dia-1.6b-q2_k.gguf +3 -0
- dia-gguf/dia-1.6b-q4_0.gguf +3 -0
- dia-gguf/dia-1.6b-q6_k.gguf +3 -0
- dia-gguf/dia_1.6b_fp16.safetensors +3 -0
- dia-gguf/dia_1.6b_fp32.safetensors +3 -0
- dia-gguf/dia_1.6b_fp8_e4m3fn.safetensors +3 -0
- mmwillet2/Dia_GGUF/.gitattributes +44 -0
- mmwillet2/Dia_GGUF/Dia.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_F16.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_F16_DAC_F16.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_Q4.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_Q4_DAC_F16.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_Q5.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_Q5_DAC_F16.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_Q8.gguf +3 -0
- mmwillet2/Dia_GGUF/Dia_Q8_DAC_F16.gguf +3 -0
- mmwillet2/Dia_GGUF/README.md +34 -0
- mmwillet2/TTS.cpp.zip +3 -0
- mmwillet2/TTS_ipa_en_us_phonemizer/.gitattributes +36 -0
- mmwillet2/TTS_ipa_en_us_phonemizer/README.md +7 -0
- mmwillet2/TTS_ipa_en_us_phonemizer/tts_en_us_phonemizer.gguf +3 -0
- nari-labs_dia.zip +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,20 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
dia-gguf/audio1.wav filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
dia-gguf/audio2.wav filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
dia-gguf/dia-1.6b-f16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
dia-gguf/dia-1.6b-f32.gguf filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
dia-gguf/dia-1.6b-q2_k.gguf filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
dia-gguf/dia-1.6b-q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
dia-gguf/dia-1.6b-q6_k.gguf filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
mmwillet2/Dia_GGUF/Dia_F16_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
mmwillet2/Dia_GGUF/Dia_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
mmwillet2/Dia_GGUF/Dia_Q4_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
mmwillet2/Dia_GGUF/Dia_Q4.gguf filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
mmwillet2/Dia_GGUF/Dia_Q5_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
mmwillet2/Dia_GGUF/Dia_Q5.gguf filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
mmwillet2/Dia_GGUF/Dia_Q8_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
mmwillet2/Dia_GGUF/Dia_Q8.gguf filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
mmwillet2/Dia_GGUF/Dia.gguf filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
mmwillet2/TTS_ipa_en_us_phonemizer/tts_en_us_phonemizer.gguf filter=lfs diff=lfs merge=lfs -text
|
dia-gguf/.gitattributes
ADDED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
dia-1.6b-f16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
dia-1.6b-f32.gguf filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
dia-1.6b-q2_k.gguf filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
dia-1.6b-q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
dia-1.6b-q6_k.gguf filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
samples/audio1.wav filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
samples/audio2.wav filter=lfs diff=lfs merge=lfs -text
|
dia-gguf/README.md
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: apache-2.0
|
| 3 |
+
language:
|
| 4 |
+
- en
|
| 5 |
+
base_model:
|
| 6 |
+
- nari-labs/Dia-1.6B
|
| 7 |
+
pipeline_tag: text-to-speech
|
| 8 |
+
tags:
|
| 9 |
+
- gguf-connector
|
| 10 |
+
---
|
| 11 |
+
## gguf quantized and fp8/16/32 scaled dia-1.6b
|
| 12 |
+
- base model from [nari-labs](https://huggingface.co/nari-labs)
|
| 13 |
+
- text-to-speech synthesis
|
| 14 |
+
|
| 15 |
+
### **run it with gguf-connector**
|
| 16 |
+
```
|
| 17 |
+
ggc s2
|
| 18 |
+
```
|
| 19 |
+
|
| 20 |
+

|
| 21 |
+
|
| 22 |
+
| Prompt | Audio Sample |
|
| 23 |
+
|--------|---------------|
|
| 24 |
+
|`[S1] This is an open weights text to dialogue model.`<br/>`[S2] You get full control over scripts and voices.`<br/>`[S1] Wow. Amazing. (laughs)`<br/>`[S2] Try it now on Git hub or Hugging Face.`<br/> | 🎧 **dia-sample-1**<br><audio controls src="https://huggingface.co/calcuis/dia-gguf/resolve/main/samples%5Caudio1.wav"></audio> |
|
| 25 |
+
|`[S1] Hey Connector, why your appearance looks so stupid?`<br/>`[S2] Oh, really? maybe I ate too much smart beans.`<br/>`[S1] Wow. Amazing. (laughs)`<br/>`[S2] Let's go to get some more smart beans and you will become stupid as well.`<br/> | 🎧 **dia-sample-2**<br><audio controls src="https://huggingface.co/calcuis/dia-gguf/resolve/main/samples%5Caudio2.wav"></audio> |
|
| 26 |
+
|
| 27 |
+
### **review/reference**
|
| 28 |
+
- simply execute the command (`ggc s2`) above in console/terminal
|
| 29 |
+
- note: model file(s) will be pulled to the local cache automatically during the first launch; after that, you can opt to run it entirely offline, i.e., from the local URL http://127.0.0.1:7860 with the lazy webui
|
| 30 |
+
- gguf-connector ([pypi](https://pypi.org/project/gguf-connector))
|
dia-gguf/audio1.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ded7776a1ced891b3f770df1996b239328894720c1539e3e15ccf1ba10a544c4
|
| 3 |
+
size 788740
|
dia-gguf/audio2.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9cc67e0363c42ca61968f63ce968de4a41223bc2853a7e57dacfde7636a8277b
|
| 3 |
+
size 731004
|
dia-gguf/dia-1.6b-f16.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa9ef3bb253ac293ed8af84acde09e747fc5ed8ee21f9aafff96e905f91bd3bd
|
| 3 |
+
size 3222626560
|
dia-gguf/dia-1.6b-f32.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a77c7061a98c6bf54d21446f4e8020d9c7a5920d1b437017aedee128082e9ffd
|
| 3 |
+
size 6444671232
|
dia-gguf/dia-1.6b-q2_k.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9cdec4a5ee4d8ec8bb47db2bffb28e5388c2015cf2924fdebd68629bd6d51539
|
| 3 |
+
size 640503680
|
dia-gguf/dia-1.6b-q4_0.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:83d33f28e4693632f89c291e17328ccce79af067f5b3e2054d866ddfc6508d4f
|
| 3 |
+
size 906777344
|
dia-gguf/dia-1.6b-q6_k.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32fdb74d0e7f5e2f07996c782b67ba9b9ea2e9186fb565ce6283fbdbaf4bac82
|
| 3 |
+
size 1426756928
|
dia-gguf/dia_1.6b_fp16.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40ba0e38590ff2a9238c55906ab3441c7dbc7de68f0c349e504f44e235115700
|
| 3 |
+
size 3222363176
|
dia-gguf/dia_1.6b_fp32.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:caba289b60f6d7d1e58fc744f4dc25aae88995fcca46be3d05e220b971486a26
|
| 3 |
+
size 6444682848
|
dia-gguf/dia_1.6b_fp8_e4m3fn.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82eda6cfdb23bdfba59782ee56cc7f166f16b696c316148cacc9a21d686cc6d7
|
| 3 |
+
size 1611202200
|
mmwillet2/Dia_GGUF/.gitattributes
ADDED
|
@@ -0,0 +1,44 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
Dia.gguf filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
Dia_Q4.gguf filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
Dia_Q5.gguf filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
Dia_Q8.gguf filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
Dia_Q4_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
Dia_Q5_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
Dia_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
Dia_Q8_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
Dia_F16_DAC_F16.gguf filter=lfs diff=lfs merge=lfs -text
|
mmwillet2/Dia_GGUF/Dia.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72fe442f5e542ec8c7ec45f105767871db7fc283291ec9450055279742671c61
|
| 3 |
+
size 6661671616
|
mmwillet2/Dia_GGUF/Dia_F16.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0bd10ec97f10b076a48aaff5e5b8c386d09048ef0285cbd48ca87936d02c7f39
|
| 3 |
+
size 3477522944
|
mmwillet2/Dia_GGUF/Dia_F16_DAC_F16.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a9f88ca6cb56c5f7151066466f96531f9562a92d7d5b2a17791dc67029070dc
|
| 3 |
+
size 3369092288
|
mmwillet2/Dia_GGUF/Dia_Q4.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4258bd64aed0dea80898872dad04c12be321661c2f134e0f52fd179068c35020
|
| 3 |
+
size 1188916224
|
mmwillet2/Dia_GGUF/Dia_Q4_DAC_F16.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3a659212643abb0681c80178a9193ae4b4e3b9f8d9059824769abf465b9e455
|
| 3 |
+
size 1080485568
|
mmwillet2/Dia_GGUF/Dia_Q5.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06030a54aaa284f817ffb2403ac048c9f82809678fa0b204490a0f77cd16a482
|
| 3 |
+
size 1387925504
|
mmwillet2/Dia_GGUF/Dia_Q5_DAC_F16.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72065a8b66c3d9153e3906aa6d0879354bab6fbfb9f733c1ea3b504ccd3ba9f9
|
| 3 |
+
size 1279494848
|
mmwillet2/Dia_GGUF/Dia_Q8.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d171c32c96cfc876ab393e327370129536b0ef7e1c6eb44b2a49226e6c952e5
|
| 3 |
+
size 1984953344
|
mmwillet2/Dia_GGUF/Dia_Q8_DAC_F16.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d07a306f0153f8da04b14197a37bd65bf32ea0e00b3cb3239ba2e9aef5b932c
|
| 3 |
+
size 1876522688
|
mmwillet2/Dia_GGUF/README.md
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: mit
|
| 3 |
+
base_model:
|
| 4 |
+
- nari-labs/Dia-1.6B
|
| 5 |
+
pipeline_tag: text-to-speech
|
| 6 |
+
---
|
| 7 |
+
## Purpose
|
| 8 |
+
|
| 9 |
+
The purpose of this repository is to store various [TTS.cpp](https://github.com/mmwillet/TTS.cpp) compatible GGUF encoded model files for the [Dia model](https://github.com/nari-labs/dia).
|
| 10 |
+
|
| 11 |
+
### Model Types
|
| 12 |
+
|
| 13 |
+
Currently the model is supported with 4-bit, 5-bit, 8-bit, F16 and F32 quantization / precision, and all modes are supported with an F16 or F32 precision DAC. `Dia.gguf` is the non-quantized 32-bit floating point version; `Dia_Q4.gguf`, `Dia_Q5.gguf`, `Dia_Q8.gguf` and `Dia_F16.gguf` are the 4-bit, 5-bit, 8-bit and 16-bit quantized versions respectively; and all versions with the suffix `_DAC_F16.gguf` are encoded with a 16-bit version of the DAC audio encoder.
|
| 14 |
+
|
| 15 |
+
## Dia
|
| 16 |
+
|
| 17 |
+
This page only contains the GGUF encoded model files of the original Dia model. For the original model please see the repository [here](https://github.com/nari-labs/dia).
|
| 18 |
+
|
| 19 |
+
## How to use
|
| 20 |
+
|
| 21 |
+
See the GitHub repo [here](https://github.com/mmwillet/TTS.cpp) for more information on general usage.
|
| 22 |
+
|
| 23 |
+
To compile TTS.cpp, simply git clone the repository and then run the following in the repository's directory (cmake is required):
|
| 24 |
+
|
| 25 |
+
```bash
|
| 26 |
+
cmake -B build
|
| 27 |
+
cmake --build build --config Release
|
| 28 |
+
```
|
| 29 |
+
|
| 30 |
+
After compilation is complete, you can download a model file and generate speech to a file from the same directory like so:
|
| 31 |
+
|
| 32 |
+
```bash
|
| 33 |
+
build/bin/cli --model-path /model/path/to/downloaded_gguf_file.gguf --prompt "I am saying some words" --save-path /tmp/test.wav
|
| 34 |
+
```
|
mmwillet2/TTS.cpp.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e5874af39a085f7dd2cdccb5b939057e9fba017781ed95051cab8a0b234ba72
|
| 3 |
+
size 47033811
|
mmwillet2/TTS_ipa_en_us_phonemizer/.gitattributes
ADDED
|
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
tts_en_us_phonemizer.gguf filter=lfs diff=lfs merge=lfs -text
|
mmwillet2/TTS_ipa_en_us_phonemizer/README.md
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: mit
|
| 3 |
+
---
|
| 4 |
+
|
| 5 |
+
### Overview
|
| 6 |
+
This repository simply contains the gguf file for the standard [TTS.cpp](https://github.com/mmwillet/TTS.cpp) phonemizer.
|
| 7 |
+
Please direct concerns and questions to the GitHub repository linked above.
|
mmwillet2/TTS_ipa_en_us_phonemizer/tts_en_us_phonemizer.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6d141f44e55ef2ffe1b775de827e88b9e87add6405caf7ee9fe444b11c9d0a0
|
| 3 |
+
size 31743045
|
nari-labs_dia.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d36fb197c75827254629d71d5a276ee8daf48ceabcbca3674cbd057d37b9266
|
| 3 |
+
size 1164320
|