Re-upload with properly quantized decoder (encoder/adaptor bf16)
Browse files
- adaptor.safetensors +2 -2
- config.json +1 -5
- decoder-00000.safetensors +2 -2
- decoder-00001.safetensors +2 -2
- decoder-00002.safetensors +2 -2
- decoder-00003.safetensors +2 -2
- decoder-00004.safetensors +2 -2
- decoder.safetensors.index.json +0 -0
- decoder_config.json +11 -1
- encoder.safetensors +2 -2
adaptor.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa531eeb21ba13291d4423dbecb8f5236675fa33ca33a882e38d6e8f3e03d545
|
| 3 |
+
size 127820808
|
config.json
CHANGED
|
@@ -98,9 +98,5 @@
|
|
| 98 |
"vocab_size": 256000
|
| 99 |
},
|
| 100 |
"torch_dtype": "bfloat16",
|
| 101 |
-
"transformers_version": "4.51.3",
|
| 102 |
-
"quantization_config": {
|
| 103 |
-
"bits": 8,
|
| 104 |
-
"group_size": 64
|
| 105 |
-
}
|
| 106 |
}
|
|
|
|
| 98 |
"vocab_size": 256000
|
| 99 |
},
|
| 100 |
"torch_dtype": "bfloat16",
|
| 101 |
+
"transformers_version": "4.51.3"
|
|
|
|
|
|
|
|
|
|
|
|
|
| 102 |
}
|
decoder-00000.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2eca97d08740e4b40d53437a235cce8b7463c36c8d2c40d3906f545b7c2c6587
|
| 3 |
+
size 3098607432
|
decoder-00001.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0aa023decb8da2a60377f77ea1b8fb03d807a3cfffd5520ab91978c8e8406dcd
|
| 3 |
+
size 2277583326
|
decoder-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f4f089718fd85cfe39fecadc4540f6556c0b0faf6dc3a8b16a394d502626773
|
| 3 |
+
size 2254172749
|
decoder-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6cfa73afe59e85f3bc1fefe9bbb67d9d6234ed9feaaae9e5695a1f9af642d7cb
|
| 3 |
+
size 2261993703
|
decoder-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b524b11ba3eadf295aec5161f7665210cc659725355701fefc5f528d3f7ff565
|
| 3 |
+
size 787802694
|
decoder.safetensors.index.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoder_config.json
CHANGED
|
@@ -28,5 +28,15 @@
|
|
| 28 |
"sliding_window_size": 4096,
|
| 29 |
"torch_dtype": "bfloat16",
|
| 30 |
"use_cache": true,
|
| 31 |
-
"vocab_size": 256000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 32 |
}
|
|
|
|
| 28 |
"sliding_window_size": 4096,
|
| 29 |
"torch_dtype": "bfloat16",
|
| 30 |
"use_cache": true,
|
| 31 |
+
"vocab_size": 256000,
|
| 32 |
+
"quantization_config": {
|
| 33 |
+
"group_size": 64,
|
| 34 |
+
"bits": 8,
|
| 35 |
+
"mode": "affine"
|
| 36 |
+
},
|
| 37 |
+
"quantization": {
|
| 38 |
+
"group_size": 64,
|
| 39 |
+
"bits": 8,
|
| 40 |
+
"mode": "affine"
|
| 41 |
+
}
|
| 42 |
}
|
encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5614998711501c176a882a25c06c22851b80f8d77de4084212f365253d40ee61
|
| 3 |
+
size 1273987800
|