majentik committed on
Commit
f818655
·
verified ·
1 Parent(s): ba8ef4c

Re-upload with properly quantized decoder (encoder/adaptor bf16)

Browse files
adaptor.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af63eb1c572ab11a30d86dacd012987a44db6250d10e05b4a63462930d292996
3
- size 67917220
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa531eeb21ba13291d4423dbecb8f5236675fa33ca33a882e38d6e8f3e03d545
3
+ size 127820808
config.json CHANGED
@@ -98,9 +98,5 @@
98
  "vocab_size": 256000
99
  },
100
  "torch_dtype": "bfloat16",
101
- "transformers_version": "4.51.3",
102
- "quantization_config": {
103
- "bits": 8,
104
- "group_size": 64
105
- }
106
  }
 
98
  "vocab_size": 256000
99
  },
100
  "torch_dtype": "bfloat16",
101
+ "transformers_version": "4.51.3"
 
 
 
 
102
  }
decoder-00000.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23440da67726f9f2bf880b1719467892b0dac37df44c0b761c2b8e50de3efa58
3
- size 2238447571
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eca97d08740e4b40d53437a235cce8b7463c36c8d2c40d3906f545b7c2c6587
3
+ size 3098607432
decoder-00001.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b50f3ab2ac54dc39115f3e85990f41390ec831e9ef6930376aab9f6a1586873
3
- size 2277583292
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aa023decb8da2a60377f77ea1b8fb03d807a3cfffd5520ab91978c8e8406dcd
3
+ size 2277583326
decoder-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e408ff583abe1f870b4bb6a0b13596f2ad46ee1cea69b5bb280e058c91ffc30
3
- size 2254172711
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f4f089718fd85cfe39fecadc4540f6556c0b0faf6dc3a8b16a394d502626773
3
+ size 2254172749
decoder-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76366f0f1d1cc134b205df3be6a2c765fc44bb81d0117e5b1870342f62da60a8
3
- size 2261993699
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cfa73afe59e85f3bc1fefe9bbb67d9d6234ed9feaaae9e5695a1f9af642d7cb
3
+ size 2261993703
decoder-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b41cc96eb90a0190b4c43e97728d166b6aa2073368c83dbd9117cb8453f59c35
3
- size 787802682
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b524b11ba3eadf295aec5161f7665210cc659725355701fefc5f528d3f7ff565
3
+ size 787802694
decoder.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff
 
decoder_config.json CHANGED
@@ -28,5 +28,15 @@
28
  "sliding_window_size": 4096,
29
  "torch_dtype": "bfloat16",
30
  "use_cache": true,
31
- "vocab_size": 256000
 
 
 
 
 
 
 
 
 
 
32
  }
 
28
  "sliding_window_size": 4096,
29
  "torch_dtype": "bfloat16",
30
  "use_cache": true,
31
+ "vocab_size": 256000,
32
+ "quantization_config": {
33
+ "group_size": 64,
34
+ "bits": 8,
35
+ "mode": "affine"
36
+ },
37
+ "quantization": {
38
+ "group_size": 64,
39
+ "bits": 8,
40
+ "mode": "affine"
41
+ }
42
  }
encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3a35a8bc1d0f5cade3a28e19d7d87bf24beb2d5aaacd5069f88002f74e50668
3
- size 677334445
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5614998711501c176a882a25c06c22851b80f8d77de4084212f365253d40ee61
3
+ size 1273987800