danielhanchen committed on
Commit
8a96bea
·
1 Parent(s): bcda069

Add files using upload-large-folder tool

Browse files
.gitattributes CHANGED
@@ -33,77 +33,19 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
- BF16/DeepSeek-R1-0528-BF16-00001-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
37
- BF16/DeepSeek-R1-0528-BF16-00025-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
38
- BF16/DeepSeek-R1-0528-BF16-00026-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
39
- BF16/DeepSeek-R1-0528-BF16-00028-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
40
- BF16/DeepSeek-R1-0528-BF16-00030-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
41
- BF16/DeepSeek-R1-0528-BF16-00009-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
42
- BF16/DeepSeek-R1-0528-BF16-00002-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
43
- BF16/DeepSeek-R1-0528-BF16-00005-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
44
- BF16/DeepSeek-R1-0528-BF16-00007-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
45
- BF16/DeepSeek-R1-0528-BF16-00008-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
46
- BF16/DeepSeek-R1-0528-BF16-00006-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
47
- BF16/DeepSeek-R1-0528-BF16-00004-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
48
- BF16/DeepSeek-R1-0528-BF16-00003-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
49
- BF16/DeepSeek-R1-0528-BF16-00010-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
50
- BF16/DeepSeek-R1-0528-BF16-00011-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
51
- BF16/DeepSeek-R1-0528-BF16-00012-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
52
- BF16/DeepSeek-R1-0528-BF16-00013-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
53
- BF16/DeepSeek-R1-0528-BF16-00014-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
54
- BF16/DeepSeek-R1-0528-BF16-00015-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
55
- BF16/DeepSeek-R1-0528-BF16-00017-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
56
- BF16/DeepSeek-R1-0528-BF16-00016-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
57
- BF16/DeepSeek-R1-0528-BF16-00018-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
58
- BF16/DeepSeek-R1-0528-BF16-00019-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
59
- BF16/DeepSeek-R1-0528-BF16-00020-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
60
- BF16/DeepSeek-R1-0528-BF16-00022-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
61
- BF16/DeepSeek-R1-0528-BF16-00021-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
62
- BF16/DeepSeek-R1-0528-BF16-00023-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
63
- BF16/DeepSeek-R1-0528-BF16-00024-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
64
- BF16/DeepSeek-R1-0528-BF16-00027-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
65
- BF16/DeepSeek-R1-0528-BF16-00029-of-00030.gguf filter=lfs diff=lfs merge=lfs -text
66
  Q8_0/DeepSeek-R1-0528-Q8_0-00015-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
67
- Q8_0/DeepSeek-R1-0528-Q8_0-00001-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
68
- Q8_0/DeepSeek-R1-0528-Q8_0-00002-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
69
- Q8_0/DeepSeek-R1-0528-Q8_0-00003-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
70
- Q8_0/DeepSeek-R1-0528-Q8_0-00004-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
71
- Q8_0/DeepSeek-R1-0528-Q8_0-00006-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
72
- Q8_0/DeepSeek-R1-0528-Q8_0-00005-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
73
- Q8_0/DeepSeek-R1-0528-Q8_0-00007-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
74
- Q8_0/DeepSeek-R1-0528-Q8_0-00008-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
75
- Q8_0/DeepSeek-R1-0528-Q8_0-00009-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
76
- Q8_0/DeepSeek-R1-0528-Q8_0-00010-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
77
- Q8_0/DeepSeek-R1-0528-Q8_0-00011-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
78
  Q8_0/DeepSeek-R1-0528-Q8_0-00012-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
79
  Q8_0/DeepSeek-R1-0528-Q8_0-00013-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
80
  Q8_0/DeepSeek-R1-0528-Q8_0-00014-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
81
- UD-Q2_K_XL/DeepSeek-R1-0528-UD-Q2_K_XL-00006-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
82
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00008-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
83
- UD-Q2_K_XL/DeepSeek-R1-0528-UD-Q2_K_XL-00001-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
84
- UD-Q2_K_XL/DeepSeek-R1-0528-UD-Q2_K_XL-00004-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
85
- UD-Q2_K_XL/DeepSeek-R1-0528-UD-Q2_K_XL-00005-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
86
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00001-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
87
- UD-Q2_K_XL/DeepSeek-R1-0528-UD-Q2_K_XL-00002-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
88
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00007-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
89
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00004-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
90
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00005-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
91
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00003-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
92
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00002-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
93
- UD-Q4_K_XL/DeepSeek-R1-0528-UD-Q4_K_XL-00006-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
94
- UD-Q2_K_XL/DeepSeek-R1-0528-UD-Q2_K_XL-00003-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
95
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00009-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
96
- UD-Q3_K_XL/DeepSeek-R1-0528-UD-Q3_K_XL-00006-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
97
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00006-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
98
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00005-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
99
- UD-Q3_K_XL/DeepSeek-R1-0528-UD-Q3_K_XL-00005-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
100
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00004-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
101
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00008-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
102
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00007-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
103
- UD-Q3_K_XL/DeepSeek-R1-0528-UD-Q3_K_XL-00003-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
104
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00003-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
105
- UD-Q3_K_XL/DeepSeek-R1-0528-UD-Q3_K_XL-00004-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
106
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00001-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
107
- Q4_K_M/DeepSeek-R1-0528-Q4_K_M-00002-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
108
- UD-Q3_K_XL/DeepSeek-R1-0528-UD-Q3_K_XL-00002-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
109
- UD-Q3_K_XL/DeepSeek-R1-0528-UD-Q3_K_XL-00001-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ imatrix_unsloth.dat filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  Q8_0/DeepSeek-R1-0528-Q8_0-00015-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
38
  Q8_0/DeepSeek-R1-0528-Q8_0-00012-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
39
  Q8_0/DeepSeek-R1-0528-Q8_0-00013-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
40
  Q8_0/DeepSeek-R1-0528-Q8_0-00014-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
41
+ Q8_0/DeepSeek-R1-0528-Q8_0-00011-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
42
+ Q8_0/DeepSeek-R1-0528-Q8_0-00010-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
43
+ Q8_0/DeepSeek-R1-0528-Q8_0-00009-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
44
+ Q8_0/DeepSeek-R1-0528-Q8_0-00004-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Q8_0/DeepSeek-R1-0528-Q8_0-00008-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Q8_0/DeepSeek-R1-0528-Q8_0-00007-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Q8_0/DeepSeek-R1-0528-Q8_0-00005-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
48
+ Q8_0/DeepSeek-R1-0528-Q8_0-00001-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
49
+ Q8_0/DeepSeek-R1-0528-Q8_0-00002-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
50
+ Q8_0/DeepSeek-R1-0528-Q8_0-00006-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
51
+ Q8_0/DeepSeek-R1-0528-Q8_0-00003-of-00015.gguf filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Q8_0/DeepSeek-R1-0528-Q8_0-00001-of-00015.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98ad5bc96231e74658ed5b7bbcec80e494e952b35d3df85bf07e2994b2c10459
3
- size 47784556032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd337661f0d52c87d9216e3f12744a3ed04943e626ec51591648955ceb90d159
3
+ size 47784556320
config.json CHANGED
@@ -35,6 +35,15 @@
35
  "q_lora_rank": 1536,
36
  "qk_nope_head_dim": 128,
37
  "qk_rope_head_dim": 64,
 
 
 
 
 
 
 
 
 
38
  "rms_norm_eps": 1e-06,
39
  "rope_scaling": {
40
  "beta_fast": 32,
 
35
  "q_lora_rank": 1536,
36
  "qk_nope_head_dim": 128,
37
  "qk_rope_head_dim": 64,
38
+ "quantization_config": {
39
+ "activation_scheme": "dynamic",
40
+ "fmt": "e4m3",
41
+ "quant_method": "fp8",
42
+ "weight_block_size": [
43
+ 128,
44
+ 128
45
+ ]
46
+ },
47
  "rms_norm_eps": 1e-06,
48
  "rope_scaling": {
49
  "beta_fast": 32,