Devbora29 committed on
Commit
5860a8b
·
verified ·
1 Parent(s): 96cb6b1

Upload folder using huggingface_hub

Browse files
chat_template.jinja ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
{#-
  Chat template: renders `messages` (and optional `tools`) into one prompt
  string built from [INST], [AVAILABLE_TOOLS], [TOOL_CALLS] and [TOOL_RESULTS]
  markers.

  Names read from the rendering context: messages, tools (optional),
  bos_token, eos_token, raise_exception.

  Every tag below uses left whitespace control, so the indentation and the
  comments in this file never reach the rendered output.
#}

{#- Split off an optional leading system message; the rest is the dialogue. #}
{%- if messages[0]["role"] == "system" %}
    {%- set system_message = messages[0]["content"] %}
    {%- set loop_messages = messages[1:] %}
{%- else %}
    {%- set loop_messages = messages %}
{%- endif %}

{#- Normalise a missing `tools` variable to none so later checks are uniform. #}
{%- if not tools is defined %}
    {%- set tools = none %}
{%- endif %}

{#- Used to find the last user turn, which carries the tools and system prompt. #}
{%- set user_messages = loop_messages | selectattr("role", "equalto", "user") | list %}

{#- This block checks for alternating user/assistant messages, skipping tool calling messages #}
{%- set ns = namespace() %}
{%- set ns.index = 0 %}
{%- for message in loop_messages %}
    {%- if not (message.role == "tool" or message.role == "tool_results" or (message.tool_calls is defined and message.tool_calls is not none)) %}
        {#- Even positions must be user turns, odd positions must not be. #}
        {%- if (message["role"] == "user") != (ns.index % 2 == 0) %}
            {{- raise_exception("After the optional system message, conversation roles must alternate user/assistant/user/assistant/...") }}
        {%- endif %}
        {%- set ns.index = ns.index + 1 %}
    {%- endif %}
{%- endfor %}

{{- bos_token }}
{%- for message in loop_messages %}
    {%- if message["role"] == "user" %}
        {#-
          Tool definitions are emitted once, immediately before the last user
          turn. The comparison is by equality, so an earlier user message that
          is identical to the last one matches as well.
        #}
        {%- if tools is not none and (message == user_messages[-1]) %}
            {{- "[AVAILABLE_TOOLS] [" }}
            {%- for tool in tools %}
                {%- set tool = tool.function %}
                {{- '{"type": "function", "function": {' }}
                {#-
                  The "return" key is skipped. String values are wrapped in
                  quotes by concatenation without JSON escaping; everything
                  else goes through tojson.
                  NOTE(review): a string value containing a double quote or a
                  backslash yields malformed JSON here; confirm whether tool
                  descriptions can contain such characters.
                #}
                {%- for key, val in tool.items() if key != "return" %}
                    {%- if val is string %}
                        {{- '"' + key + '": "' + val + '"' }}
                    {%- else %}
                        {{- '"' + key + '": ' + val|tojson }}
                    {%- endif %}
                    {%- if not loop.last %}
                        {{- ", " }}
                    {%- endif %}
                {%- endfor %}
                {{- "}}" }}
                {%- if not loop.last %}
                    {{- ", " }}
                {%- else %}
                    {{- "]" }}
                {%- endif %}
            {%- endfor %}
            {{- "[/AVAILABLE_TOOLS]" }}
        {%- endif %}
        {#-
          The system prompt is prepended to the last user turn. This is keyed
          on the last user message rather than on loop.last: when the
          conversation ends with a tool call, a tool result or an assistant
          reply, no user message is the final loop item, and a loop.last test
          would silently drop the system prompt. The selector is the same one
          used for the tools block above.
        #}
        {%- if (message == user_messages[-1]) and system_message is defined %}
            {{- "[INST] " + system_message + "\n\n" + message["content"] + "[/INST]" }}
        {%- else %}
            {{- "[INST] " + message["content"] + "[/INST]" }}
        {%- endif %}
    {%- elif message.tool_calls is defined and message.tool_calls is not none %}
        {#- Any message carrying tool_calls is rendered as a tool-call list. #}
        {{- "[TOOL_CALLS] [" }}
        {%- for tool_call in message.tool_calls %}
            {#- Serialise the function object, then drop its closing brace so the id can be appended. #}
            {%- set out = tool_call.function|tojson %}
            {{- out[:-1] }}
            {#- Only presence and length are checked; the alphanumeric part of the message is not enforced here. #}
            {%- if not tool_call.id is defined or tool_call.id|length != 9 %}
                {{- raise_exception("Tool call IDs should be alphanumeric strings with length 9!") }}
            {%- endif %}
            {{- ', "id": "' + tool_call.id + '"}' }}
            {%- if not loop.last %}
                {{- ", " }}
            {%- else %}
                {{- "]" + eos_token }}
            {%- endif %}
        {%- endfor %}
    {%- elif message["role"] == "assistant" %}
        {#- Plain assistant reply: leading space, trimmed content, then the end-of-sequence token. #}
        {{- " " + message["content"]|trim + eos_token}}
    {%- elif message["role"] == "tool_results" or message["role"] == "tool" %}
        {#- Accept either a nested content.content value or a direct content value. #}
        {%- if message.content is defined and message.content.content is defined %}
            {%- set content = message.content.content %}
        {%- else %}
            {%- set content = message.content %}
        {%- endif %}
        {#- The content is inserted via the string filter, without added quotes or escaping. #}
        {{- '[TOOL_RESULTS] {"content": ' + content|string + ", " }}
        {%- if not message.tool_call_id is defined or message.tool_call_id|length != 9 %}
            {{- raise_exception("Tool call IDs should be alphanumeric strings with length 9!") }}
        {%- endif %}
        {{- '"call_id": "' + message.tool_call_id + '"}[/TOOL_RESULTS]' }}
    {%- else %}
        {{- raise_exception("Only user and assistant roles are supported, with the exception of an initial optional system message!") }}
    {%- endif %}
{%- endfor %}
config.json ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MistralForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 1,
7
+ "dtype": "bfloat16",
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mistral",
16
+ "num_attention_heads": 32,
17
+ "num_hidden_layers": 32,
18
+ "num_key_value_heads": 8,
19
+ "pad_token_id": 0,
20
+ "quantization_config": {
21
+ "bits": 4,
22
+ "checkpoint_format": "gptq",
23
+ "desc_act": false,
24
+ "format": "gptq",
25
+ "group_size": 128,
26
+ "lm_head": false,
27
+ "meta": {
28
+ "act_group_aware": true,
29
+ "auto_forward_data_parallel": true,
30
+ "damp_auto_increment": 0.01,
31
+ "damp_percent": 0.05,
32
+ "fallback": {
33
+ "smooth": null,
34
+ "strategy": "rtn",
35
+ "threshold": "0.5%"
36
+ },
37
+ "foem": null,
38
+ "gc_mode": "interval",
39
+ "gptaq": null,
40
+ "hessian": {
41
+ "chunk_bytes": null,
42
+ "chunk_size": null,
43
+ "staging_dtype": "float32"
44
+ },
45
+ "mock_quantization": false,
46
+ "mse": 0.0,
47
+ "offload_to_disk": true,
48
+ "offload_to_disk_path": "./gptqmodel_offload/orcmjeui-tnqhqrfy/",
49
+ "pack_impl": "cpu",
50
+ "quantizer": [
51
+ "gptqmodel:6.0.3"
52
+ ],
53
+ "static_groups": false,
54
+ "true_sequential": true,
55
+ "uri": "https://github.com/modelcloud/gptqmodel",
56
+ "vram_strategy": "exclusive",
57
+ "wait_for_submodule_finalizers": false
58
+ },
59
+ "method": "gptq",
60
+ "pack_dtype": "int32",
61
+ "quant_method": "gptq",
62
+ "sym": true
63
+ },
64
+ "rms_norm_eps": 1e-05,
65
+ "rope_parameters": {
66
+ "rope_theta": 1000000.0,
67
+ "rope_type": "default"
68
+ },
69
+ "sliding_window": null,
70
+ "tie_word_embeddings": false,
71
+ "transformers_version": "5.5.3",
72
+ "use_cache": true,
73
+ "vocab_size": 32768
74
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "do_sample": true,
5
+ "eos_token_id": 2,
6
+ "transformers_version": "5.5.3"
7
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfcf75467cadbe45ff417cf8051d93164dd3f6545955085ad623b95c81adc9b6
3
+ size 4168468336
quant_log.csv ADDED
@@ -0,0 +1,225 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ layer,module,loss,damp,time
2
+ 0,self_attn.k_proj,0.0000025754,0.05000,4.550
3
+ 0,self_attn.v_proj,0.0000002206,0.05000,4.562
4
+ 0,self_attn.q_proj,0.0000087561,0.05000,4.573
5
+ 0,self_attn.o_proj,0.0000000012,0.05000,1.502
6
+ 0,mlp.up_proj,0.0000081505,0.05000,2.709
7
+ 0,mlp.gate_proj,0.0000094237,0.05000,2.716
8
+ 0,mlp.down_proj,0.0000000070,0.05000,5.802
9
+ 1,self_attn.q_proj,0.0000285129,0.05000,5.844
10
+ 1,self_attn.v_proj,0.0000020318,0.05000,5.856
11
+ 1,self_attn.k_proj,0.0000127451,0.05000,5.870
12
+ 1,self_attn.o_proj,0.0000000052,0.05000,1.503
13
+ 1,mlp.gate_proj,0.0000322149,0.05000,2.735
14
+ 1,mlp.up_proj,0.0000282160,0.05000,2.741
15
+ 1,mlp.down_proj,0.0000052935,0.05000,5.818
16
+ 2,self_attn.v_proj,0.0000137185,0.05000,5.586
17
+ 2,self_attn.k_proj,0.0001054883,0.05000,5.603
18
+ 2,self_attn.q_proj,0.0002171249,0.05000,5.632
19
+ 2,self_attn.o_proj,0.0000000075,0.05000,1.523
20
+ 2,mlp.gate_proj,0.0000672672,0.05000,2.829
21
+ 2,mlp.up_proj,0.0000587216,0.05000,2.835
22
+ 2,mlp.down_proj,0.0000000224,0.05000,5.795
23
+ 3,self_attn.v_proj,0.0000093818,0.05000,5.672
24
+ 3,self_attn.q_proj,0.0001175257,0.05000,5.684
25
+ 3,self_attn.k_proj,0.0000570549,0.05000,5.696
26
+ 3,self_attn.o_proj,0.0000000112,0.05000,1.535
27
+ 3,mlp.gate_proj,0.0001121420,0.05000,2.703
28
+ 3,mlp.up_proj,0.0000968189,0.05000,2.706
29
+ 3,mlp.down_proj,0.0000000410,0.05000,5.772
30
+ 4,self_attn.q_proj,0.0001813112,0.05000,5.543
31
+ 4,self_attn.v_proj,0.0000157679,0.05000,5.555
32
+ 4,self_attn.k_proj,0.0000802006,0.05000,5.555
33
+ 4,self_attn.o_proj,0.0000000139,0.05000,1.527
34
+ 4,mlp.gate_proj,0.0001625613,0.05000,2.747
35
+ 4,mlp.up_proj,0.0001317042,0.05000,2.761
36
+ 4,mlp.down_proj,0.0000000744,0.05000,5.809
37
+ 5,self_attn.k_proj,0.0001039211,0.05000,5.706
38
+ 5,self_attn.q_proj,0.0002341090,0.05000,5.739
39
+ 5,self_attn.v_proj,0.0000174460,0.05000,5.786
40
+ 5,self_attn.o_proj,0.0000000322,0.05000,1.503
41
+ 5,mlp.gate_proj,0.0002247521,0.05000,2.734
42
+ 5,mlp.up_proj,0.0001709394,0.05000,2.734
43
+ 5,mlp.down_proj,0.0000001268,0.05000,5.818
44
+ 6,self_attn.k_proj,0.0001032290,0.05000,5.563
45
+ 6,self_attn.v_proj,0.0000177316,0.05000,5.576
46
+ 6,self_attn.q_proj,0.0002197504,0.05000,5.594
47
+ 6,self_attn.o_proj,0.0000000426,0.05000,1.519
48
+ 6,mlp.gate_proj,0.0002620231,0.05000,2.695
49
+ 6,mlp.up_proj,0.0002037956,0.05000,2.700
50
+ 6,mlp.down_proj,0.0000001768,0.05000,5.722
51
+ 7,self_attn.k_proj,0.0001301391,0.05000,5.649
52
+ 7,self_attn.q_proj,0.0002715318,0.05000,5.686
53
+ 7,self_attn.v_proj,0.0000233400,0.05000,5.700
54
+ 7,self_attn.o_proj,0.0000000710,0.05000,1.489
55
+ 7,mlp.gate_proj,0.0003091105,0.05000,2.726
56
+ 7,mlp.up_proj,0.0002347886,0.05000,2.734
57
+ 7,mlp.down_proj,0.0000002321,0.05000,5.731
58
+ 8,self_attn.k_proj,0.0001017436,0.05000,5.731
59
+ 8,self_attn.q_proj,0.0002240664,0.05000,5.757
60
+ 8,self_attn.v_proj,0.0000217979,0.05000,5.766
61
+ 8,self_attn.o_proj,0.0000000915,0.05000,1.519
62
+ 8,mlp.up_proj,0.0002580485,0.05000,2.713
63
+ 8,mlp.gate_proj,0.0003330376,0.05000,2.718
64
+ 8,mlp.down_proj,0.0000002755,0.05000,5.747
65
+ 9,self_attn.v_proj,0.0000258198,0.05000,5.596
66
+ 9,self_attn.q_proj,0.0003062698,0.05000,5.632
67
+ 9,self_attn.k_proj,0.0001433366,0.05000,5.638
68
+ 9,self_attn.o_proj,0.0000001034,0.05000,1.490
69
+ 9,mlp.up_proj,0.0002804786,0.05000,2.756
70
+ 9,mlp.gate_proj,0.0003499140,0.05000,2.766
71
+ 9,mlp.down_proj,0.0000003341,0.05000,5.813
72
+ 10,self_attn.k_proj,0.0001297817,0.05000,5.668
73
+ 10,self_attn.v_proj,0.0000226510,0.05000,5.703
74
+ 10,self_attn.q_proj,0.0002727139,0.05000,5.738
75
+ 10,self_attn.o_proj,0.0000001711,0.05000,1.504
76
+ 10,mlp.gate_proj,0.0003655863,0.05000,2.747
77
+ 10,mlp.up_proj,0.0003002079,0.05000,2.752
78
+ 10,mlp.down_proj,0.0000003908,0.05000,5.818
79
+ 11,self_attn.v_proj,0.0000333907,0.05000,5.675
80
+ 11,self_attn.k_proj,0.0001514282,0.05000,5.690
81
+ 11,self_attn.q_proj,0.0003284788,0.05000,5.704
82
+ 11,self_attn.o_proj,0.0000002205,0.05000,1.515
83
+ 11,mlp.gate_proj,0.0003984610,0.05000,2.731
84
+ 11,mlp.up_proj,0.0003320518,0.05000,2.740
85
+ 11,mlp.down_proj,0.0000004510,0.05000,5.806
86
+ 12,self_attn.k_proj,0.0001964771,0.05000,5.543
87
+ 12,self_attn.q_proj,0.0004358755,0.05000,5.666
88
+ 12,self_attn.v_proj,0.0000379014,0.05000,5.708
89
+ 12,self_attn.o_proj,0.0000002516,0.05000,1.495
90
+ 12,mlp.up_proj,0.0003744479,0.05000,2.767
91
+ 12,mlp.gate_proj,0.0004391452,0.05000,2.776
92
+ 12,mlp.down_proj,0.0000005534,0.05000,5.815
93
+ 13,self_attn.v_proj,0.0000360716,0.05000,5.625
94
+ 13,self_attn.q_proj,0.0003422806,0.05000,5.741
95
+ 13,self_attn.k_proj,0.0001674168,0.05000,5.749
96
+ 13,self_attn.o_proj,0.0000003109,0.05000,1.493
97
+ 13,mlp.gate_proj,0.0004911288,0.05000,2.685
98
+ 13,mlp.up_proj,0.0004301303,0.05000,2.689
99
+ 13,mlp.down_proj,0.0000006914,0.05000,5.771
100
+ 14,self_attn.k_proj,0.0001664226,0.05000,5.596
101
+ 14,self_attn.v_proj,0.0000576001,0.05000,5.624
102
+ 14,self_attn.q_proj,0.0003889395,0.05000,5.668
103
+ 14,self_attn.o_proj,0.0000004098,0.05000,1.493
104
+ 14,mlp.up_proj,0.0004783811,0.05000,2.743
105
+ 14,mlp.gate_proj,0.0005488174,0.05000,2.747
106
+ 14,mlp.down_proj,0.0000008860,0.05000,5.796
107
+ 15,self_attn.q_proj,0.0004867710,0.05000,5.634
108
+ 15,self_attn.k_proj,0.0002165216,0.05000,5.752
109
+ 15,self_attn.v_proj,0.0000653710,0.05000,5.760
110
+ 15,self_attn.o_proj,0.0000004345,0.05000,1.515
111
+ 15,mlp.gate_proj,0.0006246117,0.05000,2.696
112
+ 15,mlp.up_proj,0.0005259726,0.05000,2.704
113
+ 15,mlp.down_proj,0.0000011260,0.05000,5.745
114
+ 16,self_attn.k_proj,0.0001991889,0.05000,5.492
115
+ 16,self_attn.v_proj,0.0000615639,0.05000,5.508
116
+ 16,self_attn.q_proj,0.0004318745,0.05000,5.523
117
+ 16,self_attn.o_proj,0.0000005076,0.05000,1.503
118
+ 16,mlp.up_proj,0.0006129682,0.05000,2.751
119
+ 16,mlp.gate_proj,0.0007694462,0.05000,2.759
120
+ 16,mlp.down_proj,0.0000015809,0.05000,5.768
121
+ 17,self_attn.v_proj,0.0000590238,0.05000,5.789
122
+ 17,self_attn.k_proj,0.0001672252,0.05000,5.818
123
+ 17,self_attn.q_proj,0.0003993788,0.05000,5.828
124
+ 17,self_attn.o_proj,0.0000006334,0.05000,1.505
125
+ 17,mlp.up_proj,0.0007126845,0.05000,2.701
126
+ 17,mlp.gate_proj,0.0008941703,0.05000,2.715
127
+ 17,mlp.down_proj,0.0000021782,0.05000,5.786
128
+ 18,self_attn.v_proj,0.0000725807,0.05000,5.491
129
+ 18,self_attn.k_proj,0.0001988027,0.05000,5.544
130
+ 18,self_attn.q_proj,0.0005069916,0.05000,5.570
131
+ 18,self_attn.o_proj,0.0000005907,0.05000,1.536
132
+ 18,mlp.gate_proj,0.0010087889,0.05000,2.764
133
+ 18,mlp.up_proj,0.0008049888,0.05000,2.769
134
+ 18,mlp.down_proj,0.0000031469,0.05000,5.804
135
+ 19,self_attn.q_proj,0.0004640531,0.05000,5.718
136
+ 19,self_attn.k_proj,0.0001974665,0.05000,5.751
137
+ 19,self_attn.v_proj,0.0000839271,0.05000,5.758
138
+ 19,self_attn.o_proj,0.0000007363,0.05000,1.516
139
+ 19,mlp.up_proj,0.0008893232,0.05000,2.702
140
+ 19,mlp.gate_proj,0.0011344106,0.05000,2.704
141
+ 19,mlp.down_proj,0.0000041928,0.05000,5.776
142
+ 20,self_attn.v_proj,0.0000917941,0.05000,5.457
143
+ 20,self_attn.k_proj,0.0002024085,0.05000,5.464
144
+ 20,self_attn.q_proj,0.0004972993,0.05000,5.482
145
+ 20,self_attn.o_proj,0.0000006737,0.05000,1.525
146
+ 20,mlp.gate_proj,0.0012861970,0.05000,2.697
147
+ 20,mlp.up_proj,0.0009820292,0.05000,2.696
148
+ 20,mlp.down_proj,0.0000043654,0.05000,5.801
149
+ 21,self_attn.k_proj,0.0001981790,0.05000,5.710
150
+ 21,self_attn.v_proj,0.0000964703,0.05000,5.747
151
+ 21,self_attn.q_proj,0.0004897626,0.05000,5.770
152
+ 21,self_attn.o_proj,0.0000006938,0.05000,1.536
153
+ 21,mlp.gate_proj,0.0015099732,0.05000,2.692
154
+ 21,mlp.up_proj,0.0010752812,0.05000,2.708
155
+ 21,mlp.down_proj,0.0000044608,0.05000,5.819
156
+ 22,self_attn.v_proj,0.0000996507,0.05000,5.592
157
+ 22,self_attn.q_proj,0.0004715399,0.05000,5.642
158
+ 22,self_attn.k_proj,0.0001876980,0.05000,5.657
159
+ 22,self_attn.o_proj,0.0000004057,0.05000,1.512
160
+ 22,mlp.gate_proj,0.0016046927,0.05000,2.720
161
+ 22,mlp.up_proj,0.0011544167,0.05000,2.726
162
+ 22,mlp.down_proj,0.0000046066,0.05000,5.792
163
+ 23,self_attn.q_proj,0.0004739835,0.05000,5.550
164
+ 23,self_attn.k_proj,0.0001863427,0.05000,5.639
165
+ 23,self_attn.v_proj,0.0001045092,0.05000,5.656
166
+ 23,self_attn.o_proj,0.0000006813,0.05000,1.508
167
+ 23,mlp.up_proj,0.0012700862,0.05000,2.755
168
+ 23,mlp.gate_proj,0.0017711886,0.05000,2.766
169
+ 23,mlp.down_proj,0.0000051867,0.05000,5.805
170
+ 24,self_attn.q_proj,0.0005410001,0.05000,5.842
171
+ 24,self_attn.v_proj,0.0001214173,0.05000,5.883
172
+ 24,self_attn.k_proj,0.0002158198,0.05000,5.946
173
+ 24,self_attn.o_proj,0.0000006280,0.05000,1.501
174
+ 24,mlp.gate_proj,0.0019970989,0.05000,2.721
175
+ 24,mlp.up_proj,0.0014057605,0.05000,2.721
176
+ 24,mlp.down_proj,0.0000056286,0.05000,5.838
177
+ 25,self_attn.k_proj,0.0002077088,0.05000,5.659
178
+ 25,self_attn.v_proj,0.0001386532,0.05000,5.680
179
+ 25,self_attn.q_proj,0.0005421010,0.05000,5.690
180
+ 25,self_attn.o_proj,0.0000006926,0.05000,1.508
181
+ 25,mlp.gate_proj,0.0021648855,0.05000,2.806
182
+ 25,mlp.up_proj,0.0015368462,0.05000,2.807
183
+ 25,mlp.down_proj,0.0000063590,0.05000,5.777
184
+ 26,self_attn.q_proj,0.0005148287,0.05000,5.733
185
+ 26,self_attn.v_proj,0.0001467281,0.05000,5.761
186
+ 26,self_attn.k_proj,0.0001950796,0.05000,5.790
187
+ 26,self_attn.o_proj,0.0000009540,0.05000,1.512
188
+ 26,mlp.up_proj,0.0016700355,0.05000,2.757
189
+ 26,mlp.gate_proj,0.0022701313,0.05000,2.764
190
+ 26,mlp.down_proj,0.0000073036,0.05000,5.829
191
+ 27,self_attn.q_proj,0.0005313924,0.05000,5.597
192
+ 27,self_attn.k_proj,0.0001970788,0.05000,5.617
193
+ 27,self_attn.v_proj,0.0001329189,0.05000,5.631
194
+ 27,self_attn.o_proj,0.0000010856,0.05000,1.539
195
+ 27,mlp.gate_proj,0.0024865442,0.05000,2.738
196
+ 27,mlp.up_proj,0.0018403968,0.05000,2.737
197
+ 27,mlp.down_proj,0.0000087551,0.05000,5.844
198
+ 28,self_attn.k_proj,0.0001981637,0.05000,5.458
199
+ 28,self_attn.v_proj,0.0001949648,0.05000,5.500
200
+ 28,self_attn.q_proj,0.0005183223,0.05000,5.508
201
+ 28,self_attn.o_proj,0.0000016372,0.05000,1.530
202
+ 28,mlp.gate_proj,0.0026638827,0.05000,2.748
203
+ 28,mlp.up_proj,0.0020455004,0.05000,2.762
204
+ 28,mlp.down_proj,0.0000119281,0.05000,5.836
205
+ 29,self_attn.q_proj,0.0005931044,0.05000,5.728
206
+ 29,self_attn.k_proj,0.0001997706,0.05000,5.741
207
+ 29,self_attn.v_proj,0.0002828346,0.05000,5.767
208
+ 29,self_attn.o_proj,0.0000034553,0.05000,1.534
209
+ 29,mlp.up_proj,0.0020760434,0.05000,2.725
210
+ 29,mlp.gate_proj,0.0025936320,0.05000,2.729
211
+ 29,mlp.down_proj,0.0000151650,0.05000,5.807
212
+ 30,self_attn.v_proj,0.0003089608,0.05000,5.433
213
+ 30,self_attn.k_proj,0.0001842356,0.05000,5.482
214
+ 30,self_attn.q_proj,0.0005517652,0.05000,5.508
215
+ 30,self_attn.o_proj,0.0000030842,0.05000,1.513
216
+ 30,mlp.up_proj,0.0021368292,0.05000,2.743
217
+ 30,mlp.gate_proj,0.0026252946,0.05000,2.751
218
+ 30,mlp.down_proj,0.0000199158,0.05000,5.768
219
+ 31,self_attn.k_proj,0.0001757457,0.05000,5.804
220
+ 31,self_attn.v_proj,0.0003163291,0.05000,5.898
221
+ 31,self_attn.q_proj,0.0005140052,0.05000,5.915
222
+ 31,self_attn.o_proj,0.0000041636,0.05000,1.517
223
+ 31,mlp.gate_proj,0.0022865063,0.05000,2.720
224
+ 31,mlp.up_proj,0.0018066571,0.05000,2.729
225
+ 31,mlp.down_proj,0.0000333210,0.05000,5.901
quantize_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bits": 4,
3
+ "group_size": 128,
4
+ "desc_act": false,
5
+ "lm_head": false,
6
+ "method": "gptq",
7
+ "quant_method": "gptq",
8
+ "format": "gptq",
9
+ "checkpoint_format": "gptq",
10
+ "pack_dtype": "int32",
11
+ "meta": {
12
+ "quantizer": [
13
+ "gptqmodel:6.0.3"
14
+ ],
15
+ "uri": "https://github.com/modelcloud/gptqmodel",
16
+ "damp_percent": 0.05,
17
+ "damp_auto_increment": 0.01,
18
+ "static_groups": false,
19
+ "true_sequential": true,
20
+ "mse": 0.0,
21
+ "gptaq": null,
22
+ "foem": null,
23
+ "act_group_aware": true,
24
+ "fallback": {
25
+ "strategy": "rtn",
26
+ "threshold": "0.5%",
27
+ "smooth": null
28
+ },
29
+ "offload_to_disk": true,
30
+ "offload_to_disk_path": "./gptqmodel_offload/orcmjeui-tnqhqrfy/",
31
+ "pack_impl": "cpu",
32
+ "gc_mode": "interval",
33
+ "wait_for_submodule_finalizers": false,
34
+ "auto_forward_data_parallel": true,
35
+ "vram_strategy": "exclusive",
36
+ "mock_quantization": false,
37
+ "hessian": {
38
+ "chunk_size": null,
39
+ "chunk_bytes": null,
40
+ "staging_dtype": "float32"
41
+ }
42
+ },
43
+ "sym": true
44
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "backend": "tokenizers",
4
+ "bos_token": "<s>",
5
+ "clean_up_tokenization_spaces": false,
6
+ "eos_token": "</s>",
7
+ "is_local": false,
8
+ "legacy": false,
9
+ "model_max_length": 1000000000000000019884624838656,
10
+ "pad_token": null,
11
+ "sp_model_kwargs": {},
12
+ "spaces_between_special_tokens": false,
13
+ "tokenizer_class": "TokenizersBackend",
14
+ "unk_token": "<unk>",
15
+ "use_default_system_prompt": false
16
+ }