iproskurina committed on
Commit
00c523e
·
verified ·
1 Parent(s): f6c4096

Add files using upload-large-folder tool

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. quant_log.csv +144 -144
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93c83a68e9ec3f86037b49ff8625ced97a17aab9ed0704439e17b4c79aad738a
3
  size 845033800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01f9ceaebdb06d5deee40a8d4db27fe595dff5875a126846cde3a7317ffeb05e
3
  size 845033800
quant_log.csv CHANGED
@@ -1,145 +1,145 @@
1
  layer,module,loss,samples,damp,time
2
- 0,self_attn.k_proj,0.00399020,0.01000,1.264
3
- 0,self_attn.v_proj,0.00070882,0.01000,0.970
4
- 0,self_attn.q_proj,0.00407133,0.01000,0.970
5
- 0,self_attn.out_proj,0.00002185,0.01000,1.010
6
- 0,fc1,0.00872974,0.01000,0.978
7
- 0,fc2,0.00022706,0.01000,4.293
8
- 1,self_attn.k_proj,0.00293531,0.01000,0.986
9
- 1,self_attn.v_proj,0.00037064,0.01000,0.984
10
- 1,self_attn.q_proj,0.00318605,0.01000,0.986
11
- 1,self_attn.out_proj,0.00000342,0.01000,0.990
12
- 1,fc1,0.00963631,0.01000,0.987
13
- 1,fc2,0.00019677,0.01000,4.262
14
- 2,self_attn.k_proj,0.00401148,0.01000,0.973
15
- 2,self_attn.v_proj,0.00062648,0.01000,0.969
16
- 2,self_attn.q_proj,0.00399745,0.01000,0.966
17
- 2,self_attn.out_proj,0.00000257,0.01000,0.969
18
- 2,fc1,0.01047378,0.01000,0.996
19
- 2,fc2,0.00007746,0.01000,4.171
20
- 3,self_attn.k_proj,0.00450096,0.01000,0.971
21
- 3,self_attn.v_proj,0.00088504,0.01000,0.962
22
- 3,self_attn.q_proj,0.00498925,0.01000,0.974
23
- 3,self_attn.out_proj,0.00000471,0.01000,0.986
24
- 3,fc1,0.01086146,0.01000,0.975
25
- 3,fc2,0.00008414,0.01000,4.121
26
- 4,self_attn.k_proj,0.00736717,0.01000,0.978
27
- 4,self_attn.v_proj,0.00119574,0.01000,0.970
28
- 4,self_attn.q_proj,0.00785260,0.01000,0.979
29
- 4,self_attn.out_proj,0.00001008,0.01000,0.984
30
- 4,fc1,0.01312051,0.01000,0.979
31
- 4,fc2,0.00009959,0.01000,4.149
32
- 5,self_attn.k_proj,0.00950116,0.01000,0.964
33
- 5,self_attn.v_proj,0.00169445,0.01000,0.969
34
- 5,self_attn.q_proj,0.00980629,0.01000,0.968
35
- 5,self_attn.out_proj,0.00001083,0.01000,0.973
36
- 5,fc1,0.01551265,0.01000,0.977
37
- 5,fc2,0.00011699,0.01000,4.148
38
- 6,self_attn.k_proj,0.01533377,0.01000,0.969
39
- 6,self_attn.v_proj,0.00226665,0.01000,0.952
40
- 6,self_attn.q_proj,0.01375490,0.01000,0.973
41
- 6,self_attn.out_proj,0.00002926,0.01000,0.970
42
- 6,fc1,0.02030997,0.01000,0.971
43
- 6,fc2,0.00015709,0.01000,4.118
44
- 7,self_attn.k_proj,0.01740401,0.01000,0.969
45
- 7,self_attn.v_proj,0.00279684,0.01000,0.967
46
- 7,self_attn.q_proj,0.01548278,0.01000,0.972
47
- 7,self_attn.out_proj,0.00003702,0.01000,0.969
48
- 7,fc1,0.02616167,0.01000,0.976
49
- 7,fc2,0.00022070,0.01000,4.118
50
- 8,self_attn.k_proj,0.02040624,0.01000,0.976
51
- 8,self_attn.v_proj,0.00337292,0.01000,0.974
52
- 8,self_attn.q_proj,0.01664504,0.01000,0.977
53
- 8,self_attn.out_proj,0.00005092,0.01000,0.983
54
- 8,fc1,0.03254646,0.01000,0.992
55
- 8,fc2,0.00029163,0.01000,4.102
56
- 9,self_attn.k_proj,0.02243577,0.01000,0.969
57
- 9,self_attn.v_proj,0.00395448,0.01000,0.981
58
- 9,self_attn.q_proj,0.01871208,0.01000,0.999
59
- 9,self_attn.out_proj,0.00007879,0.01000,0.983
60
- 9,fc1,0.03796821,0.01000,0.984
61
- 9,fc2,0.00038551,0.01000,4.163
62
- 10,self_attn.k_proj,0.02308127,0.01000,0.976
63
- 10,self_attn.v_proj,0.00508604,0.01000,0.973
64
- 10,self_attn.q_proj,0.01914719,0.01000,0.974
65
- 10,self_attn.out_proj,0.00010216,0.01000,0.984
66
- 10,fc1,0.04341091,0.01000,0.980
67
- 10,fc2,0.00060412,0.01000,4.128
68
- 11,self_attn.k_proj,0.02389702,0.01000,0.975
69
- 11,self_attn.v_proj,0.00636119,0.01000,0.984
70
- 11,self_attn.q_proj,0.01992871,0.01000,0.987
71
- 11,self_attn.out_proj,0.00014076,0.01000,0.999
72
- 11,fc1,0.04898007,0.01000,0.988
73
- 11,fc2,0.00081568,0.01000,4.164
74
- 12,self_attn.k_proj,0.02727781,0.01000,0.977
75
- 12,self_attn.v_proj,0.00716118,0.01000,0.980
76
- 12,self_attn.q_proj,0.02138953,0.01000,0.973
77
- 12,self_attn.out_proj,0.00022961,0.01000,0.974
78
- 12,fc1,0.05186468,0.01000,0.975
79
- 12,fc2,0.00110451,0.01000,4.126
80
- 13,self_attn.k_proj,0.02947615,0.01000,0.980
81
- 13,self_attn.v_proj,0.00801060,0.01000,0.976
82
- 13,self_attn.q_proj,0.02191754,0.01000,0.986
83
- 13,self_attn.out_proj,0.00024779,0.01000,0.972
84
- 13,fc1,0.05749568,0.01000,0.983
85
- 13,fc2,0.00148446,0.01000,4.256
86
- 14,self_attn.k_proj,0.02809097,0.01000,0.968
87
- 14,self_attn.v_proj,0.01016108,0.01000,0.961
88
- 14,self_attn.q_proj,0.02138641,0.01000,0.967
89
- 14,self_attn.out_proj,0.00027950,0.01000,0.964
90
- 14,fc1,0.06364647,0.01000,0.968
91
- 14,fc2,0.00202063,0.01000,4.102
92
- 15,self_attn.k_proj,0.02527042,0.01000,0.964
93
- 15,self_attn.v_proj,0.01288679,0.01000,0.966
94
- 15,self_attn.q_proj,0.02164990,0.01000,0.966
95
- 15,self_attn.out_proj,0.00026314,0.01000,0.974
96
- 15,fc1,0.06786803,0.01000,0.966
97
- 15,fc2,0.00252577,0.01000,4.123
98
- 16,self_attn.k_proj,0.02550102,0.01000,0.969
99
- 16,self_attn.v_proj,0.01406841,0.01000,0.958
100
- 16,self_attn.q_proj,0.01926361,0.01000,0.963
101
- 16,self_attn.out_proj,0.00039853,0.01000,0.971
102
- 16,fc1,0.07458527,0.01000,0.979
103
- 16,fc2,0.00321327,0.01000,4.129
104
- 17,self_attn.k_proj,0.02485269,0.01000,0.961
105
- 17,self_attn.v_proj,0.01542338,0.01000,0.960
106
- 17,self_attn.q_proj,0.01941807,0.01000,0.971
107
- 17,self_attn.out_proj,0.00048917,0.01000,0.970
108
- 17,fc1,0.08214158,0.01000,0.973
109
- 17,fc2,0.00403266,0.01000,4.117
110
- 18,self_attn.k_proj,0.02275580,0.01000,0.963
111
- 18,self_attn.v_proj,0.01784235,0.01000,0.961
112
- 18,self_attn.q_proj,0.01897552,0.01000,0.965
113
- 18,self_attn.out_proj,0.00052644,0.01000,0.966
114
- 18,fc1,0.08688586,0.01000,0.975
115
- 18,fc2,0.00493614,0.01000,4.105
116
- 19,self_attn.k_proj,0.02327104,0.01000,0.963
117
- 19,self_attn.v_proj,0.02300425,0.01000,0.972
118
- 19,self_attn.q_proj,0.01916058,0.01000,0.956
119
- 19,self_attn.out_proj,0.00077869,0.01000,0.977
120
- 19,fc1,0.09395289,0.01000,0.977
121
- 19,fc2,0.00609364,0.01000,4.118
122
- 20,self_attn.k_proj,0.02386747,0.01000,0.962
123
- 20,self_attn.v_proj,0.02619410,0.01000,0.974
124
- 20,self_attn.q_proj,0.01858719,0.01000,0.968
125
- 20,self_attn.out_proj,0.00093543,0.01000,0.968
126
- 20,fc1,0.09828432,0.01000,0.985
127
- 20,fc2,0.00770969,0.01000,4.126
128
- 21,self_attn.k_proj,0.02234699,0.01000,0.973
129
- 21,self_attn.v_proj,0.02693190,0.01000,0.977
130
- 21,self_attn.q_proj,0.02045901,0.01000,0.972
131
- 21,self_attn.out_proj,0.00080754,0.01000,0.981
132
- 21,fc1,0.09965696,0.01000,1.016
133
- 21,fc2,0.00898138,0.01000,4.172
134
- 22,self_attn.k_proj,0.02288331,0.01000,0.978
135
- 22,self_attn.v_proj,0.02985917,0.01000,0.957
136
- 22,self_attn.q_proj,0.02454582,0.01000,0.980
137
- 22,self_attn.out_proj,0.00085336,0.01000,0.969
138
- 22,fc1,0.09818267,0.01000,0.974
139
- 22,fc2,0.00932770,0.01000,4.090
140
- 23,self_attn.k_proj,0.02912697,0.01000,0.972
141
- 23,self_attn.v_proj,0.02026520,0.01000,0.968
142
- 23,self_attn.q_proj,0.05245103,0.01000,0.969
143
- 23,self_attn.out_proj,0.00163580,0.01000,0.974
144
- 23,fc1,0.09108696,0.01000,0.980
145
- 23,fc2,0.00708841,0.01000,4.131
 
1
  layer,module,loss,samples,damp,time
2
+ 0,self_attn.k_proj,0.00399020,0.01000,1.769
3
+ 0,self_attn.v_proj,0.00070882,0.01000,0.943
4
+ 0,self_attn.q_proj,0.00407133,0.01000,0.973
5
+ 0,self_attn.out_proj,0.00002881,0.01000,0.954
6
+ 0,fc1,0.00841130,0.01000,0.949
7
+ 0,fc2,0.00023788,0.01000,4.238
8
+ 1,self_attn.k_proj,0.00265268,0.01000,0.977
9
+ 1,self_attn.v_proj,0.00033390,0.01000,0.980
10
+ 1,self_attn.q_proj,0.00286817,0.01000,0.962
11
+ 1,self_attn.out_proj,0.00000700,0.01000,0.976
12
+ 1,fc1,0.00870118,0.01000,0.987
13
+ 1,fc2,0.00015716,0.01000,4.314
14
+ 2,self_attn.k_proj,0.00358274,0.01000,0.969
15
+ 2,self_attn.v_proj,0.00055633,0.01000,0.966
16
+ 2,self_attn.q_proj,0.00357723,0.01000,0.967
17
+ 2,self_attn.out_proj,0.00000220,0.01000,0.976
18
+ 2,fc1,0.00947768,0.01000,0.976
19
+ 2,fc2,0.00006839,0.01000,4.106
20
+ 3,self_attn.k_proj,0.00388418,0.01000,0.970
21
+ 3,self_attn.v_proj,0.00075879,0.01000,0.992
22
+ 3,self_attn.q_proj,0.00437635,0.01000,0.970
23
+ 3,self_attn.out_proj,0.00000383,0.01000,1.023
24
+ 3,fc1,0.00933810,0.01000,0.972
25
+ 3,fc2,0.00007643,0.01000,4.081
26
+ 4,self_attn.k_proj,0.00632844,0.01000,0.963
27
+ 4,self_attn.v_proj,0.00101882,0.01000,0.968
28
+ 4,self_attn.q_proj,0.00671913,0.01000,0.978
29
+ 4,self_attn.out_proj,0.00000953,0.01000,0.974
30
+ 4,fc1,0.01132140,0.01000,1.014
31
+ 4,fc2,0.00009407,0.01000,4.120
32
+ 5,self_attn.k_proj,0.00836137,0.01000,0.970
33
+ 5,self_attn.v_proj,0.00141843,0.01000,0.966
34
+ 5,self_attn.q_proj,0.00862948,0.01000,0.977
35
+ 5,self_attn.out_proj,0.00001295,0.01000,0.976
36
+ 5,fc1,0.01352680,0.01000,1.009
37
+ 5,fc2,0.00010500,0.01000,4.146
38
+ 6,self_attn.k_proj,0.01344048,0.01000,0.964
39
+ 6,self_attn.v_proj,0.00186100,0.01000,0.983
40
+ 6,self_attn.q_proj,0.01191495,0.01000,0.974
41
+ 6,self_attn.out_proj,0.00002467,0.01000,0.959
42
+ 6,fc1,0.01742047,0.01000,0.953
43
+ 6,fc2,0.00013119,0.01000,4.097
44
+ 7,self_attn.k_proj,0.01503923,0.01000,0.980
45
+ 7,self_attn.v_proj,0.00229473,0.01000,0.966
46
+ 7,self_attn.q_proj,0.01326014,0.01000,0.976
47
+ 7,self_attn.out_proj,0.00003410,0.01000,0.946
48
+ 7,fc1,0.02252554,0.01000,0.981
49
+ 7,fc2,0.00018367,0.01000,4.157
50
+ 8,self_attn.k_proj,0.01784026,0.01000,0.954
51
+ 8,self_attn.v_proj,0.00280950,0.01000,0.951
52
+ 8,self_attn.q_proj,0.01452082,0.01000,0.971
53
+ 8,self_attn.out_proj,0.00004744,0.01000,1.036
54
+ 8,fc1,0.02815095,0.01000,0.972
55
+ 8,fc2,0.00025076,0.01000,4.100
56
+ 9,self_attn.k_proj,0.01993856,0.01000,0.971
57
+ 9,self_attn.v_proj,0.00336911,0.01000,0.985
58
+ 9,self_attn.q_proj,0.01663456,0.01000,0.974
59
+ 9,self_attn.out_proj,0.00007329,0.01000,0.988
60
+ 9,fc1,0.03346713,0.01000,0.991
61
+ 9,fc2,0.00033390,0.01000,4.126
62
+ 10,self_attn.k_proj,0.02098462,0.01000,0.952
63
+ 10,self_attn.v_proj,0.00442903,0.01000,0.972
64
+ 10,self_attn.q_proj,0.01737896,0.01000,0.970
65
+ 10,self_attn.out_proj,0.00009355,0.01000,0.956
66
+ 10,fc1,0.03937871,0.01000,0.969
67
+ 10,fc2,0.00054157,0.01000,4.074
68
+ 11,self_attn.k_proj,0.02233104,0.01000,0.990
69
+ 11,self_attn.v_proj,0.00575745,0.01000,0.969
70
+ 11,self_attn.q_proj,0.01841100,0.01000,0.988
71
+ 11,self_attn.out_proj,0.00012954,0.01000,0.975
72
+ 11,fc1,0.04563497,0.01000,0.976
73
+ 11,fc2,0.00075835,0.01000,4.148
74
+ 12,self_attn.k_proj,0.02574713,0.01000,0.971
75
+ 12,self_attn.v_proj,0.00661912,0.01000,0.965
76
+ 12,self_attn.q_proj,0.02014845,0.01000,0.957
77
+ 12,self_attn.out_proj,0.00022067,0.01000,0.963
78
+ 12,fc1,0.04933250,0.01000,0.991
79
+ 12,fc2,0.00101735,0.01000,4.085
80
+ 13,self_attn.k_proj,0.02849308,0.01000,0.977
81
+ 13,self_attn.v_proj,0.00755646,0.01000,0.960
82
+ 13,self_attn.q_proj,0.02111352,0.01000,0.955
83
+ 13,self_attn.out_proj,0.00024542,0.01000,0.983
84
+ 13,fc1,0.05511705,0.01000,0.962
85
+ 13,fc2,0.00135350,0.01000,4.206
86
+ 14,self_attn.k_proj,0.02709149,0.01000,0.963
87
+ 14,self_attn.v_proj,0.00964833,0.01000,0.956
88
+ 14,self_attn.q_proj,0.02070987,0.01000,0.972
89
+ 14,self_attn.out_proj,0.00027742,0.01000,0.963
90
+ 14,fc1,0.06202892,0.01000,0.974
91
+ 14,fc2,0.00191707,0.01000,4.080
92
+ 15,self_attn.k_proj,0.02484710,0.01000,0.951
93
+ 15,self_attn.v_proj,0.01247784,0.01000,0.952
94
+ 15,self_attn.q_proj,0.02116217,0.01000,0.983
95
+ 15,self_attn.out_proj,0.00025006,0.01000,0.970
96
+ 15,fc1,0.06626023,0.01000,1.001
97
+ 15,fc2,0.00237964,0.01000,4.261
98
+ 16,self_attn.k_proj,0.02497149,0.01000,0.968
99
+ 16,self_attn.v_proj,0.01356158,0.01000,0.954
100
+ 16,self_attn.q_proj,0.01884268,0.01000,0.968
101
+ 16,self_attn.out_proj,0.00038158,0.01000,0.967
102
+ 16,fc1,0.07270662,0.01000,0.957
103
+ 16,fc2,0.00306718,0.01000,4.124
104
+ 17,self_attn.k_proj,0.02425222,0.01000,0.985
105
+ 17,self_attn.v_proj,0.01491047,0.01000,0.990
106
+ 17,self_attn.q_proj,0.01910833,0.01000,0.981
107
+ 17,self_attn.out_proj,0.00044458,0.01000,0.949
108
+ 17,fc1,0.08014514,0.01000,0.976
109
+ 17,fc2,0.00390363,0.01000,4.102
110
+ 18,self_attn.k_proj,0.02210768,0.01000,0.986
111
+ 18,self_attn.v_proj,0.01711883,0.01000,1.004
112
+ 18,self_attn.q_proj,0.01853545,0.01000,0.982
113
+ 18,self_attn.out_proj,0.00051715,0.01000,0.989
114
+ 18,fc1,0.08440722,0.01000,0.989
115
+ 18,fc2,0.00473098,0.01000,4.083
116
+ 19,self_attn.k_proj,0.02249363,0.01000,0.967
117
+ 19,self_attn.v_proj,0.02193001,0.01000,0.960
118
+ 19,self_attn.q_proj,0.01848070,0.01000,0.968
119
+ 19,self_attn.out_proj,0.00083592,0.01000,1.005
120
+ 19,fc1,0.09134186,0.01000,1.013
121
+ 19,fc2,0.00585078,0.01000,4.103
122
+ 20,self_attn.k_proj,0.02311379,0.01000,0.952
123
+ 20,self_attn.v_proj,0.02502821,0.01000,0.955
124
+ 20,self_attn.q_proj,0.01801062,0.01000,0.961
125
+ 20,self_attn.out_proj,0.00098910,0.01000,0.968
126
+ 20,fc1,0.09524175,0.01000,0.993
127
+ 20,fc2,0.00739040,0.01000,4.123
128
+ 21,self_attn.k_proj,0.02165480,0.01000,0.994
129
+ 21,self_attn.v_proj,0.02562368,0.01000,0.961
130
+ 21,self_attn.q_proj,0.01968897,0.01000,0.964
131
+ 21,self_attn.out_proj,0.00083486,0.01000,0.955
132
+ 21,fc1,0.09495520,0.01000,0.957
133
+ 21,fc2,0.00845354,0.01000,4.166
134
+ 22,self_attn.k_proj,0.02163469,0.01000,0.990
135
+ 22,self_attn.v_proj,0.02802912,0.01000,1.023
136
+ 22,self_attn.q_proj,0.02326590,0.01000,0.975
137
+ 22,self_attn.out_proj,0.00088141,0.01000,0.967
138
+ 22,fc1,0.09237307,0.01000,0.976
139
+ 22,fc2,0.00874107,0.01000,4.192
140
+ 23,self_attn.k_proj,0.02720753,0.01000,0.974
141
+ 23,self_attn.v_proj,0.01896040,0.01000,0.957
142
+ 23,self_attn.q_proj,0.04915815,0.01000,0.973
143
+ 23,self_attn.out_proj,0.00157263,0.01000,0.961
144
+ 23,fc1,0.08544412,0.01000,0.981
145
+ 23,fc2,0.00670062,0.01000,4.107