| ,layer_id,layer_type,param_type,shape,nparam,nnz,sparsity | |
| 5,bert.encoder.layer.0.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 7,bert.encoder.layer.0.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 9,bert.encoder.layer.0.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 11,bert.encoder.layer.0.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 15,bert.encoder.layer.0.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 17,bert.encoder.layer.0.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 21,bert.encoder.layer.1.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 23,bert.encoder.layer.1.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 25,bert.encoder.layer.1.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 27,bert.encoder.layer.1.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 31,bert.encoder.layer.1.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 33,bert.encoder.layer.1.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 37,bert.encoder.layer.2.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 39,bert.encoder.layer.2.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 41,bert.encoder.layer.2.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 43,bert.encoder.layer.2.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 47,bert.encoder.layer.2.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 49,bert.encoder.layer.2.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 53,bert.encoder.layer.3.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 55,bert.encoder.layer.3.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 57,bert.encoder.layer.3.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 59,bert.encoder.layer.3.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 63,bert.encoder.layer.3.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 65,bert.encoder.layer.3.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 69,bert.encoder.layer.4.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 71,bert.encoder.layer.4.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 73,bert.encoder.layer.4.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 75,bert.encoder.layer.4.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 79,bert.encoder.layer.4.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 81,bert.encoder.layer.4.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 85,bert.encoder.layer.5.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 87,bert.encoder.layer.5.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 89,bert.encoder.layer.5.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 91,bert.encoder.layer.5.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 95,bert.encoder.layer.5.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 97,bert.encoder.layer.5.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 101,bert.encoder.layer.6.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 103,bert.encoder.layer.6.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 105,bert.encoder.layer.6.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 107,bert.encoder.layer.6.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 111,bert.encoder.layer.6.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 113,bert.encoder.layer.6.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 117,bert.encoder.layer.7.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 119,bert.encoder.layer.7.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 121,bert.encoder.layer.7.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 123,bert.encoder.layer.7.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 127,bert.encoder.layer.7.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 129,bert.encoder.layer.7.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 133,bert.encoder.layer.8.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 135,bert.encoder.layer.8.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 137,bert.encoder.layer.8.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 139,bert.encoder.layer.8.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 143,bert.encoder.layer.8.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 145,bert.encoder.layer.8.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 149,bert.encoder.layer.9.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 151,bert.encoder.layer.9.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 153,bert.encoder.layer.9.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 155,bert.encoder.layer.9.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 159,bert.encoder.layer.9.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 161,bert.encoder.layer.9.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 165,bert.encoder.layer.10.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 167,bert.encoder.layer.10.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 169,bert.encoder.layer.10.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 171,bert.encoder.layer.10.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 175,bert.encoder.layer.10.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 177,bert.encoder.layer.10.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |
| 181,bert.encoder.layer.11.attention.self.query,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 183,bert.encoder.layer.11.attention.self.key,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 185,bert.encoder.layer.11.attention.self.value,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 187,bert.encoder.layer.11.attention.output.dense,Linear,weight,"[768, 768]",589824,589824,0.0 | |
| 191,bert.encoder.layer.11.intermediate.dense,Linear,weight,"[3072, 768]",2359296,2359296,0.0 | |
| 193,bert.encoder.layer.11.output.dense,Linear,weight,"[768, 3072]",2359296,2359296,0.0 | |