orca-zhang's picture
Add multilingual-e5-small-int8 bundle
c85a312 verified
7767517
333 394
Input in0 0 1 in0
Input in1 0 1 in1
Split splitncnn_0 1 2 in1 2 3
Embed embed_97 1 1 in0 4 0=384 1=250037 3=96014208 18=2
MemoryData pnnx_fold_102 0 1 5 0=384 1=255
MemoryData pnnx_fold_104 0 1 6 0=384 1=255
BinaryOp add_0 2 1 4 5 7
BinaryOp add_1 2 1 7 6 8
LayerNorm ln_98 1 1 8 9 0=384 1=1.000000e-12
Split splitncnn_1 1 4 9 10 11 12 13
Reshape reshape_135 1 1 2 14 0=255 1=1 2=1
BinaryOp sub_2 1 1 14 15 0=7 1=1 2=1.000000e+00
BinaryOp mul_3 1 1 15 16 0=2 1=1 2=-1.000000e+04
Split splitncnn_2 1 12 16 17 18 19 20 21 22 23 24 25 26 27 28
Gemm gemm_0 1 1 13 29 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_136 1 1 29 30 0=32 1=12 2=255
Permute transpose_211 1 1 30 31 0=2
Gemm gemm_1 1 1 12 32 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_137 1 1 32 33 0=32 1=12 2=255
Gemm gemm_2 1 1 11 34 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_138 1 1 34 35 0=32 1=12 2=255
Permute transpose_212 1 1 35 36 0=2
Permute permute_123 1 1 33 37 0=3
MatMul matmul_185 2 1 31 37 38
BinaryOp mul_4 1 1 38 39 0=2 1=1 2=1.767770e-01
BinaryOp add_5 2 1 39 17 40
Softmax softmax_85 1 1 40 41 0=2 1=1
MatMul matmul_186 2 1 41 36 42
Permute transpose_213 1 1 42 43 0=2
Reshape reshape_139 1 1 43 44 0=384 1=255
Gemm gemm_3 1 1 44 45 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_6 2 1 45 10 46
LayerNorm ln_99 1 1 46 47 0=384 1=1.000000e-12
Split splitncnn_3 1 2 47 48 49
Gemm gemm_4 1 1 49 50 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_72 1 1 50 51
Gemm gemm_5 1 1 51 52 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_7 2 1 52 48 53
LayerNorm ln_100 1 1 53 54 0=384 1=1.000000e-12
Split splitncnn_4 1 4 54 55 56 57 58
Gemm gemm_6 1 1 58 59 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_140 1 1 59 60 0=32 1=12 2=255
Permute transpose_214 1 1 60 61 0=2
Gemm gemm_7 1 1 57 62 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_141 1 1 62 63 0=32 1=12 2=255
Gemm gemm_8 1 1 56 64 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_142 1 1 64 65 0=32 1=12 2=255
Permute transpose_215 1 1 65 66 0=2
Permute permute_124 1 1 63 67 0=3
MatMul matmul_187 2 1 61 67 68
BinaryOp mul_8 1 1 68 69 0=2 1=1 2=1.767770e-01
BinaryOp add_9 2 1 69 18 70
Softmax softmax_86 1 1 70 71 0=2 1=1
MatMul matmul_188 2 1 71 66 72
Permute transpose_216 1 1 72 73 0=2
Reshape reshape_143 1 1 73 74 0=384 1=255
Gemm gemm_9 1 1 74 75 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_10 2 1 75 55 76
LayerNorm ln_101 1 1 76 77 0=384 1=1.000000e-12
Split splitncnn_5 1 2 77 78 79
Gemm gemm_10 1 1 79 80 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_73 1 1 80 81
Gemm gemm_11 1 1 81 82 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_11 2 1 82 78 83
LayerNorm ln_102 1 1 83 84 0=384 1=1.000000e-12
Split splitncnn_6 1 4 84 85 86 87 88
Gemm gemm_12 1 1 88 89 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_144 1 1 89 90 0=32 1=12 2=255
Permute transpose_217 1 1 90 91 0=2
Gemm gemm_13 1 1 87 92 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_145 1 1 92 93 0=32 1=12 2=255
Gemm gemm_14 1 1 86 94 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_146 1 1 94 95 0=32 1=12 2=255
Permute transpose_218 1 1 95 96 0=2
Permute permute_125 1 1 93 97 0=3
MatMul matmul_189 2 1 91 97 98
BinaryOp mul_12 1 1 98 99 0=2 1=1 2=1.767770e-01
BinaryOp add_13 2 1 99 19 100
Softmax softmax_87 1 1 100 101 0=2 1=1
MatMul matmul_190 2 1 101 96 102
Permute transpose_219 1 1 102 103 0=2
Reshape reshape_147 1 1 103 104 0=384 1=255
Gemm gemm_15 1 1 104 105 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_14 2 1 105 85 106
LayerNorm ln_103 1 1 106 107 0=384 1=1.000000e-12
Split splitncnn_7 1 2 107 108 109
Gemm gemm_16 1 1 109 110 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_74 1 1 110 111
Gemm gemm_17 1 1 111 112 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_15 2 1 112 108 113
LayerNorm ln_104 1 1 113 114 0=384 1=1.000000e-12
Split splitncnn_8 1 4 114 115 116 117 118
Gemm gemm_18 1 1 118 119 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_148 1 1 119 120 0=32 1=12 2=255
Permute transpose_220 1 1 120 121 0=2
Gemm gemm_19 1 1 117 122 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_149 1 1 122 123 0=32 1=12 2=255
Gemm gemm_20 1 1 116 124 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_150 1 1 124 125 0=32 1=12 2=255
Permute transpose_221 1 1 125 126 0=2
Permute permute_126 1 1 123 127 0=3
MatMul matmul_191 2 1 121 127 128
BinaryOp mul_16 1 1 128 129 0=2 1=1 2=1.767770e-01
BinaryOp add_17 2 1 129 20 130
Softmax softmax_88 1 1 130 131 0=2 1=1
MatMul matmul_192 2 1 131 126 132
Permute transpose_222 1 1 132 133 0=2
Reshape reshape_151 1 1 133 134 0=384 1=255
Gemm gemm_21 1 1 134 135 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_18 2 1 135 115 136
LayerNorm ln_105 1 1 136 137 0=384 1=1.000000e-12
Split splitncnn_9 1 2 137 138 139
Gemm gemm_22 1 1 139 140 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_75 1 1 140 141
Gemm gemm_23 1 1 141 142 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_19 2 1 142 138 143
LayerNorm ln_106 1 1 143 144 0=384 1=1.000000e-12
Split splitncnn_10 1 4 144 145 146 147 148
Gemm gemm_24 1 1 148 149 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_152 1 1 149 150 0=32 1=12 2=255
Permute transpose_223 1 1 150 151 0=2
Gemm gemm_25 1 1 147 152 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_153 1 1 152 153 0=32 1=12 2=255
Gemm gemm_26 1 1 146 154 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_154 1 1 154 155 0=32 1=12 2=255
Permute transpose_224 1 1 155 156 0=2
Permute permute_127 1 1 153 157 0=3
MatMul matmul_193 2 1 151 157 158
BinaryOp mul_20 1 1 158 159 0=2 1=1 2=1.767770e-01
BinaryOp add_21 2 1 159 21 160
Softmax softmax_89 1 1 160 161 0=2 1=1
MatMul matmul_194 2 1 161 156 162
Permute transpose_225 1 1 162 163 0=2
Reshape reshape_155 1 1 163 164 0=384 1=255
Gemm gemm_27 1 1 164 165 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_22 2 1 165 145 166
LayerNorm ln_107 1 1 166 167 0=384 1=1.000000e-12
Split splitncnn_11 1 2 167 168 169
Gemm gemm_28 1 1 169 170 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_76 1 1 170 171
Gemm gemm_29 1 1 171 172 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_23 2 1 172 168 173
LayerNorm ln_108 1 1 173 174 0=384 1=1.000000e-12
Split splitncnn_12 1 4 174 175 176 177 178
Gemm gemm_30 1 1 178 179 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_156 1 1 179 180 0=32 1=12 2=255
Permute transpose_226 1 1 180 181 0=2
Gemm gemm_31 1 1 177 182 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_157 1 1 182 183 0=32 1=12 2=255
Gemm gemm_32 1 1 176 184 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_158 1 1 184 185 0=32 1=12 2=255
Permute transpose_227 1 1 185 186 0=2
Permute permute_128 1 1 183 187 0=3
MatMul matmul_195 2 1 181 187 188
BinaryOp mul_24 1 1 188 189 0=2 1=1 2=1.767770e-01
BinaryOp add_25 2 1 189 22 190
Softmax softmax_90 1 1 190 191 0=2 1=1
MatMul matmul_196 2 1 191 186 192
Permute transpose_228 1 1 192 193 0=2
Reshape reshape_159 1 1 193 194 0=384 1=255
Gemm gemm_33 1 1 194 195 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_26 2 1 195 175 196
LayerNorm ln_109 1 1 196 197 0=384 1=1.000000e-12
Split splitncnn_13 1 2 197 198 199
Gemm gemm_34 1 1 199 200 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_77 1 1 200 201
Gemm gemm_35 1 1 201 202 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_27 2 1 202 198 203
LayerNorm ln_110 1 1 203 204 0=384 1=1.000000e-12
Split splitncnn_14 1 4 204 205 206 207 208
Gemm gemm_36 1 1 208 209 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_160 1 1 209 210 0=32 1=12 2=255
Permute transpose_229 1 1 210 211 0=2
Gemm gemm_37 1 1 207 212 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_161 1 1 212 213 0=32 1=12 2=255
Gemm gemm_38 1 1 206 214 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_162 1 1 214 215 0=32 1=12 2=255
Permute transpose_230 1 1 215 216 0=2
Permute permute_129 1 1 213 217 0=3
MatMul matmul_197 2 1 211 217 218
BinaryOp mul_28 1 1 218 219 0=2 1=1 2=1.767770e-01
BinaryOp add_29 2 1 219 23 220
Softmax softmax_91 1 1 220 221 0=2 1=1
MatMul matmul_198 2 1 221 216 222
Permute transpose_231 1 1 222 223 0=2
Reshape reshape_163 1 1 223 224 0=384 1=255
Gemm gemm_39 1 1 224 225 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_30 2 1 225 205 226
LayerNorm ln_111 1 1 226 227 0=384 1=1.000000e-12
Split splitncnn_15 1 2 227 228 229
Gemm gemm_40 1 1 229 230 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_78 1 1 230 231
Gemm gemm_41 1 1 231 232 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_31 2 1 232 228 233
LayerNorm ln_112 1 1 233 234 0=384 1=1.000000e-12
Split splitncnn_16 1 4 234 235 236 237 238
Gemm gemm_42 1 1 238 239 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_164 1 1 239 240 0=32 1=12 2=255
Permute transpose_232 1 1 240 241 0=2
Gemm gemm_43 1 1 237 242 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_165 1 1 242 243 0=32 1=12 2=255
Gemm gemm_44 1 1 236 244 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_166 1 1 244 245 0=32 1=12 2=255
Permute transpose_233 1 1 245 246 0=2
Permute permute_130 1 1 243 247 0=3
MatMul matmul_199 2 1 241 247 248
BinaryOp mul_32 1 1 248 249 0=2 1=1 2=1.767770e-01
BinaryOp add_33 2 1 249 24 250
Softmax softmax_92 1 1 250 251 0=2 1=1
MatMul matmul_200 2 1 251 246 252
Permute transpose_234 1 1 252 253 0=2
Reshape reshape_167 1 1 253 254 0=384 1=255
Gemm gemm_45 1 1 254 255 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_34 2 1 255 235 256
LayerNorm ln_113 1 1 256 257 0=384 1=1.000000e-12
Split splitncnn_17 1 2 257 258 259
Gemm gemm_46 1 1 259 260 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_79 1 1 260 261
Gemm gemm_47 1 1 261 262 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_35 2 1 262 258 263
LayerNorm ln_114 1 1 263 264 0=384 1=1.000000e-12
Split splitncnn_18 1 4 264 265 266 267 268
Gemm gemm_48 1 1 268 269 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_168 1 1 269 270 0=32 1=12 2=255
Permute transpose_235 1 1 270 271 0=2
Gemm gemm_49 1 1 267 272 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_169 1 1 272 273 0=32 1=12 2=255
Gemm gemm_50 1 1 266 274 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_170 1 1 274 275 0=32 1=12 2=255
Permute transpose_236 1 1 275 276 0=2
Permute permute_131 1 1 273 277 0=3
MatMul matmul_201 2 1 271 277 278
BinaryOp mul_36 1 1 278 279 0=2 1=1 2=1.767770e-01
BinaryOp add_37 2 1 279 25 280
Softmax softmax_93 1 1 280 281 0=2 1=1
MatMul matmul_202 2 1 281 276 282
Permute transpose_237 1 1 282 283 0=2
Reshape reshape_171 1 1 283 284 0=384 1=255
Gemm gemm_51 1 1 284 285 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_38 2 1 285 265 286
LayerNorm ln_115 1 1 286 287 0=384 1=1.000000e-12
Split splitncnn_19 1 2 287 288 289
Gemm gemm_52 1 1 289 290 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_80 1 1 290 291
Gemm gemm_53 1 1 291 292 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_39 2 1 292 288 293
LayerNorm ln_116 1 1 293 294 0=384 1=1.000000e-12
Split splitncnn_20 1 4 294 295 296 297 298
Gemm gemm_54 1 1 298 299 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_172 1 1 299 300 0=32 1=12 2=255
Permute transpose_238 1 1 300 301 0=2
Gemm gemm_55 1 1 297 302 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_173 1 1 302 303 0=32 1=12 2=255
Gemm gemm_56 1 1 296 304 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_174 1 1 304 305 0=32 1=12 2=255
Permute transpose_239 1 1 305 306 0=2
Permute permute_132 1 1 303 307 0=3
MatMul matmul_203 2 1 301 307 308
BinaryOp mul_40 1 1 308 309 0=2 1=1 2=1.767770e-01
BinaryOp add_41 2 1 309 26 310
Softmax softmax_94 1 1 310 311 0=2 1=1
MatMul matmul_204 2 1 311 306 312
Permute transpose_240 1 1 312 313 0=2
Reshape reshape_175 1 1 313 314 0=384 1=255
Gemm gemm_57 1 1 314 315 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_42 2 1 315 295 316
LayerNorm ln_117 1 1 316 317 0=384 1=1.000000e-12
Split splitncnn_21 1 2 317 318 319
Gemm gemm_58 1 1 319 320 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_81 1 1 320 321
Gemm gemm_59 1 1 321 322 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_43 2 1 322 318 323
LayerNorm ln_118 1 1 323 324 0=384 1=1.000000e-12
Split splitncnn_22 1 4 324 325 326 327 328
Gemm gemm_60 1 1 328 329 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_176 1 1 329 330 0=32 1=12 2=255
Permute transpose_241 1 1 330 331 0=2
Gemm gemm_61 1 1 327 332 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_177 1 1 332 333 0=32 1=12 2=255
Gemm gemm_62 1 1 326 334 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_178 1 1 334 335 0=32 1=12 2=255
Permute transpose_242 1 1 335 336 0=2
Permute permute_133 1 1 333 337 0=3
MatMul matmul_205 2 1 331 337 338
BinaryOp mul_44 1 1 338 339 0=2 1=1 2=1.767770e-01
BinaryOp add_45 2 1 339 27 340
Softmax softmax_95 1 1 340 341 0=2 1=1
MatMul matmul_206 2 1 341 336 342
Permute transpose_243 1 1 342 343 0=2
Reshape reshape_179 1 1 343 344 0=384 1=255
Gemm gemm_63 1 1 344 345 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_46 2 1 345 325 346
LayerNorm ln_119 1 1 346 347 0=384 1=1.000000e-12
Split splitncnn_23 1 2 347 348 349
Gemm gemm_64 1 1 349 350 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_82 1 1 350 351
Gemm gemm_65 1 1 351 352 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_47 2 1 352 348 353
LayerNorm ln_120 1 1 353 354 0=384 1=1.000000e-12
Split splitncnn_24 1 4 354 355 356 357 358
Gemm gemm_66 1 1 358 359 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_180 1 1 359 360 0=32 1=12 2=255
Permute transpose_244 1 1 360 361 0=2
Gemm gemm_67 1 1 357 362 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_181 1 1 362 363 0=32 1=12 2=255
Gemm gemm_68 1 1 356 364 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
Reshape reshape_182 1 1 364 365 0=32 1=12 2=255
Permute transpose_245 1 1 365 366 0=2
Permute permute_134 1 1 363 367 0=3
MatMul matmul_207 2 1 361 367 368
BinaryOp mul_48 1 1 368 369 0=2 1=1 2=1.767770e-01
BinaryOp add_49 2 1 369 28 370
Softmax softmax_96 1 1 370 371 0=2 1=1
MatMul matmul_208 2 1 371 366 372
Permute transpose_246 1 1 372 373 0=2
Reshape reshape_183 1 1 373 374 0=384 1=255
Gemm gemm_69 1 1 374 375 3=1 5=1 6=1 7=255 8=384 9=384 10=4 18=2
BinaryOp add_50 2 1 375 355 376
LayerNorm ln_121 1 1 376 377 0=384 1=1.000000e-12
Split splitncnn_25 1 2 377 378 379
Gemm gemm_70 1 1 379 380 3=1 5=1 6=1 7=255 8=1536 9=384 10=4 18=2
GELU gelu_83 1 1 380 381
Gemm gemm_71 1 1 381 382 3=1 5=1 6=1 7=255 8=384 9=1536 10=4 18=2
BinaryOp add_51 2 1 382 378 383
LayerNorm ln_122 1 1 383 384 0=384 1=1.000000e-12
ExpandDims unsqueeze_247 1 1 3 385 -23303=1,-1
Split splitncnn_26 1 2 385 386 387
BinaryOp mul_52 2 1 384 386 388 0=2
Reduction sum_209 1 1 388 389 1=0 -23303=1,0 5=1
Reduction sum_210 1 1 387 390 1=0 -23303=1,0 5=1
Clip clamp_184 1 1 390 391 0=1.000000e+00 1=3.402823e+38
BinaryOp div_53 2 1 389 391 392 0=3
Normalize normalize_84 1 1 392 out0 0=1 1=1 2=1.000000e-12 3=1 9=1