File size: 1,358 Bytes
5be0d4a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 |
t5-small - T5-Small-Human-Attentive-Try2-Pass2-step1000
generation_config.json: 100%
147/147 [00:00<00:00, 7.39kB/s]
layer mean_abs_diff max_abs_diff sum_abs_diff
shared.weight 0.174424 6.953552 2.869195e+06
decoder.final_layer_norm.weight 0.024521 0.154768 1.255470e+01
decoder.block.4.layer.0.SelfAttention.o.weight 0.018399 0.419979 4.823166e+03
decoder.block.5.layer.2.DenseReluDense.wo.weight 0.016679 1.636604 1.748921e+04
decoder.block.5.layer.1.EncDecAttention.v.weight 0.016636 0.149930 4.360904e+03
decoder.block.5.layer.2.layer_norm.weight 0.016384 0.055661 8.388475e+00
decoder.block.5.layer.2.DenseReluDense.wi.weight 0.016216 1.137286 1.700386e+04
decoder.block.5.layer.1.EncDecAttention.o.weight 0.015909 0.295170 4.170528e+03
decoder.block.0.layer.0.SelfAttention.relative_attention_bias.weight 0.015417 0.182647 3.946715e+00
decoder.block.5.layer.0.SelfAttention.o.weight 0.014727 0.399601 3.860541e+03 |