| { | |
| "prompt_tokens": 300, | |
| "first_token": 1039, | |
| "native_next_argmax": 2009, | |
| "custom_next_argmax": 2009, | |
| "logits_max_abs_diff": 0.30511796474456787, | |
| "logits_mean_abs_diff": 0.0421568788588047, | |
| "fixed_cache_length": 512, | |
| "fixed_native_max_abs_diff": 0.30511796474456787, | |
| "fixed_native_mean_abs_diff": 0.04215686395764351, | |
| "fixed_growing_max_abs_diff": 4.76837158203125e-06, | |
| "fixed_custom_next_argmax": 2009, | |
| "full_layers": 6, | |
| "linear_layers": 18, | |
| "next_full_key_shape": [ | |
| 1, | |
| 2, | |
| 301, | |
| 256 | |
| ], | |
| "next_conv_shape": [ | |
| 1, | |
| 6144, | |
| 4 | |
| ], | |
| "next_recurrent_shape": [ | |
| 1, | |
| 16, | |
| 128, | |
| 128 | |
| ] | |
| } | |