{ "model_name": "openai/whisper-medium", "model_config": { "transformers_version": "5.5.3", "architectures": [ "WhisperForConditionalGeneration" ], "output_hidden_states": false, "return_dict": true, "dtype": "float32", "chunk_size_feed_forward": 0, "is_encoder_decoder": true, "id2label": { "0": "LABEL_0", "1": "LABEL_1" }, "label2id": { "LABEL_0": 0, "LABEL_1": 1 }, "problem_type": null, "vocab_size": 51865, "num_mel_bins": 80, "encoder_layers": 24, "encoder_attention_heads": 16, "decoder_layers": 24, "decoder_attention_heads": 16, "decoder_ffn_dim": 4096, "encoder_ffn_dim": 4096, "encoder_layerdrop": 0.0, "decoder_layerdrop": 0.0, "decoder_start_token_id": 50258, "use_cache": true, "activation_function": "gelu", "d_model": 1024, "dropout": 0.0, "attention_dropout": 0.0, "activation_dropout": 0.0, "init_std": 0.02, "scale_embedding": false, "max_source_positions": 1500, "max_target_positions": 448, "pad_token_id": 50257, "bos_token_id": 50257, "eos_token_id": 50257, "suppress_tokens": [ 1, 2, 7, 8, 9, 10, 14, 25, 26, 27, 28, 29, 31, 58, 59, 60, 61, 62, 63, 90, 91, 92, 93, 359, 503, 522, 542, 873, 893, 902, 918, 922, 931, 1350, 1853, 1982, 2460, 2627, 3246, 3253, 3268, 3536, 3846, 3961, 4183, 4667, 6585, 6647, 7273, 9061, 9383, 10428, 10929, 11938, 12033, 12331, 12562, 13793, 14157, 14635, 15265, 15618, 16553, 16604, 18362, 18956, 20075, 21675, 22520, 26130, 26161, 26435, 28279, 29464, 31650, 32302, 32470, 36865, 42863, 47425, 49870, 50254, 50258, 50358, 50359, 50360, 50361, 50362 ], "begin_suppress_tokens": [ 220, 50257 ], "use_weighted_layer_sum": false, "classifier_proj_size": 256, "apply_spec_augment": false, "mask_time_prob": 0.05, "mask_time_length": 10, "mask_time_min_masks": 2, "mask_feature_prob": 0.0, "mask_feature_length": 10, "mask_feature_min_masks": 0, "median_filter_width": 7, "tie_word_embeddings": true, "_name_or_path": "openai/whisper-medium", "forced_decoder_ids": [ [ 1, 50259 ], [ 2, 50359 ], [ 3, 50363 ] ], "model_type": "whisper", "output_attentions": false }, "quant_config": { "components": [ "decoder" ], "scheme": "tritplane3", "group_size": 32, "n_iter": 10, "salient_fraction": 0.0, "rescue_fraction": 0.0, "n_planes": 3, "allow_all_linear": false, "target_module_names": [ "Wqkv", "att_proj", "attn.proj", "attn.qkv", "c_attn", "c_fc", "c_proj", "dense", "dense_4h_to_h", "dense_h_to_4h", "down_proj", "fc1", "fc2", "ff_proj", "gate_proj", "gate_up_proj", "k", "k_proj", "linear", "o", "o_proj", "out_proj", "per_layer_input_gate", "per_layer_projection", "proj", "q", "q_proj", "qkv", "qkv_proj", "query_key_value", "up_proj", "v", "v_proj", "w1", "w2", "w3", "wi", "wi_0", "wi_1", "wo" ], "max_length": 160, "calibration_batch_size": 2, "calibration_prompts": null, "vlm_use_demo_image": true }, "plan": {}, "layer_info": { "model.decoder.layers.0.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.0.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.0.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.1.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.1.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.1.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.2.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.2.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.2.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.3.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.3.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.3.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.4.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.4.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.4.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.5.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.5.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.5.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.6.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.6.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.6.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.7.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.7.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.7.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.8.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.8.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.8.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.9.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.9.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.9.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.10.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.10.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.10.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.11.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.11.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.11.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.12.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.12.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.12.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.13.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.13.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.13.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.14.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.14.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.14.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.15.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.15.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.15.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.16.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.16.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.16.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.17.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.17.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.17.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.18.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.18.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.18.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.19.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.19.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.19.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.20.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.20.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.20.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.21.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.21.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.21.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.22.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.22.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.22.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.23.self_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.self_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.self_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.self_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.encoder_attn.k_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.encoder_attn.v_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.encoder_attn.q_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.encoder_attn.out_proj": { "scheme": "tritplane_small_v1", "shape": [ 1024, 1024 ], "dtype": "torch.float32", "num_elements": 1048576, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 1179648, "effective_bits": 9.0 }, "model.decoder.layers.23.fc1": { "scheme": "tritplane_small_v1", "shape": [ 4096, 1024 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 }, "model.decoder.layers.23.fc2": { "scheme": "tritplane_small_v1", "shape": [ 1024, 4096 ], "dtype": "torch.float32", "num_elements": 4194304, "n_planes": 3, "group_sizes": [ 32, 32, 32 ], "rescued_rows": 0, "stored_bytes": 4718592, "effective_bits": 9.0 } }, "stats": { "model.decoder.layers.0.self_attn.k_proj": { "mse": 8.22391393739963e-06, "rmse": 0.0028677367273513147, "relative_error": 0.11225825031610676, "max_error": 0.07249832153320312, "sparsity": 0.39663855234781903, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.self_attn.v_proj": { "mse": 2.537128693802515e-06, "rmse": 0.001592836681459375, "relative_error": 0.1253849898161065, "max_error": 0.052634596824645996, "sparsity": 0.3911902109781901, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.self_attn.q_proj": { "mse": 7.867356544011272e-06, "rmse": 0.002804880843103905, "relative_error": 0.11485303222807783, "max_error": 0.12257003784179688, "sparsity": 0.3965638478597005, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.self_attn.out_proj": { "mse": 2.3530305952590425e-06, "rmse": 0.0015339591243768663, "relative_error": 0.12316348329498344, "max_error": 0.05019688606262207, "sparsity": 0.3834683100382487, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.encoder_attn.k_proj": { "mse": 2.932305505964905e-06, "rmse": 0.0017123975899203156, "relative_error": 0.14878440781545277, "max_error": 0.052741289138793945, "sparsity": 0.38413047790527344, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.encoder_attn.v_proj": { "mse": 2.9527541300922167e-06, "rmse": 0.0017183579749552235, "relative_error": 0.15262952638414398, "max_error": 0.04509568214416504, "sparsity": 0.3845523198445638, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.encoder_attn.q_proj": { "mse": 1.7530026070744498e-06, "rmse": 0.001324010047950713, "relative_error": 0.11584667248381872, "max_error": 0.0369831919670105, "sparsity": 0.38655567169189453, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.encoder_attn.out_proj": { "mse": 3.997231488028774e-06, "rmse": 0.0019993077522054412, "relative_error": 0.1804483932496295, "max_error": 0.04954719543457031, "sparsity": 0.3609612782796224, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.fc1": { "mse": 3.4595873330545146e-06, "rmse": 0.0018599965949040106, "relative_error": 0.12480082603415626, "max_error": 0.06718039512634277, "sparsity": 0.39367198944091797, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.0.fc2": { "mse": 9.965755452867597e-06, "rmse": 0.0031568584784351034, "relative_error": 0.258659206797803, "max_error": 0.10831642150878906, "sparsity": 0.3432497978210449, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.self_attn.k_proj": { "mse": 2.03306717594387e-06, "rmse": 0.0014258566463511927, "relative_error": 0.10631741618956413, "max_error": 0.050121307373046875, "sparsity": 0.38936614990234375, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.self_attn.v_proj": { "mse": 1.2314576451899484e-06, "rmse": 0.0011097106132636329, "relative_error": 0.12502401296497923, "max_error": 0.036118507385253906, "sparsity": 0.39406808217366535, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.self_attn.q_proj": { "mse": 2.091504939016886e-06, "rmse": 0.0014462036298588405, "relative_error": 0.114342204814357, "max_error": 0.052300095558166504, "sparsity": 0.3865979512532552, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.self_attn.out_proj": { "mse": 2.3585996586916735e-06, "rmse": 0.0015357733096689997, "relative_error": 0.16983263226843545, "max_error": 0.055203378200531006, "sparsity": 0.36684226989746094, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.encoder_attn.k_proj": { "mse": 2.569649268480134e-06, "rmse": 0.0016030125603001787, "relative_error": 0.145535704383827, "max_error": 0.061995506286621094, "sparsity": 0.3825670878092448, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.encoder_attn.v_proj": { "mse": 2.6175509901804617e-06, "rmse": 0.001617884727099079, "relative_error": 0.152717885751071, "max_error": 0.05068695545196533, "sparsity": 0.385009765625, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.encoder_attn.q_proj": { "mse": 1.3694378822037834e-06, "rmse": 0.0011702298416139383, "relative_error": 0.10105443997993861, "max_error": 0.051283836364746094, "sparsity": 0.3925361633300781, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.encoder_attn.out_proj": { "mse": 3.2205025490839034e-06, "rmse": 0.001794575868857013, "relative_error": 0.1678963406077039, "max_error": 0.07158446311950684, "sparsity": 0.3641344706217448, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.fc1": { "mse": 2.8058025236532558e-06, "rmse": 0.001675052991297068, "relative_error": 0.12601454584557661, "max_error": 0.08018875122070312, "sparsity": 0.38286805152893066, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.1.fc2": { "mse": 7.15729493094841e-06, "rmse": 0.0026753121184169165, "relative_error": 0.2385123906472085, "max_error": 0.1420459747314453, "sparsity": 0.37098320325215656, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.self_attn.k_proj": { "mse": 1.408790922141634e-06, "rmse": 0.0011869249858949106, "relative_error": 0.15586319641563348, "max_error": 0.05228686332702637, "sparsity": 0.38851292928059894, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.self_attn.v_proj": { "mse": 2.4211458367062733e-06, "rmse": 0.0015560031608921215, "relative_error": 0.19859374281883027, "max_error": 0.0744476318359375, "sparsity": 0.39120133717854816, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.self_attn.q_proj": { "mse": 1.3298435987962876e-06, "rmse": 0.0011531884489519861, "relative_error": 0.1712732837930552, "max_error": 0.044757843017578125, "sparsity": 0.38156604766845703, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.self_attn.out_proj": { "mse": 3.029804929610691e-06, "rmse": 0.0017406334851457646, "relative_error": 0.2584208819885451, "max_error": 0.07974696159362793, "sparsity": 0.35305945078531903, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.encoder_attn.k_proj": { "mse": 2.2631470528722275e-06, "rmse": 0.001504375967925647, "relative_error": 0.1425945197962898, "max_error": 0.04911303520202637, "sparsity": 0.3848470052083333, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.encoder_attn.v_proj": { "mse": 3.066921181016369e-06, "rmse": 0.0017512627390018805, "relative_error": 0.15523498710637637, "max_error": 0.043721556663513184, "sparsity": 0.3850396474202474, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.encoder_attn.q_proj": { "mse": 1.306824174207577e-06, "rmse": 0.0011431641064202362, "relative_error": 0.10384071954394945, "max_error": 0.0584259033203125, "sparsity": 0.39062023162841797, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.encoder_attn.out_proj": { "mse": 2.39322457673552e-06, "rmse": 0.0015470050344893902, "relative_error": 0.13837125067483497, "max_error": 0.03503692150115967, "sparsity": 0.3704687754313151, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.fc1": { "mse": 2.6717477794591105e-06, "rmse": 0.0016345481881728388, "relative_error": 0.13424853534381614, "max_error": 0.12715303897857666, "sparsity": 0.37990784645080566, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.2.fc2": { "mse": 6.862672307761386e-06, "rmse": 0.002619670266991895, "relative_error": 0.24381065264040552, "max_error": 0.22676372528076172, "sparsity": 0.3882887363433838, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.self_attn.k_proj": { "mse": 1.7996961787503096e-06, "rmse": 0.0013415275542270123, "relative_error": 0.1192658384835929, "max_error": 0.04256439208984375, "sparsity": 0.37576770782470703, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.self_attn.v_proj": { "mse": 2.0297898117860314e-06, "rmse": 0.0014247069213652438, "relative_error": 0.13746902832804708, "max_error": 0.03883171081542969, "sparsity": 0.38527584075927734, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.self_attn.q_proj": { "mse": 2.1074170035717543e-06, "rmse": 0.0014516945283260367, "relative_error": 0.11590249312665402, "max_error": 0.07066059112548828, "sparsity": 0.38370641072591144, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.self_attn.out_proj": { "mse": 1.333709519713011e-06, "rmse": 0.0011548634203718685, "relative_error": 0.117272895602355, "max_error": 0.07680273056030273, "sparsity": 0.4009917577107747, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.encoder_attn.k_proj": { "mse": 2.471836751283263e-06, "rmse": 0.001572207604384123, "relative_error": 0.14458506102228255, "max_error": 0.04527485370635986, "sparsity": 0.3834635416666667, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.encoder_attn.v_proj": { "mse": 3.16734735861246e-06, "rmse": 0.0017797042896538907, "relative_error": 0.15301164247019403, "max_error": 0.059139907360076904, "sparsity": 0.3846127192179362, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.encoder_attn.q_proj": { "mse": 1.4525229516948457e-06, "rmse": 0.001205206601249282, "relative_error": 0.10425491084889804, "max_error": 0.09468531608581543, "sparsity": 0.3902708689371745, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.encoder_attn.out_proj": { "mse": 2.678065584404976e-06, "rmse": 0.0016364796315276814, "relative_error": 0.1430544824579208, "max_error": 0.051494598388671875, "sparsity": 0.37117163340250653, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.fc1": { "mse": 2.3618308659933973e-06, "rmse": 0.0015368249301704463, "relative_error": 0.1245729986149135, "max_error": 0.05836009979248047, "sparsity": 0.37219882011413574, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.3.fc2": { "mse": 1.5611518392688595e-05, "rmse": 0.003951141403783037, "relative_error": 0.3720975771798556, "max_error": 0.5879669189453125, "sparsity": 0.38265403111775714, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.self_attn.k_proj": { "mse": 2.8701028895739e-06, "rmse": 0.0016941378012351592, "relative_error": 0.11716970889271452, "max_error": 0.055669307708740234, "sparsity": 0.3828910191853841, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.self_attn.v_proj": { "mse": 1.9905580757040298e-06, "rmse": 0.0014108713887892226, "relative_error": 0.12301872679402027, "max_error": 0.053325772285461426, "sparsity": 0.3898334503173828, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.self_attn.q_proj": { "mse": 2.990354914800264e-06, "rmse": 0.0017292642697980733, "relative_error": 0.11543029947746948, "max_error": 0.06011366844177246, "sparsity": 0.3869177500406901, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.self_attn.out_proj": { "mse": 1.7686877527012257e-06, "rmse": 0.001329920205388739, "relative_error": 0.1234683605164969, "max_error": 0.06157732009887695, "sparsity": 0.3810313542683919, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.encoder_attn.k_proj": { "mse": 2.4499702249158872e-06, "rmse": 0.0015652380729192243, "relative_error": 0.14753199522550947, "max_error": 0.04569506645202637, "sparsity": 0.38436158498128253, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.encoder_attn.v_proj": { "mse": 3.2714881399442675e-06, "rmse": 0.0018087255568339459, "relative_error": 0.15390755351674237, "max_error": 0.04762768745422363, "sparsity": 0.38466930389404297, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.encoder_attn.q_proj": { "mse": 1.2864924201494432e-06, "rmse": 0.001134236492160891, "relative_error": 0.10177971901165225, "max_error": 0.0303804874420166, "sparsity": 0.39114030202229816, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.encoder_attn.out_proj": { "mse": 2.4311630113516003e-06, "rmse": 0.0015592187182533438, "relative_error": 0.13463845742763503, "max_error": 0.04355788230895996, "sparsity": 0.3733196258544922, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.fc1": { "mse": 2.469627816026332e-06, "rmse": 0.001571504952593638, "relative_error": 0.12524985734406285, "max_error": 0.08176088333129883, "sparsity": 0.3696654637654622, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.4.fc2": { "mse": 5.365253400668735e-06, "rmse": 0.002316301664435946, "relative_error": 0.21985876196410048, "max_error": 0.16083449125289917, "sparsity": 0.3907614549001058, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.self_attn.k_proj": { "mse": 2.7977457648376003e-06, "rmse": 0.0016726463358515452, "relative_error": 0.10678882412118908, "max_error": 0.06360578536987305, "sparsity": 0.3896319071451823, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.self_attn.v_proj": { "mse": 2.054051037703175e-06, "rmse": 0.0014331960918531612, "relative_error": 0.11478326691502795, "max_error": 0.04179668426513672, "sparsity": 0.3933906555175781, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.self_attn.q_proj": { "mse": 2.887436266973964e-06, "rmse": 0.0016992457935725378, "relative_error": 0.10747942741596392, "max_error": 0.07212746143341064, "sparsity": 0.39190673828125, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.self_attn.out_proj": { "mse": 2.422082388875424e-06, "rmse": 0.0015563040798235491, "relative_error": 0.12821936986008606, "max_error": 0.03042781352996826, "sparsity": 0.37738768259684247, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.encoder_attn.k_proj": { "mse": 2.1594835288851755e-06, "rmse": 0.0014695181281240376, "relative_error": 0.14820830447000122, "max_error": 0.05715823173522949, "sparsity": 0.38480599721272785, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.encoder_attn.v_proj": { "mse": 2.402921154498472e-06, "rmse": 0.0015501358503365026, "relative_error": 0.15172739547983966, "max_error": 0.049695730209350586, "sparsity": 0.38500118255615234, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.encoder_attn.q_proj": { "mse": 1.2580545671880827e-06, "rmse": 0.0011216303166320365, "relative_error": 0.10791561656075024, "max_error": 0.07042884826660156, "sparsity": 0.39124329884847003, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.encoder_attn.out_proj": { "mse": 2.0925813259964343e-06, "rmse": 0.0014465757242524272, "relative_error": 0.1422147514369969, "max_error": 0.05846059322357178, "sparsity": 0.37059179941813153, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.fc1": { "mse": 3.071619175898377e-06, "rmse": 0.0017526035421333533, "relative_error": 0.12686562610632215, "max_error": 0.0797877311706543, "sparsity": 0.3853236834208171, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.5.fc2": { "mse": 5.129960754857166e-06, "rmse": 0.002264941666987732, "relative_error": 0.1860462585742565, "max_error": 0.05859053134918213, "sparsity": 0.38653842608133954, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.self_attn.k_proj": { "mse": 2.7227015380049124e-06, "rmse": 0.001650061070992499, "relative_error": 0.1084165589968581, "max_error": 0.05523967742919922, "sparsity": 0.3882598876953125, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.self_attn.v_proj": { "mse": 1.960485178642557e-06, "rmse": 0.0014001732673646348, "relative_error": 0.11180013694606943, "max_error": 0.06603431701660156, "sparsity": 0.3924814860026042, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.self_attn.q_proj": { "mse": 2.7193116238777293e-06, "rmse": 0.0016490335423749662, "relative_error": 0.10691578744139109, "max_error": 0.04374641180038452, "sparsity": 0.3899396260579427, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.self_attn.out_proj": { "mse": 2.0261477402527817e-06, "rmse": 0.0014234281647672923, "relative_error": 0.11932234164492085, "max_error": 0.05954170227050781, "sparsity": 0.3812958399454753, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.encoder_attn.k_proj": { "mse": 1.914561835292261e-06, "rmse": 0.0013836769259087402, "relative_error": 0.1409572228796846, "max_error": 0.05499941110610962, "sparsity": 0.3855908711751302, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.encoder_attn.v_proj": { "mse": 2.064477939711651e-06, "rmse": 0.0014368291268315975, "relative_error": 0.15090229510718225, "max_error": 0.041681647300720215, "sparsity": 0.38470935821533203, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.encoder_attn.q_proj": { "mse": 1.2734592473861994e-06, "rmse": 0.0011284765160986733, "relative_error": 0.10325489365368369, "max_error": 0.03181350231170654, "sparsity": 0.3910401662190755, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.encoder_attn.out_proj": { "mse": 1.8945763713418273e-06, "rmse": 0.0013764361123357043, "relative_error": 0.1406672765822477, "max_error": 0.03437471389770508, "sparsity": 0.37631797790527344, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.fc1": { "mse": 3.0933047128200997e-06, "rmse": 0.0017587793246510773, "relative_error": 0.12332660056166439, "max_error": 0.09690666198730469, "sparsity": 0.3895715077718099, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.6.fc2": { "mse": 5.023699941375526e-06, "rmse": 0.002241361180482861, "relative_error": 0.17801352059730607, "max_error": 0.07062911987304688, "sparsity": 0.38503503799438477, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.self_attn.k_proj": { "mse": 2.669979267011513e-06, "rmse": 0.001634007119633055, "relative_error": 0.10356912057004246, "max_error": 0.05674147605895996, "sparsity": 0.39308420817057294, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.self_attn.v_proj": { "mse": 1.693527110546711e-06, "rmse": 0.0013013558739048711, "relative_error": 0.10513660505308145, "max_error": 0.04603254795074463, "sparsity": 0.39510377248128253, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.self_attn.q_proj": { "mse": 2.754891966105788e-06, "rmse": 0.0016597867230779345, "relative_error": 0.10414344160911279, "max_error": 0.0881616473197937, "sparsity": 0.3932339350382487, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.self_attn.out_proj": { "mse": 2.3079376205714652e-06, "rmse": 0.0015191897908330826, "relative_error": 0.12670858213626052, "max_error": 0.0412135124206543, "sparsity": 0.37942059834798175, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.encoder_attn.k_proj": { "mse": 3.342863919897354e-06, "rmse": 0.0018283500539823753, "relative_error": 0.15063672352428492, "max_error": 0.0661466121673584, "sparsity": 0.3860619862874349, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.encoder_attn.v_proj": { "mse": 2.972983565996401e-06, "rmse": 0.00172423419696873, "relative_error": 0.15345657818512687, "max_error": 0.21555328369140625, "sparsity": 0.38444073994954425, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.encoder_attn.q_proj": { "mse": 1.6744468211982166e-06, "rmse": 0.0012940041812908552, "relative_error": 0.10236945613803666, "max_error": 0.060260772705078125, "sparsity": 0.39227835337320965, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.encoder_attn.out_proj": { "mse": 2.9717300549236825e-06, "rmse": 0.0017238706607294186, "relative_error": 0.15377582478905313, "max_error": 0.08759880065917969, "sparsity": 0.3660281499226888, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.fc1": { "mse": 2.8657561870204518e-06, "rmse": 0.001692854449449347, "relative_error": 0.11476676538134392, "max_error": 0.1609211564064026, "sparsity": 0.39171473185221356, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.7.fc2": { "mse": 5.369829978008056e-06, "rmse": 0.0023172893600083818, "relative_error": 0.17915047105444631, "max_error": 0.06115150451660156, "sparsity": 0.3791286150614421, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.self_attn.k_proj": { "mse": 2.874462779800524e-06, "rmse": 0.001695424070785986, "relative_error": 0.10408217734095601, "max_error": 0.04898780584335327, "sparsity": 0.39197508494059247, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.self_attn.v_proj": { "mse": 1.954801291503827e-06, "rmse": 0.0013981420855921, "relative_error": 0.10715554077548149, "max_error": 0.04911994934082031, "sparsity": 0.39489396413167316, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.self_attn.q_proj": { "mse": 2.988884716614848e-06, "rmse": 0.0017288391239831565, "relative_error": 0.10488478135736144, "max_error": 0.052776336669921875, "sparsity": 0.3927752176920573, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.self_attn.out_proj": { "mse": 2.2270126009971136e-06, "rmse": 0.0014923178619171969, "relative_error": 0.11837970535523554, "max_error": 0.04682779312133789, "sparsity": 0.38154157002766925, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.encoder_attn.k_proj": { "mse": 4.145021193835419e-06, "rmse": 0.002035932512102358, "relative_error": 0.14794230558981988, "max_error": 0.06369626522064209, "sparsity": 0.38465213775634766, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.encoder_attn.v_proj": { "mse": 3.111481191808707e-06, "rmse": 0.0017639391122736372, "relative_error": 0.15156701666066377, "max_error": 0.04685235023498535, "sparsity": 0.38491566975911456, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.encoder_attn.q_proj": { "mse": 2.2250369511311874e-06, "rmse": 0.0014916557750135207, "relative_error": 0.10434207297549174, "max_error": 0.050441741943359375, "sparsity": 0.39132245381673175, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.encoder_attn.out_proj": { "mse": 3.1934757771523437e-06, "rmse": 0.0017870298758421313, "relative_error": 0.15283987169747038, "max_error": 0.08969151973724365, "sparsity": 0.3676007588704427, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.fc1": { "mse": 2.79184632745455e-06, "rmse": 0.0016708819011092765, "relative_error": 0.11036536299564526, "max_error": 0.12213349342346191, "sparsity": 0.3927458127339681, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.8.fc2": { "mse": 5.2020336624991614e-06, "rmse": 0.002280796716610045, "relative_error": 0.17299622967154382, "max_error": 0.07349264621734619, "sparsity": 0.3765496412913005, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.self_attn.k_proj": { "mse": 3.0386931939574424e-06, "rmse": 0.0017431847847997762, "relative_error": 0.1058218625977078, "max_error": 0.0761750340461731, "sparsity": 0.3904520670572917, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.self_attn.v_proj": { "mse": 2.23638562601991e-06, "rmse": 0.0014954549896335596, "relative_error": 0.11097779406996414, "max_error": 0.041104793548583984, "sparsity": 0.3938833872477214, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.self_attn.q_proj": { "mse": 3.189991730323527e-06, "rmse": 0.0017860547948827122, "relative_error": 0.10832728289648673, "max_error": 0.06943631172180176, "sparsity": 0.3921623229980469, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.self_attn.out_proj": { "mse": 2.696985120564932e-06, "rmse": 0.001642250017678469, "relative_error": 0.1281785123233537, "max_error": 0.18055415153503418, "sparsity": 0.37871678670247394, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.encoder_attn.k_proj": { "mse": 3.2500684028491378e-06, "rmse": 0.0018027946091690916, "relative_error": 0.14403063462528215, "max_error": 0.056221961975097656, "sparsity": 0.3845011393229167, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.encoder_attn.v_proj": { "mse": 3.189758899679873e-06, "rmse": 0.0017859896135419917, "relative_error": 0.15269143882686897, "max_error": 0.04081469774246216, "sparsity": 0.38484986623128253, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.encoder_attn.q_proj": { "mse": 1.9499902919051237e-06, "rmse": 0.001396420528316998, "relative_error": 0.10472704022264365, "max_error": 0.03749656677246094, "sparsity": 0.3913602828979492, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.encoder_attn.out_proj": { "mse": 2.9134057513147127e-06, "rmse": 0.0017068701624068283, "relative_error": 0.14487531428174485, "max_error": 0.10330677032470703, "sparsity": 0.3698616027832031, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.fc1": { "mse": 2.8058291263732826e-06, "rmse": 0.0016750609321374798, "relative_error": 0.1102062185498671, "max_error": 0.19041013717651367, "sparsity": 0.3934587637583415, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.9.fc2": { "mse": 5.31405476067448e-06, "rmse": 0.002305223364594954, "relative_error": 0.17306741105103132, "max_error": 0.0740041732788086, "sparsity": 0.37359078725179035, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.self_attn.k_proj": { "mse": 2.8235283480171347e-06, "rmse": 0.0016803357843053676, "relative_error": 0.10581116696721167, "max_error": 0.12559711933135986, "sparsity": 0.39281590779622394, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.self_attn.v_proj": { "mse": 2.129301947206841e-06, "rmse": 0.0014592127833893318, "relative_error": 0.10461520351896639, "max_error": 0.06537044048309326, "sparsity": 0.39534536997477215, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.self_attn.q_proj": { "mse": 2.9481207093340345e-06, "rmse": 0.0017170092339105327, "relative_error": 0.10566365640016753, "max_error": 0.0826263427734375, "sparsity": 0.3939990997314453, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.self_attn.out_proj": { "mse": 3.0388287086680066e-06, "rmse": 0.0017432236542302903, "relative_error": 0.12941463793508615, "max_error": 0.04368305206298828, "sparsity": 0.37840938568115234, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.encoder_attn.k_proj": { "mse": 4.262691163603449e-06, "rmse": 0.002064628577638954, "relative_error": 0.1455730293477049, "max_error": 0.06619501113891602, "sparsity": 0.3850278854370117, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.encoder_attn.v_proj": { "mse": 4.141321824135957e-06, "rmse": 0.002035023789574942, "relative_error": 0.15507668501761301, "max_error": 0.046338558197021484, "sparsity": 0.38466326395670575, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.encoder_attn.q_proj": { "mse": 2.3088205125532113e-06, "rmse": 0.0015194803429308362, "relative_error": 0.10376620421198642, "max_error": 0.04837995767593384, "sparsity": 0.3922373453776042, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.encoder_attn.out_proj": { "mse": 3.749622464965796e-06, "rmse": 0.0019363941915234604, "relative_error": 0.15077165945466575, "max_error": 0.043268442153930664, "sparsity": 0.3687426249186198, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.fc1": { "mse": 2.742124252108624e-06, "rmse": 0.0016559360652237225, "relative_error": 0.10881992614733726, "max_error": 0.09426462650299072, "sparsity": 0.39169470469156903, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.10.fc2": { "mse": 5.248308752925368e-06, "rmse": 0.0022909187573821486, "relative_error": 0.16801593877256882, "max_error": 0.09567546844482422, "sparsity": 0.37460168202718097, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.self_attn.k_proj": { "mse": 3.0592714210797567e-06, "rmse": 0.0017490773056328176, "relative_error": 0.10734568285249818, "max_error": 0.09254008531570435, "sparsity": 0.3920777638753255, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.self_attn.v_proj": { "mse": 2.1376101813075365e-06, "rmse": 0.0014620568324478828, "relative_error": 0.10559583271255113, "max_error": 0.029812395572662354, "sparsity": 0.3952624003092448, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.self_attn.q_proj": { "mse": 3.1045001378515735e-06, "rmse": 0.0017619591759889255, "relative_error": 0.10693716839240887, "max_error": 0.090118408203125, "sparsity": 0.3924741744995117, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.self_attn.out_proj": { "mse": 3.1066649626154685e-06, "rmse": 0.0017625733921217206, "relative_error": 0.13225657965413115, "max_error": 0.06195068359375, "sparsity": 0.3758252461751302, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.encoder_attn.k_proj": { "mse": 4.285246177460067e-06, "rmse": 0.0020700836160551747, "relative_error": 0.14720766834565957, "max_error": 0.06798171997070312, "sparsity": 0.3851782480875651, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.encoder_attn.v_proj": { "mse": 4.828083092434099e-06, "rmse": 0.0021972899427326604, "relative_error": 0.1586933413077182, "max_error": 0.05201244354248047, "sparsity": 0.3848873774210612, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.encoder_attn.q_proj": { "mse": 2.283047706441721e-06, "rmse": 0.001510975746476998, "relative_error": 0.10365660136115314, "max_error": 0.048856914043426514, "sparsity": 0.3916358947753906, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.encoder_attn.out_proj": { "mse": 4.28708926847321e-06, "rmse": 0.00207052874128161, "relative_error": 0.15415400301442833, "max_error": 0.04470396041870117, "sparsity": 0.3667583465576172, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.fc1": { "mse": 2.7612836674961727e-06, "rmse": 0.001661711066189358, "relative_error": 0.10893671218267384, "max_error": 0.1811065673828125, "sparsity": 0.3911479314168294, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.11.fc2": { "mse": 5.29205226484919e-06, "rmse": 0.002300446101270184, "relative_error": 0.16487893138147464, "max_error": 0.11721420288085938, "sparsity": 0.373733123143514, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.self_attn.k_proj": { "mse": 2.9784519028908107e-06, "rmse": 0.0017258191976249455, "relative_error": 0.10706666687076272, "max_error": 0.10212254524230957, "sparsity": 0.3907483418782552, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.self_attn.v_proj": { "mse": 2.395839828750468e-06, "rmse": 0.0015478500666248225, "relative_error": 0.10913041404713451, "max_error": 0.05898064374923706, "sparsity": 0.39325809478759766, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.self_attn.q_proj": { "mse": 3.0919227356207557e-06, "rmse": 0.0017583864011134628, "relative_error": 0.10877376011568239, "max_error": 0.09144771099090576, "sparsity": 0.39208539326985675, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.self_attn.out_proj": { "mse": 3.2778616514406167e-06, "rmse": 0.0018104865786413929, "relative_error": 0.13259861849468188, "max_error": 0.05882430076599121, "sparsity": 0.3744872411092122, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.encoder_attn.k_proj": { "mse": 4.489171260502189e-06, "rmse": 0.002118766447842279, "relative_error": 0.14508222072774984, "max_error": 0.06339359283447266, "sparsity": 0.3842233022054036, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.encoder_attn.v_proj": { "mse": 4.473969056562055e-06, "rmse": 0.0021151758925824714, "relative_error": 0.1564127825375384, "max_error": 0.05270886421203613, "sparsity": 0.38474464416503906, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.encoder_attn.q_proj": { "mse": 2.4208638933487236e-06, "rmse": 0.0015559125596731726, "relative_error": 0.10374680012869537, "max_error": 0.03216981887817383, "sparsity": 0.39106400807698566, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.encoder_attn.out_proj": { "mse": 4.03118428948801e-06, "rmse": 0.002007780936628299, "relative_error": 0.15214832136551018, "max_error": 0.05477547645568848, "sparsity": 0.3683900833129883, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.fc1": { "mse": 2.6280795282218605e-06, "rmse": 0.0016211352590767558, "relative_error": 0.10722597587911696, "max_error": 0.1983776092529297, "sparsity": 0.3908070723215739, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.12.fc2": { "mse": 4.76806872029556e-06, "rmse": 0.0021835907859064528, "relative_error": 0.15451343321763653, "max_error": 0.06719207763671875, "sparsity": 0.37807003657023114, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.self_attn.k_proj": { "mse": 3.1032777769723907e-06, "rmse": 0.0017616122663549976, "relative_error": 0.10859283459981478, "max_error": 0.08640223741531372, "sparsity": 0.3908227284749349, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.self_attn.v_proj": { "mse": 2.4164837668649852e-06, "rmse": 0.0015545043476507183, "relative_error": 0.11088639104509466, "max_error": 0.09391403198242188, "sparsity": 0.3939778010050456, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.self_attn.q_proj": { "mse": 3.1459003366762772e-06, "rmse": 0.0017736686095988386, "relative_error": 0.10887852983292154, "max_error": 0.0973324179649353, "sparsity": 0.39158089955647785, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.self_attn.out_proj": { "mse": 3.010093223565491e-06, "rmse": 0.001734962023666654, "relative_error": 0.12833051491091624, "max_error": 0.08125495910644531, "sparsity": 0.37650807698567706, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.encoder_attn.k_proj": { "mse": 4.259429260855541e-06, "rmse": 0.002063838477414243, "relative_error": 0.14530331557484114, "max_error": 0.061621904373168945, "sparsity": 0.38376013437906903, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.encoder_attn.v_proj": { "mse": 4.011252713098656e-06, "rmse": 0.002002811202559706, "relative_error": 0.15357150644740222, "max_error": 0.05202364921569824, "sparsity": 0.38488419850667316, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.encoder_attn.q_proj": { "mse": 2.3202264856081456e-06, "rmse": 0.0015232289669016097, "relative_error": 0.10355130654722193, "max_error": 0.04495662450790405, "sparsity": 0.3904116948445638, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.encoder_attn.out_proj": { "mse": 3.6354515486891614e-06, "rmse": 0.001906686012087245, "relative_error": 0.14821881625212166, "max_error": 0.07686328887939453, "sparsity": 0.36955706278483075, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.fc1": { "mse": 2.724333626247244e-06, "rmse": 0.0016505555507910796, "relative_error": 0.10972522648773587, "max_error": 0.21759366989135742, "sparsity": 0.39084283510843915, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.13.fc2": { "mse": 4.931787771056406e-06, "rmse": 0.0022207628804211416, "relative_error": 0.15521514437074152, "max_error": 0.09429550170898438, "sparsity": 0.37915460268656415, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.self_attn.k_proj": { "mse": 3.087111963395728e-06, "rmse": 0.0017570179177787938, "relative_error": 0.1092595745005226, "max_error": 0.09504544734954834, "sparsity": 0.390896479288737, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.self_attn.v_proj": { "mse": 2.5206579721270828e-06, "rmse": 0.001587658014853036, "relative_error": 0.11081719637216424, "max_error": 0.051631927490234375, "sparsity": 0.39329179128011066, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.self_attn.q_proj": { "mse": 3.190672487107804e-06, "rmse": 0.0017862453602760747, "relative_error": 0.11018739252519799, "max_error": 0.08269834518432617, "sparsity": 0.3911660512288411, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.self_attn.out_proj": { "mse": 3.2235734579444397e-06, "rmse": 0.0017954312735230051, "relative_error": 0.12984946467693861, "max_error": 0.07321488857269287, "sparsity": 0.37707042694091797, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.encoder_attn.k_proj": { "mse": 4.632142918126192e-06, "rmse": 0.002152241370786788, "relative_error": 0.14750340403551016, "max_error": 0.06115221977233887, "sparsity": 0.3844248453776042, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.encoder_attn.v_proj": { "mse": 4.610026280715829e-06, "rmse": 0.0021470971754244915, "relative_error": 0.15607740424439667, "max_error": 0.05488014221191406, "sparsity": 0.3850485483805339, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.encoder_attn.q_proj": { "mse": 2.4240475795522798e-06, "rmse": 0.0015569353164317007, "relative_error": 0.10406009770556121, "max_error": 0.042209625244140625, "sparsity": 0.3910134633382161, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.encoder_attn.out_proj": { "mse": 3.991907306044595e-06, "rmse": 0.001997975802166932, "relative_error": 0.14917388540435966, "max_error": 0.1012420654296875, "sparsity": 0.3692118326822917, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.fc1": { "mse": 2.651945123943733e-06, "rmse": 0.001628479390088721, "relative_error": 0.10843630002577104, "max_error": 0.17707645893096924, "sparsity": 0.3903570969899495, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.14.fc2": { "mse": 5.093220352136996e-06, "rmse": 0.0022568164196799427, "relative_error": 0.15510645443953647, "max_error": 0.09729671478271484, "sparsity": 0.378409465154012, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.self_attn.k_proj": { "mse": 2.952674776679487e-06, "rmse": 0.00171833488490442, "relative_error": 0.11039714548231819, "max_error": 0.05137348175048828, "sparsity": 0.39000829060872394, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.self_attn.v_proj": { "mse": 2.5764302336028777e-06, "rmse": 0.0016051262360334397, "relative_error": 0.11392904939485686, "max_error": 0.07793331146240234, "sparsity": 0.3936421076456706, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.self_attn.q_proj": { "mse": 3.0681758289574645e-06, "rmse": 0.0017516209147408193, "relative_error": 0.111066066762652, "max_error": 0.061458587646484375, "sparsity": 0.3910897572835286, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.self_attn.out_proj": { "mse": 3.2459129215567373e-06, "rmse": 0.0018016417295224757, "relative_error": 0.13252200909794726, "max_error": 0.17857837677001953, "sparsity": 0.3764670689900716, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.encoder_attn.k_proj": { "mse": 3.870277396345045e-06, "rmse": 0.001967302060270625, "relative_error": 0.1451358525235946, "max_error": 0.05497002601623535, "sparsity": 0.38480281829833984, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.encoder_attn.v_proj": { "mse": 4.471807187655941e-06, "rmse": 0.002114664793213322, "relative_error": 0.15706173162807832, "max_error": 0.07093095779418945, "sparsity": 0.3840920130411784, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.encoder_attn.q_proj": { "mse": 2.2638698737864615e-06, "rmse": 0.0015046161881976617, "relative_error": 0.10758771192543139, "max_error": 0.06101179122924805, "sparsity": 0.389739990234375, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.encoder_attn.out_proj": { "mse": 4.6661739361297805e-06, "rmse": 0.00216013285150006, "relative_error": 0.164261855187405, "max_error": 0.16168975830078125, "sparsity": 0.36803849538167316, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.fc1": { "mse": 2.6208585950371344e-06, "rmse": 0.0016189066047913741, "relative_error": 0.10883047265246418, "max_error": 0.2597169876098633, "sparsity": 0.3904755115509033, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.15.fc2": { "mse": 5.432469151855912e-06, "rmse": 0.002330765786572283, "relative_error": 0.15863985173106748, "max_error": 0.09306836128234863, "sparsity": 0.37816667556762695, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.self_attn.k_proj": { "mse": 2.975872803290258e-06, "rmse": 0.0017250718255453186, "relative_error": 0.11149507911807895, "max_error": 0.0687759518623352, "sparsity": 0.38975874582926434, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.self_attn.v_proj": { "mse": 2.708741931201075e-06, "rmse": 0.001645825607772912, "relative_error": 0.11401836328792606, "max_error": 0.10725784301757812, "sparsity": 0.3934755325317383, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.self_attn.q_proj": { "mse": 3.0313924526126357e-06, "rmse": 0.0017410894441735713, "relative_error": 0.11183478459241353, "max_error": 0.08448153734207153, "sparsity": 0.3898779551188151, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.self_attn.out_proj": { "mse": 2.974707740577287e-06, "rmse": 0.001724734107211105, "relative_error": 0.12364482519876267, "max_error": 0.10401153564453125, "sparsity": 0.3794857660929362, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.encoder_attn.k_proj": { "mse": 5.051839252701029e-06, "rmse": 0.0022476296965249923, "relative_error": 0.1462108008993025, "max_error": 0.06560587882995605, "sparsity": 0.38422679901123047, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.encoder_attn.v_proj": { "mse": 4.101235390407965e-06, "rmse": 0.00202515070807285, "relative_error": 0.15203837714653734, "max_error": 0.062149763107299805, "sparsity": 0.38334306081136066, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.encoder_attn.q_proj": { "mse": 2.8545221084641526e-06, "rmse": 0.0016895331036899373, "relative_error": 0.10754797639395516, "max_error": 0.05772113800048828, "sparsity": 0.39005088806152344, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.encoder_attn.out_proj": { "mse": 3.7151462493056897e-06, "rmse": 0.001927471465237732, "relative_error": 0.14317596856972012, "max_error": 0.07494163513183594, "sparsity": 0.37266890207926434, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.fc1": { "mse": 2.5293929866165854e-06, "rmse": 0.0015904065475898248, "relative_error": 0.1073629947850975, "max_error": 0.15852278470993042, "sparsity": 0.3905927340189616, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.16.fc2": { "mse": 6.293004844337702e-06, "rmse": 0.002508586224218275, "relative_error": 0.16603359634059295, "max_error": 0.10226941108703613, "sparsity": 0.37468798955281574, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.self_attn.k_proj": { "mse": 3.057536559936125e-06, "rmse": 0.0017485812992069098, "relative_error": 0.11201393995950695, "max_error": 0.09579706192016602, "sparsity": 0.3894125620524089, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.self_attn.v_proj": { "mse": 2.4118428427755134e-06, "rmse": 0.0015530108958972289, "relative_error": 0.11385278737880668, "max_error": 0.04882359504699707, "sparsity": 0.3921810785929362, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.self_attn.q_proj": { "mse": 3.1471593047172064e-06, "rmse": 0.0017740234791899475, "relative_error": 0.11315092671556473, "max_error": 0.08912181854248047, "sparsity": 0.38965892791748047, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.self_attn.out_proj": { "mse": 3.0684352623211453e-06, "rmse": 0.0017516949684009328, "relative_error": 0.13184404672823571, "max_error": 0.062131404876708984, "sparsity": 0.3765624364217122, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.encoder_attn.k_proj": { "mse": 4.313059889682336e-06, "rmse": 0.002076790766948451, "relative_error": 0.1438282830189719, "max_error": 0.0576934814453125, "sparsity": 0.38422075907389325, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.encoder_attn.v_proj": { "mse": 5.9649946706485935e-06, "rmse": 0.0024423338573275753, "relative_error": 0.15639097085047413, "max_error": 0.13858509063720703, "sparsity": 0.38591798146565753, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.encoder_attn.q_proj": { "mse": 2.7382375265005976e-06, "rmse": 0.001654762075496232, "relative_error": 0.1126409982320043, "max_error": 0.05305671691894531, "sparsity": 0.38878027598063153, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.encoder_attn.out_proj": { "mse": 5.209771188674495e-06, "rmse": 0.002282492319521469, "relative_error": 0.15552468907321956, "max_error": 0.14420032501220703, "sparsity": 0.3756395975748698, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.fc1": { "mse": 2.62208232015837e-06, "rmse": 0.0016192845087131444, "relative_error": 0.10946967739129748, "max_error": 0.18319380283355713, "sparsity": 0.39118019739786786, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.17.fc2": { "mse": 5.671533472195733e-06, "rmse": 0.0023814981570842615, "relative_error": 0.15605075908659866, "max_error": 0.10937494039535522, "sparsity": 0.37987271944681805, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.self_attn.k_proj": { "mse": 3.062216137550422e-06, "rmse": 0.001749918894563523, "relative_error": 0.11481806587196931, "max_error": 0.06973004341125488, "sparsity": 0.3889427185058594, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.self_attn.v_proj": { "mse": 2.6578031793178525e-06, "rmse": 0.0016302770253296991, "relative_error": 0.11580165808777118, "max_error": 0.07330894470214844, "sparsity": 0.3923803965250651, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.self_attn.q_proj": { "mse": 3.1825525184103753e-06, "rmse": 0.0017839709970765712, "relative_error": 0.11659504798291477, "max_error": 0.11487168073654175, "sparsity": 0.38934771219889325, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.self_attn.out_proj": { "mse": 3.1932124784361804e-06, "rmse": 0.0017869562049575194, "relative_error": 0.12925187774123928, "max_error": 0.061557769775390625, "sparsity": 0.3762219746907552, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.encoder_attn.k_proj": { "mse": 3.7404693102871533e-06, "rmse": 0.001934029294061275, "relative_error": 0.14225427023342369, "max_error": 0.06442117691040039, "sparsity": 0.3841543197631836, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.encoder_attn.v_proj": { "mse": 5.93807635596022e-06, "rmse": 0.002436816849080008, "relative_error": 0.15289312638788924, "max_error": 0.09826511144638062, "sparsity": 0.3840119043986003, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.encoder_attn.q_proj": { "mse": 2.600288553367136e-06, "rmse": 0.0016125410237780421, "relative_error": 0.11576435007585356, "max_error": 0.04055023193359375, "sparsity": 0.3882484436035156, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.encoder_attn.out_proj": { "mse": 6.008140189805999e-06, "rmse": 0.0024511507888757065, "relative_error": 0.16401463535585767, "max_error": 0.19881439208984375, "sparsity": 0.3687610626220703, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.fc1": { "mse": 2.5828803700278513e-06, "rmse": 0.0016071342103346103, "relative_error": 0.10860366900771316, "max_error": 0.18947696685791016, "sparsity": 0.39104294776916504, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.18.fc2": { "mse": 7.289684617717285e-06, "rmse": 0.002699941595241883, "relative_error": 0.17422221641452565, "max_error": 0.1270887851715088, "sparsity": 0.37224801381429035, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.self_attn.k_proj": { "mse": 3.049122142328997e-06, "rmse": 0.0017461735716500228, "relative_error": 0.11567203769595212, "max_error": 0.0702664852142334, "sparsity": 0.38868459065755206, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.self_attn.v_proj": { "mse": 2.7155556381330825e-06, "rmse": 0.0016478943042965719, "relative_error": 0.1192114629832996, "max_error": 0.07558798789978027, "sparsity": 0.39115556081136066, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.self_attn.q_proj": { "mse": 3.1372007924801437e-06, "rmse": 0.001771214496462849, "relative_error": 0.11738424348854617, "max_error": 0.06286239624023438, "sparsity": 0.38935597737630206, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.self_attn.out_proj": { "mse": 3.676388359963312e-06, "rmse": 0.0019173910294885891, "relative_error": 0.14067619140069135, "max_error": 0.07267498970031738, "sparsity": 0.3723777135213216, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.encoder_attn.k_proj": { "mse": 4.325136615079828e-06, "rmse": 0.002079696279527332, "relative_error": 0.1461241549187539, "max_error": 0.10210031270980835, "sparsity": 0.38515504201253253, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.encoder_attn.v_proj": { "mse": 7.3299588621011935e-06, "rmse": 0.0027073896768107088, "relative_error": 0.15419761759787312, "max_error": 0.11008405685424805, "sparsity": 0.38483206431070965, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.encoder_attn.q_proj": { "mse": 3.1062227208167315e-06, "rmse": 0.0017624479342144355, "relative_error": 0.12209272833975149, "max_error": 0.04779624938964844, "sparsity": 0.38499895731608075, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.encoder_attn.out_proj": { "mse": 8.42092777020298e-06, "rmse": 0.0029018834866691287, "relative_error": 0.1775200950024603, "max_error": 0.21614456176757812, "sparsity": 0.3764657974243164, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.fc1": { "mse": 2.607575652291416e-06, "rmse": 0.0016147989510435707, "relative_error": 0.10923039530021018, "max_error": 0.14707237482070923, "sparsity": 0.3912237485249837, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.19.fc2": { "mse": 8.792547305347398e-06, "rmse": 0.0029652229773403883, "relative_error": 0.18922121151644503, "max_error": 0.125, "sparsity": 0.3674290180206299, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.self_attn.k_proj": { "mse": 2.585725269454997e-06, "rmse": 0.0016080190513345907, "relative_error": 0.1106971274399791, "max_error": 0.04056340456008911, "sparsity": 0.38825352986653644, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.self_attn.v_proj": { "mse": 2.6116106255358318e-06, "rmse": 0.001616047841351187, "relative_error": 0.1165965263213501, "max_error": 0.0487060546875, "sparsity": 0.39172935485839844, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.self_attn.q_proj": { "mse": 2.7351811695552897e-06, "rmse": 0.0016538383142119092, "relative_error": 0.11324436363197928, "max_error": 0.05264711380004883, "sparsity": 0.3888041178385417, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.self_attn.out_proj": { "mse": 3.686214313347591e-06, "rmse": 0.0019199516434919893, "relative_error": 0.14039298497893754, "max_error": 0.08768653869628906, "sparsity": 0.37349573771158856, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.encoder_attn.k_proj": { "mse": 4.4726807573169935e-06, "rmse": 0.0021148713335134585, "relative_error": 0.14211945336391, "max_error": 0.08284521102905273, "sparsity": 0.38464196523030597, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.encoder_attn.v_proj": { "mse": 7.222415661090054e-06, "rmse": 0.0026874552388998136, "relative_error": 0.15828476986233206, "max_error": 0.11456680297851562, "sparsity": 0.38407135009765625, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.encoder_attn.q_proj": { "mse": 3.376102540642023e-06, "rmse": 0.001837417356139324, "relative_error": 0.12240313810067552, "max_error": 0.07167434692382812, "sparsity": 0.3857393264770508, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.encoder_attn.out_proj": { "mse": 5.347591013560304e-06, "rmse": 0.002312485894780832, "relative_error": 0.14779052883935034, "max_error": 0.14819598197937012, "sparsity": 0.370513916015625, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.fc1": { "mse": 2.671948550414527e-06, "rmse": 0.0016346096018360246, "relative_error": 0.11068499087775575, "max_error": 0.20884323120117188, "sparsity": 0.39017558097839355, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.20.fc2": { "mse": 8.031453035073355e-06, "rmse": 0.002833981833934959, "relative_error": 0.17959298852793198, "max_error": 0.14152908325195312, "sparsity": 0.37109629313151044, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.self_attn.k_proj": { "mse": 2.8241770451131742e-06, "rmse": 0.001680528799251347, "relative_error": 0.11666074817263411, "max_error": 0.08865010738372803, "sparsity": 0.38890234629313153, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.self_attn.v_proj": { "mse": 2.7611768018687144e-06, "rmse": 0.0016616789105807158, "relative_error": 0.11628176687983355, "max_error": 0.06029319763183594, "sparsity": 0.39069143931070965, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.self_attn.q_proj": { "mse": 2.902990217990009e-06, "rmse": 0.0017038163686236875, "relative_error": 0.11756411493004902, "max_error": 0.09850597381591797, "sparsity": 0.38947486877441406, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.self_attn.out_proj": { "mse": 3.309012527097366e-06, "rmse": 0.00181906913752539, "relative_error": 0.12909355415486923, "max_error": 0.10249519348144531, "sparsity": 0.3772468566894531, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.encoder_attn.k_proj": { "mse": 4.397637894726358e-06, "rmse": 0.0020970545760009103, "relative_error": 0.14199766950719964, "max_error": 0.056479454040527344, "sparsity": 0.3843771616617839, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.encoder_attn.v_proj": { "mse": 9.549195965519175e-06, "rmse": 0.0030901773356102357, "relative_error": 0.15587564523772446, "max_error": 0.1548752784729004, "sparsity": 0.38514550526936847, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.encoder_attn.q_proj": { "mse": 3.236666543671163e-06, "rmse": 0.0017990738016188115, "relative_error": 0.12158806361064572, "max_error": 0.044310808181762695, "sparsity": 0.3864482243855794, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.encoder_attn.out_proj": { "mse": 1.2453544513846282e-05, "rmse": 0.0035289579926440443, "relative_error": 0.19398958543544084, "max_error": 0.2276768684387207, "sparsity": 0.37346363067626953, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.fc1": { "mse": 2.6899620024778415e-06, "rmse": 0.0016401103628956928, "relative_error": 0.11088570231448468, "max_error": 0.19092488288879395, "sparsity": 0.39104406038920086, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.21.fc2": { "mse": 1.1716691915353294e-05, "rmse": 0.0034229653687049325, "relative_error": 0.21299683368336433, "max_error": 0.18568956851959229, "sparsity": 0.35869065920511883, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.self_attn.k_proj": { "mse": 2.4202918211813085e-06, "rmse": 0.0015557287106630477, "relative_error": 0.11283075734818315, "max_error": 0.08211708068847656, "sparsity": 0.3905862172444661, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.self_attn.v_proj": { "mse": 2.446655571475276e-06, "rmse": 0.0015641788809069364, "relative_error": 0.1136433297025706, "max_error": 0.04386502504348755, "sparsity": 0.3926156361897786, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.self_attn.q_proj": { "mse": 2.585672973509645e-06, "rmse": 0.001608002790267991, "relative_error": 0.11486764879772378, "max_error": 0.08422493934631348, "sparsity": 0.3920370737711589, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.self_attn.out_proj": { "mse": 3.3158557926071808e-06, "rmse": 0.0018209491460793683, "relative_error": 0.13301228810832066, "max_error": 0.07436180114746094, "sparsity": 0.37401390075683594, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.encoder_attn.k_proj": { "mse": 4.3133932194905356e-06, "rmse": 0.0020768710165753037, "relative_error": 0.14067432703895769, "max_error": 0.05864429473876953, "sparsity": 0.38448651631673175, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.encoder_attn.v_proj": { "mse": 8.616913873993326e-06, "rmse": 0.00293545803478662, "relative_error": 0.15301533169596557, "max_error": 0.17897844314575195, "sparsity": 0.3843116760253906, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.encoder_attn.q_proj": { "mse": 2.9848199574189493e-06, "rmse": 0.0017276631492912468, "relative_error": 0.11710600067795825, "max_error": 0.0589747428894043, "sparsity": 0.3881543477376302, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.encoder_attn.out_proj": { "mse": 8.628910109109711e-06, "rmse": 0.0029375006568696646, "relative_error": 0.17018883610312907, "max_error": 0.1784210205078125, "sparsity": 0.37581761678059894, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.fc1": { "mse": 2.6359286948718363e-06, "rmse": 0.0016235543399812143, "relative_error": 0.10956246786200693, "max_error": 0.15522384643554688, "sparsity": 0.3922089735666911, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.22.fc2": { "mse": 1.6377167412429117e-05, "rmse": 0.004046871311572573, "relative_error": 0.2533474753294872, "max_error": 0.22931241989135742, "sparsity": 0.334999958674113, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.self_attn.k_proj": { "mse": 2.916458697654889e-06, "rmse": 0.0017077642394823967, "relative_error": 0.11842748635264559, "max_error": 0.06891632080078125, "sparsity": 0.3846117655436198, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.self_attn.v_proj": { "mse": 2.9219972930150107e-06, "rmse": 0.001709385062826691, "relative_error": 0.12511812783253307, "max_error": 0.04297161102294922, "sparsity": 0.3864247004191081, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.self_attn.q_proj": { "mse": 2.794949296003324e-06, "rmse": 0.0016718101853988462, "relative_error": 0.11630976302364118, "max_error": 0.05386066436767578, "sparsity": 0.3846616744995117, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.self_attn.out_proj": { "mse": 2.7796131689683534e-06, "rmse": 0.0016672171931000333, "relative_error": 0.12332751993743979, "max_error": 0.09098243713378906, "sparsity": 0.3754889170328776, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.encoder_attn.k_proj": { "mse": 4.40665189671563e-06, "rmse": 0.0020992026811900823, "relative_error": 0.14626904581808187, "max_error": 0.09139752388000488, "sparsity": 0.38378461201985675, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.encoder_attn.v_proj": { "mse": 5.509216862265021e-06, "rmse": 0.0023471720989874222, "relative_error": 0.14926709862472565, "max_error": 0.11292362213134766, "sparsity": 0.3838071823120117, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.encoder_attn.q_proj": { "mse": 3.3597671063034795e-06, "rmse": 0.0018329667499175973, "relative_error": 0.12338244477979932, "max_error": 0.04654979705810547, "sparsity": 0.38701915740966797, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.encoder_attn.out_proj": { "mse": 3.527855142237968e-06, "rmse": 0.0018782585397750671, "relative_error": 0.1269762413270245, "max_error": 0.10678958892822266, "sparsity": 0.37538401285807294, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.fc1": { "mse": 3.3838575745903654e-06, "rmse": 0.0018395264538979496, "relative_error": 0.11950819790999201, "max_error": 0.0970156192779541, "sparsity": 0.38993239402770996, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 }, "model.decoder.layers.23.fc2": { "mse": 1.7770662452676333e-05, "rmse": 0.00421552635535307, "relative_error": 0.2633558020199924, "max_error": 0.3130340576171875, "sparsity": 0.33670878410339355, "effective_bits": 9.0, "sparse_nnz": 0, "n_planes": 3, "rescued_rows": 0 } }, "summary": { "method_name": "Broad-tritplane3", "model_family": "seq2seq_lm", "selected_components": [ "decoder" ], "quantized_modules": 240, "quantized_params": 402653184, "quantized_fraction": 0.5271309931564236, "avg_relative_error": 0.13568142455431076, "avg_effective_bits": 9.0, "full_model_effective_bits": 12.310083047905035, "compression_ratio": 1.299747527107295 }, "method_name": "Broad-tritplane3", "model_family": "seq2seq_lm", "format_family": "tritplane_small", "format_version": "1.0", "total_packed_bytes": 452984832, "total_fp16_bytes": 805306368, "compression_ratio": 1.7777777777777777 }