| model=/mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/MiniMax-M2.7-256x4.9B-BF16-00001-of-00010.gguf |
|
|
| numactl -N ${SOCKET} -m ${SOCKET} \ |
| ./build/bin/llama-imatrix \ |
| --model "$model" \ |
| -f ubergarm-imatrix-calibration-corpus-v02.txt \ |
| -o /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat \ |
| --no-fused-moe \ |
| --no-fused-up-gate \ |
| --no-fused-mul-multiadd \ |
| --ctx-size 512 \ |
| -ub 4096 -b 4096 \ |
| --threads 96 \ |
| --threads-batch 128 \ |
| --no-mmap \ |
| --numa numactl \ |
| --verbosity 1 \ |
| --layer-similarity |
|
|
| CPU: using device CPU - 0 MiB free |
| llama_model_loader: additional 9 GGUFs metadata loaded. |
| llama_model_loader: loaded meta data with 40 key-value pairs and 809 tensors from /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/MiniMax-M2.7-256x4.9B-BF16-00001-of-00010.gguf (version GGUF V3 (latest)) |
| llama_model_loader: Dumping metadata keys/values. Note: KV overrides do not apply in this output. |
| llama_model_loader: - kv 0: general.architecture str = minimax-m2 |
| llama_model_loader: - kv 1: general.type str = model |
| llama_model_loader: - kv 2: general.sampling.top_k i32 = 40 |
| llama_model_loader: - kv 3: general.sampling.top_p f32 = 0.950000 |
| llama_model_loader: - kv 4: general.sampling.temp f32 = 1.000000 |
| llama_model_loader: - kv 5: general.name str = MiniMax M2.7 |
| llama_model_loader: - kv 6: general.size_label str = 256x4.9B |
| llama_model_loader: - kv 7: general.license str = other |
| llama_model_loader: - kv 8: general.license.name str = modified-mit |
| llama_model_loader: - kv 9: general.license.link str = https: |
| llama_model_loader: - kv 10: general.tags arr[str,1] = ["text-generation"] |
| llama_model_loader: - kv 11: minimax-m2.block_count u32 = 62 |
| llama_model_loader: - kv 12: minimax-m2.context_length u32 = 196608 |
| llama_model_loader: - kv 13: minimax-m2.embedding_length u32 = 3072 |
| llama_model_loader: - kv 14: minimax-m2.feed_forward_length u32 = 1536 |
| llama_model_loader: - kv 15: minimax-m2.attention.head_count u32 = 48 |
| llama_model_loader: - kv 16: minimax-m2.attention.head_count_kv u32 = 8 |
| llama_model_loader: - kv 17: minimax-m2.rope.freq_base f32 = 5000000.000000 |
| llama_model_loader: - kv 18: minimax-m2.attention.layer_norm_rms_epsilon f32 = 0.000001 |
| llama_model_loader: - kv 19: minimax-m2.expert_count u32 = 256 |
| llama_model_loader: - kv 20: minimax-m2.expert_used_count u32 = 8 |
| llama_model_loader: - kv 21: minimax-m2.expert_gating_func u32 = 2 |
| llama_model_loader: - kv 22: minimax-m2.attention.key_length u32 = 128 |
| llama_model_loader: - kv 23: minimax-m2.attention.value_length u32 = 128 |
| llama_model_loader: - kv 24: general.file_type u32 = 32 |
| llama_model_loader: - kv 25: minimax-m2.expert_feed_forward_length u32 = 1536 |
| llama_model_loader: - kv 26: minimax-m2.rope.dimension_count u32 = 64 |
| llama_model_loader: - kv 27: general.quantization_version u32 = 2 |
| llama_model_loader: - kv 28: tokenizer.ggml.model str = gpt2 |
| llama_model_loader: - kv 29: tokenizer.ggml.pre str = minimax-m2 |
| llama_model_loader: - kv 30: tokenizer.ggml.tokens arr[str,200064] = ["Ā", "ā", "Ă", "ă", "Ą", "ą", ... |
| llama_model_loader: - kv 31: tokenizer.ggml.token_type arr[i32,200064] = [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ... |
| llama_model_loader: - kv 32: tokenizer.ggml.merges arr[str,199744] = ["Ġ Ġ", "Ġ t", "Ġ a", "i n", "e r... |
| llama_model_loader: - kv 33: tokenizer.ggml.bos_token_id u32 = 200034 |
| llama_model_loader: - kv 34: tokenizer.ggml.eos_token_id u32 = 200020 |
| llama_model_loader: - kv 35: tokenizer.ggml.unknown_token_id u32 = 200021 |
| llama_model_loader: - kv 36: tokenizer.chat_template str = {# ----------‑‑‑ special token ... |
| llama_model_loader: - kv 37: split.no u16 = 0 |
| llama_model_loader: - kv 38: split.count u16 = 10 |
| llama_model_loader: - kv 39: split.tensors.count i32 = 809 |
| llama_model_loader: - type f32: 373 tensors |
| llama_model_loader: - type bf16: 436 tensors |
| load: 0 unused tokens |
| load: special_eos_id is not in special_eog_ids - the tokenizer config may be incorrect |
| load: printing all EOG tokens: |
| load: - 200004 ('<fim_pad>') |
| load: - 200005 ('<reponame>') |
| load: - 200020 ('[e~[') |
| load: special tokens cache size = 54 |
| load: token to piece cache size = 1.3355 MB |
| llm_load_print_meta: format = GGUF V3 (latest) |
| llm_load_print_meta: arch = minimax-m2 |
| llm_load_print_meta: n_ctx_train = 196608 |
| llm_load_print_meta: n_embd = 3072 |
| llm_load_print_meta: n_layer = 62 |
| llm_load_print_meta: n_head = 48 |
| llm_load_print_meta: n_head_kv = 8 |
| llm_load_print_meta: n_rot = 64 |
| llm_load_print_meta: n_swa = 0 |
| llm_load_print_meta: n_swa_pattern = 1 |
| llm_load_print_meta: n_embd_head_k = 128 |
| llm_load_print_meta: n_embd_head_v = 128 |
| llm_load_print_meta: n_gqa = 6 |
| llm_load_print_meta: n_embd_k_gqa = 1024 |
| llm_load_print_meta: n_embd_v_gqa = 1024 |
| llm_load_print_meta: f_norm_eps = 0.0e+00 |
| llm_load_print_meta: f_norm_rms_eps = 1.0e-06 |
| llm_load_print_meta: f_clamp_kqv = 0.0e+00 |
| llm_load_print_meta: f_max_alibi_bias = 0.0e+00 |
| llm_load_print_meta: f_logit_scale = 0.0e+00 |
| llm_load_print_meta: n_ff = 1536 |
| llm_load_print_meta: n_expert = 256 |
| llm_load_print_meta: n_expert_used = 8 |
| llm_load_print_meta: causal attn = 1 |
| llm_load_print_meta: pooling type = 0 |
| llm_load_print_meta: rope type = 2 |
| llm_load_print_meta: rope scaling = linear |
| llm_load_print_meta: freq_base_train = 5000000.0 |
| llm_load_print_meta: freq_scale_train = 1 |
| llm_load_print_meta: n_ctx_orig_yarn = 196608 |
| llm_load_print_meta: rope_finetuned = unknown |
| llm_load_print_meta: ssm_d_conv = 0 |
| llm_load_print_meta: ssm_d_inner = 0 |
| llm_load_print_meta: ssm_d_state = 0 |
| llm_load_print_meta: ssm_dt_rank = 0 |
| llm_load_print_meta: ssm_n_group = 0 |
| llm_load_print_meta: model type = 230B.A10B |
| llm_load_print_meta: model ftype = BF16 |
| llm_load_print_meta: model params = 228.690 B |
| llm_load_print_meta: model size = 426.060 GiB (16.003 BPW) |
| llm_load_print_meta: repeating layers = 423.771 GiB (16.003 BPW, 227.461 B parameters) |
| llm_load_print_meta: general.name = MiniMax M2.7 |
| print_info: vocab type = BPE |
| print_info: n_vocab = 200064 |
| print_info: n_merges = 199744 |
| print_info: BOS token = 200034 ']~!b[' |
| print_info: EOS token = 200020 '[e~[' |
| print_info: UNK token = 200021 ']!d~[' |
| print_info: LF token = 10 'Ċ' |
| print_info: FIM PRE token = 200001 '<fim_prefix>' |
| print_info: FIM SUF token = 200003 '<fim_suffix>' |
| print_info: FIM MID token = 200002 '<fim_middle>' |
| print_info: FIM PAD token = 200004 '<fim_pad>' |
| print_info: FIM REP token = 200005 '<reponame>' |
| print_info: EOG token = 200004 '<fim_pad>' |
| print_info: EOG token = 200005 '<reponame>' |
| print_info: EOG token = 200020 '[e~[' |
| print_info: max token length = 256 |
| ======================================= HAVE_FANCY_SIMD is defined |
| Free memory 0 MiB on device 0 is less the 1024 MiB safety margin |
| ------------------- Layer sizes: |
| Layer 0: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 1: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 2: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 3: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 4: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 5: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 6: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 7: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 8: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 9: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 10: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 11: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 12: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 13: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 14: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 15: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 16: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 17: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 18: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 19: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 20: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 21: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 22: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 23: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 24: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 25: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 26: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 27: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 28: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 29: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 30: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 31: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 32: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 33: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 34: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 35: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 36: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 37: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 38: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 39: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 40: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 41: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 42: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 43: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 44: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 45: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 46: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 47: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 48: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 49: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 50: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 51: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 52: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 53: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 54: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 55: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 56: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 57: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 58: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 59: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 60: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 61: 6999.05, 2.00, 7001.05 108.00 MiB |
| Layer 62: 1172.25, 282.75, 1455.00 MiB (output layer) |
| -------------------------------------------------------------------------- |
| Total : 433941.21, 406.75, 434347.96 MiB |
| Free memory 0 MiB on device 0 is less the required compute buffer size 108 MiB |
| Memory required for model tensors + cache: 435520 MiB |
| Memory available on all devices - compute: 0 MiB |
| llm_load_tensors: ggml ctx size = 0.35 MiB |
| llm_load_tensors: offloading 0 repeating layers to GPU |
| llm_load_tensors: offloaded 0/63 layers to GPU |
| llm_load_tensors: CPU buffer size = 436285.72 MiB |
| .................................................................................................... |
| llama_init_from_model: n_ctx = 512 |
| llama_init_from_model: n_batch = 512 |
| llama_init_from_model: n_ubatch = 512 |
| llama_init_from_model: flash_attn = 1 |
| llama_init_from_model: attn_max_b = 0 |
| llama_init_from_model: fused_moe = 0 |
| llama_init_from_model: grouped er = 0 |
| llama_init_from_model: fused_up_gate = 0 |
| llama_init_from_model: fused_mmad = 0 |
| llama_init_from_model: rope_cache = 0 |
| llama_init_from_model: graph_reuse = 1 |
| llama_init_from_model: k_cache_hadam = 0 |
| llama_init_from_model: v_cache_hadam = 0 |
| llama_init_from_model: split_mode_graph_scheduling = 0 |
| llama_init_from_model: reduce_type = f16 |
| llama_init_from_model: sched_async = 0 |
| llama_init_from_model: ser = -1, 0 |
| llama_init_from_model: freq_base = 5000000.0 |
| llama_init_from_model: freq_scale = 1 |
| llama_kv_cache_init: CPU KV buffer size = 124.00 MiB |
| llama_init_from_model: KV self size = 124.00 MiB, K (f16): 62.00 MiB, V (f16): 62.00 MiB |
| llama_init_from_model: CPU output buffer size = 0.76 MiB |
| llama_init_from_model: CPU compute buffer size = 402.75 MiB |
| llama_init_from_model: graph nodes = 2609 |
| llama_init_from_model: graph splits = 1 |
| llama_init_from_model: enabling only_active_experts scheduling |
| |
| system_info: n_threads = 96 (n_threads_batch = 128) / 512 | AVX = 1 | AVX_VNNI = 1 | AVX2 = 1 | AVX512 = 1 | AVX512_VBMI = 1 | AVX512_VNNI = 1 | AVX512_BF16 = 1 | FMA = 1 | NEON = 0 | SVE = 0 | ARM_FMA = 0 | F16C = 1 | FP16_VA = 0 | WASM_SIMD = 0 | BLAS = 0 | SSE3 = 1 | SSSE3 = 1 | VSX = 0 | MATMUL_INT8 = 0 | |
| compute_imatrix: tokenizing the input .. |
| compute_imatrix: tokenization took 779.628 ms |
| compute_imatrix: computing over 796 chunks with batch_size 512 |
| compute_imatrix: 3.99 seconds per pass - ETA 52.95 minutes |
| [1]91.6530,[2]16.4837,[3]7.9862,[4]4.7587,[5]3.6240,[6]2.9956,[7]2.5865,[8]2.3337,[9]2.2805, |
| save_imatrix: entry ' blk.60.ffn_down_exps.weight' has partial data (91.80%) 21 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.59.ffn_gate_exps.weight' has partial data (94.14%) 15 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.59.ffn_up_exps.weight' has partial data (94.14%) 15 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.58.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.58.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.57.ffn_down_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.57.ffn_gate_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.57.ffn_up_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.56.ffn_gate_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.55.ffn_down_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.60.ffn_gate_exps.weight' has partial data (91.80%) 21 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.55.ffn_gate_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.55.ffn_up_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.54.ffn_down_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.53.ffn_down_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.56.ffn_down_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.52.ffn_down_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.52.ffn_gate_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.52.ffn_up_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.48.ffn_up_exps.weight' has partial data (95.70%) 11 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.47.ffn_gate_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.47.ffn_up_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.46.ffn_down_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.46.ffn_up_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.45.ffn_down_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.43.ffn_gate_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.43.ffn_up_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.42.ffn_down_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.42.ffn_up_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.44.ffn_gate_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.39.ffn_gate_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.38.ffn_down_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.38.ffn_gate_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.39.ffn_down_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.37.ffn_gate_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.37.ffn_up_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.36.ffn_down_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.40.ffn_down_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.35.ffn_down_exps.weight' has partial data (93.75%) 16 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.35.ffn_gate_exps.weight' has partial data (93.75%) 16 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.51.ffn_gate_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.34.ffn_up_exps.weight' has partial data (92.58%) 19 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.33.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.33.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.33.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.39.ffn_up_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.32.ffn_down_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.32.ffn_up_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.34.ffn_down_exps.weight' has partial data (92.58%) 19 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.42.ffn_gate_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.50.ffn_down_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.15.ffn_gate_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.38.ffn_up_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.45.ffn_gate_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.16.ffn_up_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.47.ffn_down_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.45.ffn_up_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.23.ffn_gate_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.15.ffn_down_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.16.ffn_gate_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.51.ffn_up_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.53.ffn_gate_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.41.ffn_down_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.50.ffn_up_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.59.ffn_down_exps.weight' has partial data (94.14%) 15 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.54.ffn_up_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.4.ffn_up_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.44.ffn_down_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.36.ffn_gate_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.31.ffn_gate_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.58.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.29.ffn_gate_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.41.ffn_gate_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.6.ffn_up_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.41.ffn_up_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.1.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.34.ffn_gate_exps.weight' has partial data (92.58%) 19 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.49.ffn_down_exps.weight' has partial data (98.05%) 5 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.19.ffn_up_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.15.ffn_up_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.56.ffn_up_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.44.ffn_up_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.4.ffn_gate_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.23.ffn_down_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.0.ffn_gate_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.37.ffn_down_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.32.ffn_gate_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_down_exps.weight' has partial data (81.64%) 47 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.48.ffn_down_exps.weight' has partial data (95.70%) 11 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.29.ffn_up_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.0.ffn_down_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.40.ffn_up_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.18.ffn_up_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.21.ffn_down_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.4.ffn_down_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.54.ffn_gate_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.2.ffn_up_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.28.ffn_gate_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.50.ffn_gate_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.24.ffn_down_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.28.ffn_up_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.51.ffn_down_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.6.ffn_down_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.26.ffn_up_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.30.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.40.ffn_gate_exps.weight' has partial data (94.53%) 14 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.1.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.1.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.16.ffn_down_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.18.ffn_gate_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.49.ffn_up_exps.weight' has partial data (98.05%) 5 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.35.ffn_up_exps.weight' has partial data (93.75%) 16 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.18.ffn_down_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.21.ffn_up_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.6.ffn_gate_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.19.ffn_gate_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.24.ffn_up_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.19.ffn_down_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_up_exps.weight' has partial data (81.64%) 47 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.2.ffn_down_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.48.ffn_gate_exps.weight' has partial data (95.70%) 11 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.21.ffn_gate_exps.weight' has partial data (99.22%) 2 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.29.ffn_down_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.22.ffn_up_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.22.ffn_gate_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.22.ffn_down_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.23.ffn_up_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.53.ffn_up_exps.weight' has partial data (98.83%) 3 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.24.ffn_gate_exps.weight' has partial data (97.27%) 7 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.49.ffn_gate_exps.weight' has partial data (98.05%) 5 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_gate_exps.weight' has partial data (81.64%) 47 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.25.ffn_up_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.2.ffn_gate_exps.weight' has partial data (99.61%) 1 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.25.ffn_gate_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.25.ffn_down_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.36.ffn_up_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.26.ffn_gate_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.27.ffn_up_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.27.ffn_gate_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.60.ffn_up_exps.weight' has partial data (91.80%) 21 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.26.ffn_down_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.27.ffn_down_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.43.ffn_down_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.0.ffn_up_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.28.ffn_down_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.31.ffn_up_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.46.ffn_gate_exps.weight' has partial data (98.44%) 4 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.30.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.30.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.31.ffn_down_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: warning: storing only 461 out of 497 entries |
| |
| save_imatrix: stored collected data after 10 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [10]2.2152,[11]2.2249,[12]2.4598,[13]2.5706,[14]2.5471,[15]2.4061,[16]2.2934,[17]2.1901,[18]2.1276,[19]2.0519, |
| save_imatrix: entry ' blk.60.ffn_down_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.59.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.59.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.60.ffn_gate_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.45.ffn_down_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.44.ffn_gate_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.38.ffn_down_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.38.ffn_gate_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.37.ffn_gate_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.37.ffn_up_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.36.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.40.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.35.ffn_down_exps.weight' has partial data (95.70%) 11 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.35.ffn_gate_exps.weight' has partial data (95.70%) 11 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.34.ffn_up_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.34.ffn_down_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.38.ffn_up_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.45.ffn_gate_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.45.ffn_up_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.59.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.44.ffn_down_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.36.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.29.ffn_gate_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.34.ffn_gate_exps.weight' has partial data (95.31%) 12 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.44.ffn_up_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.37.ffn_down_exps.weight' has partial data (96.09%) 10 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_down_exps.weight' has partial data (83.59%) 42 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.29.ffn_up_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.40.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.40.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.35.ffn_up_exps.weight' has partial data (95.70%) 11 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_up_exps.weight' has partial data (83.59%) 42 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.29.ffn_down_exps.weight' has partial data (97.66%) 6 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_gate_exps.weight' has partial data (83.59%) 42 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.36.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.60.ffn_up_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: warning: storing only 491 out of 497 entries |
| |
| save_imatrix: stored collected data after 20 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [20]2.0097,[21]1.9543,[22]1.9059,[23]1.9143,[24]1.8992,[25]1.8525,[26]1.9506,[27]2.0486,[28]2.1579,[29]2.1379, |
| save_imatrix: entry ' blk.60.ffn_down_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.60.ffn_gate_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_down_exps.weight' has partial data (83.98%) 41 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_up_exps.weight' has partial data (83.98%) 41 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_gate_exps.weight' has partial data (83.98%) 41 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.60.ffn_up_exps.weight' has partial data (94.92%) 13 out of 256 experts are missing data - skipping |
| save_imatrix: warning: storing only 491 out of 497 entries |
| |
| save_imatrix: stored collected data after 30 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [30]2.3057,[31]2.2805,[32]2.3091,[33]2.2842,[34]2.2976,[35]2.3024,[36]2.2904,[37]2.2937,[38]2.3360,[39]2.3423, |
| save_imatrix: entry ' blk.60.ffn_down_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.60.ffn_gate_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_down_exps.weight' has partial data (87.11%) 33 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_up_exps.weight' has partial data (87.11%) 33 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_gate_exps.weight' has partial data (87.11%) 33 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.60.ffn_up_exps.weight' has partial data (96.48%) 9 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: warning: storing only 494 out of 497 entries |
| |
| save_imatrix: stored collected data after 40 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [40]2.3262,[41]2.3632,[42]2.3749,[43]2.3947,[44]2.4239,[45]2.4425,[46]2.4257,[47]2.4243,[48]2.4192,[49]2.4269, |
| save_imatrix: entry ' blk.61.ffn_down_exps.weight' has partial data (87.50%) 32 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_up_exps.weight' has partial data (87.50%) 32 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_gate_exps.weight' has partial data (87.50%) 32 out of 256 experts are missing data - skipping |
| save_imatrix: warning: storing only 494 out of 497 entries |
| |
| save_imatrix: stored collected data after 50 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [50]2.4123,[51]2.4286,[52]2.4539,[53]2.4376,[54]2.4462,[55]2.4430,[56]2.4412,[57]2.4322,[58]2.5168,[59]2.5695, |
| save_imatrix: entry ' blk.61.ffn_down_exps.weight' has partial data (89.06%) 28 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_up_exps.weight' has partial data (89.06%) 28 out of 256 experts are missing data - skipping |
| save_imatrix: entry ' blk.61.ffn_gate_exps.weight' has partial data (89.06%) 28 out of 256 experts are missing data - skipping |
| save_imatrix: warning: storing only 494 out of 497 entries |
| |
| save_imatrix: stored collected data after 60 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [60]2.6236,[61]2.6529,[62]2.7734,[63]2.8045,[64]2.8668,[65]2.9429,[66]3.0196,[67]3.1169,[68]3.2083,[69]3.2922, |
| save_imatrix: entry ' blk.61.ffn_down_exps.weight' has partial data (96.88%) 8 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_up_exps.weight' has partial data (96.88%) 8 out of 256 experts are missing data Storing **but be aware** |
| save_imatrix: entry ' blk.61.ffn_gate_exps.weight' has partial data (96.88%) 8 out of 256 experts are missing data Storing **but be aware** |
| |
| save_imatrix: stored collected data after 70 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [70]3.3446,[71]3.3814,[72]3.3968,[73]3.4427,[74]3.5064,[75]3.6009,[76]3.5929,[77]3.5709,[78]3.5574,[79]3.5950, |
| save_imatrix: stored collected data after 80 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [80]3.7128,[81]3.7851,[82]3.7799,[83]3.7675,[84]3.7440,[85]3.8345,[86]3.8787,[87]3.8800,[88]3.8999,[89]3.9499, |
| save_imatrix: stored collected data after 90 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [90]4.0183,[91]4.0139,[92]4.0121,[93]4.0164,[94]4.0088,[95]3.9814,[96]4.0118,[97]4.0338,[98]4.0638,[99]4.0308, |
| save_imatrix: stored collected data after 100 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [100]4.0811,[101]4.1422,[102]4.1939,[103]4.2519,[104]4.2992,[105]4.3474,[106]4.3983,[107]4.3891,[108]4.3950,[109]4.4223, |
| save_imatrix: stored collected data after 110 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [110]4.4616,[111]4.4628,[112]4.5131,[113]4.5552,[114]4.5702,[115]4.5605,[116]4.5330,[117]4.5458,[118]4.5474,[119]4.5088, |
| save_imatrix: stored collected data after 120 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [120]4.4704,[121]4.4584,[122]4.4520,[123]4.4576,[124]4.4923,[125]4.4902,[126]4.5301,[127]4.5808,[128]4.6256,[129]4.5970, |
| save_imatrix: stored collected data after 130 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [130]4.5674,[131]4.5513,[132]4.5352,[133]4.5398,[134]4.5298,[135]4.5768,[136]4.6216,[137]4.6465,[138]4.6503,[139]4.6840, |
| save_imatrix: stored collected data after 140 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [140]4.7355,[141]4.7856,[142]4.8292,[143]4.8613,[144]4.8905,[145]4.9105,[146]4.9111,[147]4.9161,[148]4.9055,[149]4.9285, |
| save_imatrix: stored collected data after 150 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [150]4.9394,[151]4.9498,[152]4.9741,[153]5.0031,[154]5.0031,[155]5.0045,[156]5.0191,[157]5.0347,[158]5.0440,[159]5.0578, |
| save_imatrix: stored collected data after 160 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [160]5.0635,[161]5.0710,[162]5.0824,[163]5.0815,[164]5.0738,[165]5.1019,[166]5.1153,[167]5.1173,[168]5.1427,[169]5.1669, |
| save_imatrix: stored collected data after 170 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [170]5.1473,[171]5.1656,[172]5.1706,[173]5.1913,[174]5.2133,[175]5.2240,[176]5.2127,[177]5.1976,[178]5.1853,[179]5.1704, |
| save_imatrix: stored collected data after 180 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [180]5.1552,[181]5.1410,[182]5.1326,[183]5.1509,[184]5.1726,[185]5.2238,[186]5.2688,[187]5.3029,[188]5.3528,[189]5.3781, |
| save_imatrix: stored collected data after 190 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [190]5.4022,[191]5.3836,[192]5.4077,[193]5.3986,[194]5.3637,[195]5.3234,[196]5.3419,[197]5.3768,[198]5.3905,[199]5.4038, |
| save_imatrix: stored collected data after 200 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [200]5.4335,[201]5.4573,[202]5.4781,[203]5.5035,[204]5.5272,[205]5.5297,[206]5.5102,[207]5.4930,[208]5.4923,[209]5.4749, |
| save_imatrix: stored collected data after 210 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [210]5.4644,[211]5.4467,[212]5.4250,[213]5.4277,[214]5.4415,[215]5.4205,[216]5.4175,[217]5.4225,[218]5.4355,[219]5.4566, |
| save_imatrix: stored collected data after 220 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [220]5.4845,[221]5.5102,[222]5.5357,[223]5.5438,[224]5.5872,[225]5.6260,[226]5.6398,[227]5.6421,[228]5.6588,[229]5.6900, |
| save_imatrix: stored collected data after 230 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [230]5.7133,[231]5.7253,[232]5.7605,[233]5.7680,[234]5.8151,[235]5.8574,[236]5.8745,[237]5.8959,[238]5.9191,[239]5.9352, |
| save_imatrix: stored collected data after 240 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [240]5.9543,[241]5.9810,[242]6.0051,[243]6.0283,[244]6.0441,[245]6.0680,[246]6.0936,[247]6.1145,[248]6.1212,[249]6.1335, |
| save_imatrix: stored collected data after 250 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [250]6.1408,[251]6.1578,[252]6.1708,[253]6.1907,[254]6.2048,[255]6.2183,[256]6.2155,[257]6.2234,[258]6.2454,[259]6.2756, |
| save_imatrix: stored collected data after 260 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [260]6.3059,[261]6.3243,[262]6.3548,[263]6.3571,[264]6.3698,[265]6.3824,[266]6.3960,[267]6.4167,[268]6.4371,[269]6.4558, |
| save_imatrix: stored collected data after 270 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [270]6.4693,[271]6.4706,[272]6.4964,[273]6.5114,[274]6.5362,[275]6.5569,[276]6.5564,[277]6.5617,[278]6.5767,[279]6.5802, |
| save_imatrix: stored collected data after 280 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [280]6.5975,[281]6.6092,[282]6.6280,[283]6.6407,[284]6.6626,[285]6.6823,[286]6.7023,[287]6.7206,[288]6.7522,[289]6.7722, |
| save_imatrix: stored collected data after 290 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [290]6.7935,[291]6.8167,[292]6.8329,[293]6.8436,[294]6.8604,[295]6.8677,[296]6.8786,[297]6.8961,[298]6.9088,[299]6.9215, |
| save_imatrix: stored collected data after 300 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [300]6.9300,[301]6.9391,[302]6.9487,[303]6.9748,[304]6.9890,[305]6.9988,[306]7.0184,[307]7.0456,[308]7.0756,[309]7.1029, |
| save_imatrix: stored collected data after 310 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [310]7.0595,[311]7.0437,[312]7.0151,[313]6.9929,[314]7.0202,[315]7.0333,[316]7.0051,[317]7.0187,[318]7.0321,[319]7.0287, |
| save_imatrix: stored collected data after 320 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [320]7.0292,[321]7.0347,[322]7.0606,[323]7.0596,[324]7.0731,[325]7.0907,[326]7.1053,[327]7.1201,[328]7.0776,[329]7.0961, |
| save_imatrix: stored collected data after 330 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [330]7.1338,[331]7.1613,[332]7.1877,[333]7.2135,[334]7.2131,[335]7.2100,[336]7.2196,[337]7.2257,[338]7.2430,[339]7.2647, |
| save_imatrix: stored collected data after 340 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [340]7.2429,[341]7.2588,[342]7.2679,[343]7.2644,[344]7.2647,[345]7.2656,[346]7.2518,[347]7.2605,[348]7.2791,[349]7.2685, |
| save_imatrix: stored collected data after 350 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [350]7.2599,[351]7.2307,[352]7.1949,[353]7.1699,[354]7.1475,[355]7.1109,[356]7.0880,[357]7.0686,[358]7.0488,[359]7.0303, |
| save_imatrix: stored collected data after 360 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [360]7.0089,[361]6.9886,[362]6.9868,[363]6.9704,[364]6.9412,[365]6.9239,[366]6.8979,[367]6.8821,[368]6.8681,[369]6.8420, |
| save_imatrix: stored collected data after 370 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [370]6.8320,[371]6.8266,[372]6.8237,[373]6.8128,[374]6.7941,[375]6.7615,[376]6.7304,[377]6.7149,[378]6.6930,[379]6.6661, |
| save_imatrix: stored collected data after 380 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [380]6.6338,[381]6.6010,[382]6.5842,[383]6.5753,[384]6.5680,[385]6.5561,[386]6.5725,[387]6.5692,[388]6.5422,[389]6.5191, |
| save_imatrix: stored collected data after 390 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [390]6.5028,[391]6.4825,[392]6.4643,[393]6.4496,[394]6.4257,[395]6.4064,[396]6.3898,[397]6.3681,[398]6.3439,[399]6.3203, |
| save_imatrix: stored collected data after 400 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [400]6.3079,[401]6.2973,[402]6.2837,[403]6.2782,[404]6.2749,[405]6.2642,[406]6.2559,[407]6.2414,[408]6.2154,[409]6.1894, |
| save_imatrix: stored collected data after 410 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [410]6.1638,[411]6.1418,[412]6.1162,[413]6.0923,[414]6.0714,[415]6.0458,[416]6.0250,[417]6.0073,[418]5.9871,[419]5.9676, |
| save_imatrix: stored collected data after 420 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [420]5.9470,[421]5.9249,[422]5.9074,[423]5.9091,[424]5.9010,[425]5.8958,[426]5.8760,[427]5.8586,[428]5.8375,[429]5.8194, |
| save_imatrix: stored collected data after 430 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [430]5.8022,[431]5.7885,[432]5.7719,[433]5.7611,[434]5.7449,[435]5.7391,[436]5.7237,[437]5.7058,[438]5.7005,[439]5.6861, |
| save_imatrix: stored collected data after 440 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [440]5.6712,[441]5.6568,[442]5.6466,[443]5.6298,[444]5.6099,[445]5.5903,[446]5.5717,[447]5.5519,[448]5.5326,[449]5.5163, |
| save_imatrix: stored collected data after 450 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [450]5.4969,[451]5.4781,[452]5.4617,[453]5.4562,[454]5.4372,[455]5.4286,[456]5.4145,[457]5.4103,[458]5.3989,[459]5.3871, |
| save_imatrix: stored collected data after 460 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [460]5.3765,[461]5.3653,[462]5.3547,[463]5.3435,[464]5.3327,[465]5.3219,[466]5.3112,[467]5.3002,[468]5.2927,[469]5.2821, |
| save_imatrix: stored collected data after 470 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [470]5.2688,[471]5.2511,[472]5.2386,[473]5.2345,[474]5.2388,[475]5.2207,[476]5.2076,[477]5.1938,[478]5.1777,[479]5.1635, |
| save_imatrix: stored collected data after 480 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [480]5.1486,[481]5.1391,[482]5.1274,[483]5.1208,[484]5.1108,[485]5.1004,[486]5.0933,[487]5.0843,[488]5.0738,[489]5.0712, |
| save_imatrix: stored collected data after 490 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [490]5.0715,[491]5.0750,[492]5.0731,[493]5.0748,[494]5.0754,[495]5.0720,[496]5.0647,[497]5.0758,[498]5.0891,[499]5.1042, |
| save_imatrix: stored collected data after 500 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [500]5.1145,[501]5.1254,[502]5.1377,[503]5.1500,[504]5.1586,[505]5.1751,[506]5.1879,[507]5.1988,[508]5.2218,[509]5.2465, |
| save_imatrix: stored collected data after 510 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [510]5.2716,[511]5.2686,[512]5.2800,[513]5.2934,[514]5.3038,[515]5.3089,[516]5.3158,[517]5.3198,[518]5.3211,[519]5.3273, |
| save_imatrix: stored collected data after 520 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [520]5.3322,[521]5.3420,[522]5.3407,[523]5.3395,[524]5.3485,[525]5.3749,[526]5.3980,[527]5.3991,[528]5.4007,[529]5.4041, |
| save_imatrix: stored collected data after 530 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [530]5.4079,[531]5.4105,[532]5.4148,[533]5.4181,[534]5.4237,[535]5.4300,[536]5.4400,[537]5.4535,[538]5.4647,[539]5.4754, |
| save_imatrix: stored collected data after 540 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [540]5.4833,[541]5.4879,[542]5.4937,[543]5.4936,[544]5.4891,[545]5.4841,[546]5.4875,[547]5.4898,[548]5.4953,[549]5.4987, |
| save_imatrix: stored collected data after 550 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [550]5.5043,[551]5.5035,[552]5.5094,[553]5.5107,[554]5.5154,[555]5.5127,[556]5.5156,[557]5.5126,[558]5.5058,[559]5.5026, |
| save_imatrix: stored collected data after 560 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [560]5.4951,[561]5.4855,[562]5.4787,[563]5.4741,[564]5.4685,[565]5.4666,[566]5.4657,[567]5.4612,[568]5.4647,[569]5.4620, |
| save_imatrix: stored collected data after 570 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [570]5.4593,[571]5.4565,[572]5.4557,[573]5.4501,[574]5.4500,[575]5.4437,[576]5.4366,[577]5.4354,[578]5.4349,[579]5.4221, |
| save_imatrix: stored collected data after 580 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [580]5.4108,[581]5.3990,[582]5.3873,[583]5.3841,[584]5.3858,[585]5.3878,[586]5.3844,[587]5.3816,[588]5.3760,[589]5.3742, |
| save_imatrix: stored collected data after 590 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [590]5.3760,[591]5.3727,[592]5.3678,[593]5.3653,[594]5.3627,[595]5.3625,[596]5.3602,[597]5.3576,[598]5.3524,[599]5.3527, |
| save_imatrix: stored collected data after 600 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [600]5.3397,[601]5.3306,[602]5.3214,[603]5.3112,[604]5.3034,[605]5.2952,[606]5.2832,[607]5.2688,[608]5.2544,[609]5.2403, |
| save_imatrix: stored collected data after 610 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [610]5.2380,[611]5.2296,[612]5.2281,[613]5.2184,[614]5.2166,[615]5.2094,[616]5.2129,[617]5.2115,[618]5.2185,[619]5.2136, |
| save_imatrix: stored collected data after 620 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [620]5.2109,[621]5.2041,[622]5.2001,[623]5.1963,[624]5.1912,[625]5.1884,[626]5.1852,[627]5.1806,[628]5.1794,[629]5.1857, |
| save_imatrix: stored collected data after 630 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [630]5.1878,[631]5.1874,[632]5.1867,[633]5.1888,[634]5.1905,[635]5.1918,[636]5.1956,[637]5.1966,[638]5.1964,[639]5.1990, |
| save_imatrix: stored collected data after 640 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [640]5.1947,[641]5.1989,[642]5.2005,[643]5.2037,[644]5.2043,[645]5.2043,[646]5.2063,[647]5.2032,[648]5.1926,[649]5.1865, |
| save_imatrix: stored collected data after 650 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [650]5.1788,[651]5.1681,[652]5.1570,[653]5.1523,[654]5.1478,[655]5.1419,[656]5.1315,[657]5.1249,[658]5.1194,[659]5.1122, |
| save_imatrix: stored collected data after 660 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [660]5.1026,[661]5.0926,[662]5.0856,[663]5.0767,[664]5.0729,[665]5.0666,[666]5.0593,[667]5.0497,[668]5.0473,[669]5.0400, |
| save_imatrix: stored collected data after 670 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [670]5.0358,[671]5.0312,[672]5.0276,[673]5.0215,[674]5.0113,[675]5.0023,[676]4.9960,[677]4.9874,[678]4.9790,[679]4.9751, |
| save_imatrix: stored collected data after 680 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [680]4.9707,[681]4.9679,[682]4.9652,[683]4.9612,[684]4.9580,[685]4.9531,[686]4.9502,[687]4.9484,[688]4.9451,[689]4.9410, |
| save_imatrix: stored collected data after 690 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [690]4.9371,[691]4.9344,[692]4.9317,[693]4.9281,[694]4.9253,[695]4.9205,[696]4.9239,[697]4.9236,[698]4.9250,[699]4.9253, |
| save_imatrix: stored collected data after 700 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [700]4.9264,[701]4.9266,[702]4.9274,[703]4.9282,[704]4.9293,[705]4.9305,[706]4.9297,[707]4.9306,[708]4.9321,[709]4.9341, |
| save_imatrix: stored collected data after 710 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [710]4.9370,[711]4.9386,[712]4.9391,[713]4.9395,[714]4.9398,[715]4.9423,[716]4.9440,[717]4.9440,[718]4.9427,[719]4.9408, |
| save_imatrix: stored collected data after 720 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [720]4.9421,[721]4.9446,[722]4.9459,[723]4.9476,[724]4.9484,[725]4.9493,[726]4.9485,[727]4.9486,[728]4.9493,[729]4.9506, |
| save_imatrix: stored collected data after 730 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [730]4.9509,[731]4.9526,[732]4.9524,[733]4.9536,[734]4.9544,[735]4.9562,[736]4.9564,[737]4.9573,[738]4.9576,[739]4.9599, |
| save_imatrix: stored collected data after 740 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [740]4.9624,[741]4.9633,[742]4.9636,[743]4.9641,[744]4.9640,[745]4.9665,[746]4.9665,[747]4.9676,[748]4.9677,[749]4.9695, |
| save_imatrix: stored collected data after 750 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [750]4.9703,[751]4.9701,[752]4.9708,[753]4.9718,[754]4.9729,[755]4.9751,[756]4.9740,[757]4.9740,[758]4.9761,[759]4.9784, |
| save_imatrix: stored collected data after 760 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [760]4.9807,[761]4.9807,[762]4.9810,[763]4.9809,[764]4.9803,[765]4.9808,[766]4.9811,[767]4.9815,[768]4.9813,[769]4.9834, |
| save_imatrix: stored collected data after 770 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [770]4.9832,[771]4.9852,[772]4.9855,[773]4.9849,[774]4.9859,[775]4.9868,[776]4.9901,[777]4.9946,[778]4.9947,[779]4.9945, |
| save_imatrix: stored collected data after 780 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [780]4.9944,[781]4.9979,[782]4.9989,[783]4.9984,[784]4.9997,[785]5.0025,[786]5.0034,[787]5.0038,[788]5.0037,[789]5.0039, |
| save_imatrix: stored collected data after 790 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| [790]5.0040,[791]5.0038,[792]5.0053,[793]5.0062,[794]5.0060,[795]5.0065,[796]5.0077, |
| save_imatrix: stored collected data after 796 chunks in /mnt/data/models/ubergarm/MiniMax-M2.7-GGUF/imatrix-MiniMax-M2.7-BF16.dat |
| |
| Final estimate: PPL = 5.0077 +/- 0.02927 |
| |
| ======================== sorted layer importances |
| 0: Layer 0, <cos_sim> = 0.314319 |
| 1: Layer 61, <cos_sim> = 0.747689 |
| 2: Layer 1, <cos_sim> = 0.756628 |
| 3: Layer 4, <cos_sim> = 0.83165 |
| 4: Layer 5, <cos_sim> = 0.85227 |
| 5: Layer 3, <cos_sim> = 0.879032 |
| 6: Layer 2, <cos_sim> = 0.913412 |
| 7: Layer 60, <cos_sim> = 0.921196 |
| 8: Layer 6, <cos_sim> = 0.929439 |
| 9: Layer 27, <cos_sim> = 0.929467 |
| 10: Layer 24, <cos_sim> = 0.936035 |
| 11: Layer 31, <cos_sim> = 0.936311 |
| 12: Layer 7, <cos_sim> = 0.936849 |
| 13: Layer 28, <cos_sim> = 0.937045 |
| 14: Layer 23, <cos_sim> = 0.939549 |
| 15: Layer 8, <cos_sim> = 0.94017 |
| 16: Layer 26, <cos_sim> = 0.940291 |
| 17: Layer 39, <cos_sim> = 0.942122 |
| 18: Layer 32, <cos_sim> = 0.942581 |
| 19: Layer 9, <cos_sim> = 0.94394 |
| 20: Layer 25, <cos_sim> = 0.944352 |
| 21: Layer 30, <cos_sim> = 0.945021 |
| 22: Layer 29, <cos_sim> = 0.945598 |
| 23: Layer 37, <cos_sim> = 0.946253 |
| 24: Layer 18, <cos_sim> = 0.947922 |
| 25: Layer 38, <cos_sim> = 0.949 |
| 26: Layer 11, <cos_sim> = 0.949036 |
| 27: Layer 34, <cos_sim> = 0.949104 |
| 28: Layer 41, <cos_sim> = 0.949253 |
| 29: Layer 17, <cos_sim> = 0.949477 |
| 30: Layer 22, <cos_sim> = 0.950325 |
| 31: Layer 10, <cos_sim> = 0.950418 |
| 32: Layer 35, <cos_sim> = 0.950613 |
| 33: Layer 58, <cos_sim> = 0.950771 |
| 34: Layer 15, <cos_sim> = 0.951046 |
| 35: Layer 59, <cos_sim> = 0.95122 |
| 36: Layer 49, <cos_sim> = 0.951834 |
| 37: Layer 43, <cos_sim> = 0.952029 |
| 38: Layer 16, <cos_sim> = 0.952079 |
| 39: Layer 36, <cos_sim> = 0.95235 |
| 40: Layer 40, <cos_sim> = 0.952539 |
| 41: Layer 21, <cos_sim> = 0.952563 |
| 42: Layer 12, <cos_sim> = 0.953459 |
| 43: Layer 46, <cos_sim> = 0.954189 |
| 44: Layer 33, <cos_sim> = 0.955066 |
| 45: Layer 57, <cos_sim> = 0.955185 |
| 46: Layer 13, <cos_sim> = 0.955958 |
| 47: Layer 19, <cos_sim> = 0.958471 |
| 48: Layer 48, <cos_sim> = 0.959151 |
| 49: Layer 54, <cos_sim> = 0.960254 |
| 50: Layer 51, <cos_sim> = 0.960338 |
| 51: Layer 44, <cos_sim> = 0.960788 |
| 52: Layer 42, <cos_sim> = 0.960864 |
| 53: Layer 45, <cos_sim> = 0.961023 |
| 54: Layer 50, <cos_sim> = 0.961289 |
| 55: Layer 56, <cos_sim> = 0.962136 |
| 56: Layer 20, <cos_sim> = 0.962164 |
| 57: Layer 52, <cos_sim> = 0.962365 |
| 58: Layer 47, <cos_sim> = 0.963786 |
| 59: Layer 53, <cos_sim> = 0.96446 |
| 60: Layer 55, <cos_sim> = 0.964589 |
| 61: Layer 14, <cos_sim> = 0.964797 |
| |
| ======================== sorted attention importances |
| 0: Layer 0, <cos_sim> = 0.070671 |
| 1: Layer 5, <cos_sim> = 0.325468 |
| 2: Layer 3, <cos_sim> = 0.369615 |
| 3: Layer 2, <cos_sim> = 0.412956 |
| 4: Layer 4, <cos_sim> = 0.573739 |
| 5: Layer 7, <cos_sim> = 0.585959 |
| 6: Layer 11, <cos_sim> = 0.586286 |
| 7: Layer 6, <cos_sim> = 0.595757 |
| 8: Layer 9, <cos_sim> = 0.607441 |
| 9: Layer 12, <cos_sim> = 0.655411 |
| 10: Layer 8, <cos_sim> = 0.666884 |
| 11: Layer 15, <cos_sim> = 0.668835 |
| 12: Layer 10, <cos_sim> = 0.66924 |
| 13: Layer 17, <cos_sim> = 0.685496 |
| 14: Layer 1, <cos_sim> = 0.695764 |
| 15: Layer 14, <cos_sim> = 0.696466 |
| 16: Layer 22, <cos_sim> = 0.708887 |
| 17: Layer 20, <cos_sim> = 0.73429 |
| 18: Layer 23, <cos_sim> = 0.734495 |
| 19: Layer 16, <cos_sim> = 0.738226 |
| 20: Layer 21, <cos_sim> = 0.740639 |
| 21: Layer 18, <cos_sim> = 0.742008 |
| 22: Layer 19, <cos_sim> = 0.761501 |
| 23: Layer 13, <cos_sim> = 0.762193 |
| 24: Layer 26, <cos_sim> = 0.792264 |
| 25: Layer 24, <cos_sim> = 0.801974 |
| 26: Layer 27, <cos_sim> = 0.811254 |
| 27: Layer 28, <cos_sim> = 0.822608 |
| 28: Layer 25, <cos_sim> = 0.823736 |
| 29: Layer 29, <cos_sim> = 0.841409 |
| 30: Layer 30, <cos_sim> = 0.848063 |
| 31: Layer 31, <cos_sim> = 0.862063 |
| 32: Layer 32, <cos_sim> = 0.86227 |
| 33: Layer 33, <cos_sim> = 0.869472 |
| 34: Layer 34, <cos_sim> = 0.881373 |
| 35: Layer 36, <cos_sim> = 0.884664 |
| 36: Layer 35, <cos_sim> = 0.893423 |
| 37: Layer 37, <cos_sim> = 0.894579 |
| 38: Layer 39, <cos_sim> = 0.89667 |
| 39: Layer 38, <cos_sim> = 0.896756 |
| 40: Layer 61, <cos_sim> = 0.899749 |
| 41: Layer 40, <cos_sim> = 0.904017 |
| 42: Layer 43, <cos_sim> = 0.922443 |
| 43: Layer 41, <cos_sim> = 0.927151 |
| 44: Layer 42, <cos_sim> = 0.93657 |
| 45: Layer 49, <cos_sim> = 0.941207 |
| llama_print_timings: load time = 95309.51 ms |
| llama_print_timings: sample time = 0.00 ms / 1 runs ( 0.00 ms per token, inf tokens per second) |
| llama_print_timings: prompt eval time = 3029558.42 ms / 407552 tokens ( 7.43 ms per token, 134.53 tokens per second) |
| llama_print_timings: eval time = 0.00 ms / 1 runs ( 0.00 ms per token, inf tokens per second) |
| llama_print_timings: total time = 3135252.92 ms / 407553 tokens |
| 46: Layer 44, <cos_sim> = 0.94793 |
| 47: Layer 45, <cos_sim> = 0.948874 |
| 48: Layer 46, <cos_sim> = 0.951086 |
| 49: Layer 47, <cos_sim> = 0.954018 |
| 50: Layer 52, <cos_sim> = 0.955026 |
| 51: Layer 48, <cos_sim> = 0.960921 |
| 52: Layer 50, <cos_sim> = 0.96179 |
| 53: Layer 60, <cos_sim> = 0.962736 |
| 54: Layer 58, <cos_sim> = 0.965627 |
| 55: Layer 54, <cos_sim> = 0.965685 |
| 56: Layer 51, <cos_sim> = 0.966247 |
| 57: Layer 59, <cos_sim> = 0.969823 |
| 58: Layer 53, <cos_sim> = 0.970095 |
| 59: Layer 57, <cos_sim> = 0.970563 |
| 60: Layer 56, <cos_sim> = 0.972371 |
| 61: Layer 55, <cos_sim> = 0.974544 |
| |
| ======================== sorted ffn importances |
| 0: Layer 4, <cos_sim> = 0.317384 |
| 1: Layer 2, <cos_sim> = 0.460713 |
| 2: Layer 3, <cos_sim> = 0.566183 |
| 3: Layer 6, <cos_sim> = 0.57249 |
| 4: Layer 5, <cos_sim> = 0.579167 |
| 5: Layer 10, <cos_sim> = 0.601761 |
| 6: Layer 8, <cos_sim> = 0.601878 |
| 7: Layer 0, <cos_sim> = 0.622948 |
| 8: Layer 11, <cos_sim> = 0.638515 |
| 9: Layer 9, <cos_sim> = 0.6441 |
| 10: Layer 14, <cos_sim> = 0.649876 |
| 11: Layer 7, <cos_sim> = 0.670979 |
| 12: Layer 16, <cos_sim> = 0.679592 |
| 13: Layer 13, <cos_sim> = 0.684167 |
| 14: Layer 21, <cos_sim> = 0.689835 |
| 15: Layer 1, <cos_sim> = 0.709895 |
| 16: Layer 19, <cos_sim> = 0.710139 |
| 17: Layer 20, <cos_sim> = 0.721436 |
| 18: Layer 22, <cos_sim> = 0.7316 |
| 19: Layer 15, <cos_sim> = 0.732324 |
| 20: Layer 17, <cos_sim> = 0.742242 |
| 21: Layer 12, <cos_sim> = 0.742858 |
| 22: Layer 18, <cos_sim> = 0.746992 |
| 23: Layer 25, <cos_sim> = 0.779369 |
| 24: Layer 23, <cos_sim> = 0.781141 |
| 25: Layer 26, <cos_sim> = 0.796414 |
| 26: Layer 24, <cos_sim> = 0.809111 |
| 27: Layer 27, <cos_sim> = 0.810032 |
| 28: Layer 29, <cos_sim> = 0.821859 |
| 29: Layer 28, <cos_sim> = 0.824159 |
| 30: Layer 30, <cos_sim> = 0.843586 |
| 31: Layer 31, <cos_sim> = 0.848297 |
| 32: Layer 32, <cos_sim> = 0.855983 |
| 33: Layer 33, <cos_sim> = 0.86832 |
| 34: Layer 35, <cos_sim> = 0.871202 |
| 35: Layer 61, <cos_sim> = 0.872646 |
| 36: Layer 36, <cos_sim> = 0.883183 |
| 37: Layer 34, <cos_sim> = 0.88452 |
| 38: Layer 39, <cos_sim> = 0.888821 |
| 39: Layer 37, <cos_sim> = 0.892246 |
| 40: Layer 38, <cos_sim> = 0.895153 |
| 41: Layer 42, <cos_sim> = 0.907247 |
| 42: Layer 40, <cos_sim> = 0.908511 |
| 43: Layer 41, <cos_sim> = 0.916338 |
| 44: Layer 48, <cos_sim> = 0.926847 |
| 45: Layer 44, <cos_sim> = 0.927916 |
| 46: Layer 43, <cos_sim> = 0.931278 |
| 47: Layer 46, <cos_sim> = 0.933581 |
| 48: Layer 51, <cos_sim> = 0.937163 |
| 49: Layer 45, <cos_sim> = 0.937349 |
| 50: Layer 49, <cos_sim> = 0.939469 |
| 51: Layer 47, <cos_sim> = 0.943874 |
| 52: Layer 53, <cos_sim> = 0.947779 |
| 53: Layer 50, <cos_sim> = 0.947821 |
| 54: Layer 54, <cos_sim> = 0.951103 |
| 55: Layer 52, <cos_sim> = 0.951138 |
| 56: Layer 56, <cos_sim> = 0.955928 |
| 57: Layer 55, <cos_sim> = 0.956456 |
| 58: Layer 60, <cos_sim> = 0.957153 |
| 59: Layer 57, <cos_sim> = 0.962098 |
| 60: Layer 58, <cos_sim> = 0.970282 |
| 61: Layer 59, <cos_sim> = 0.971508 |
| |