File size: 3,641 Bytes
{
"bits": 4,
"group_size": 128,
"sym": true,
"data_type": "int",
"seqlen": 512,
"batch_size": 1,
"scale_dtype": "None",
"gradient_accumulate_steps": 8,
"iters": 100,
"to_quant_block_names": "model.language_model.layers",
"dataset": "/data/fengdahu/tmp/dataset_calib1208/mobimind_calibration_20k.json",
"autoround_version": "0.9.2",
"provider": "auto-round",
"quant_method": "awq",
"zero_point": false,
"version": "gemm",
"modules_to_not_convert": [
"blocks.0.attn.qkv",
"blocks.0.attn.proj",
"blocks.0.mlp.linear_fc1",
"blocks.0.mlp.linear_fc2",
"blocks.1.attn.qkv",
"blocks.1.attn.proj",
"blocks.1.mlp.linear_fc1",
"blocks.1.mlp.linear_fc2",
"blocks.2.attn.qkv",
"blocks.2.attn.proj",
"blocks.2.mlp.linear_fc1",
"blocks.2.mlp.linear_fc2",
"blocks.3.attn.qkv",
"blocks.3.attn.proj",
"blocks.3.mlp.linear_fc1",
"blocks.3.mlp.linear_fc2",
"blocks.4.attn.qkv",
"blocks.4.attn.proj",
"blocks.4.mlp.linear_fc1",
"blocks.4.mlp.linear_fc2",
"blocks.5.attn.qkv",
"blocks.5.attn.proj",
"blocks.5.mlp.linear_fc1",
"blocks.5.mlp.linear_fc2",
"blocks.6.attn.qkv",
"blocks.6.attn.proj",
"blocks.6.mlp.linear_fc1",
"blocks.6.mlp.linear_fc2",
"blocks.7.attn.qkv",
"blocks.7.attn.proj",
"blocks.7.mlp.linear_fc1",
"blocks.7.mlp.linear_fc2",
"blocks.8.attn.qkv",
"blocks.8.attn.proj",
"blocks.8.mlp.linear_fc1",
"blocks.8.mlp.linear_fc2",
"blocks.9.attn.qkv",
"blocks.9.attn.proj",
"blocks.9.mlp.linear_fc1",
"blocks.9.mlp.linear_fc2",
"blocks.10.attn.qkv",
"blocks.10.attn.proj",
"blocks.10.mlp.linear_fc1",
"blocks.10.mlp.linear_fc2",
"blocks.11.attn.qkv",
"blocks.11.attn.proj",
"blocks.11.mlp.linear_fc1",
"blocks.11.mlp.linear_fc2",
"blocks.12.attn.qkv",
"blocks.12.attn.proj",
"blocks.12.mlp.linear_fc1",
"blocks.12.mlp.linear_fc2",
"blocks.13.attn.qkv",
"blocks.13.attn.proj",
"blocks.13.mlp.linear_fc1",
"blocks.13.mlp.linear_fc2",
"blocks.14.attn.qkv",
"blocks.14.attn.proj",
"blocks.14.mlp.linear_fc1",
"blocks.14.mlp.linear_fc2",
"blocks.15.attn.qkv",
"blocks.15.attn.proj",
"blocks.15.mlp.linear_fc1",
"blocks.15.mlp.linear_fc2",
"blocks.16.attn.qkv",
"blocks.16.attn.proj",
"blocks.16.mlp.linear_fc1",
"blocks.16.mlp.linear_fc2",
"blocks.17.attn.qkv",
"blocks.17.attn.proj",
"blocks.17.mlp.linear_fc1",
"blocks.17.mlp.linear_fc2",
"blocks.18.attn.qkv",
"blocks.18.attn.proj",
"blocks.18.mlp.linear_fc1",
"blocks.18.mlp.linear_fc2",
"blocks.19.attn.qkv",
"blocks.19.attn.proj",
"blocks.19.mlp.linear_fc1",
"blocks.19.mlp.linear_fc2",
"blocks.20.attn.qkv",
"blocks.20.attn.proj",
"blocks.20.mlp.linear_fc1",
"blocks.20.mlp.linear_fc2",
"blocks.21.attn.qkv",
"blocks.21.attn.proj",
"blocks.21.mlp.linear_fc1",
"blocks.21.mlp.linear_fc2",
"blocks.22.attn.qkv",
"blocks.22.attn.proj",
"blocks.22.mlp.linear_fc1",
"blocks.22.mlp.linear_fc2",
"blocks.23.attn.qkv",
"blocks.23.attn.proj",
"blocks.23.mlp.linear_fc1",
"blocks.23.mlp.linear_fc2",
"merger.linear_fc1",
"merger.linear_fc2",
"deepstack_merger_list.0.linear_fc1",
"deepstack_merger_list.0.linear_fc2",
"deepstack_merger_list.1.linear_fc1",
"deepstack_merger_list.1.linear_fc2",
"deepstack_merger_list.2.linear_fc1",
"deepstack_merger_list.2.linear_fc2",
"lm_head",
"model.visual.deepstack_merger_list",
"model.visual.blocks"
]
}