| { | |
| "_name_or_path": "../plms/bert-base-uncased", | |
| "architectures": [ | |
| "SparseBertHidden" | |
| ], | |
| "attention_probs_dropout_prob": 0.1, | |
| "classifier_dropout": null, | |
| "gradient_checkpointing": false, | |
| "hidden_act": "gelu", | |
| "hidden_dropout_prob": 0.1, | |
| "hidden_size": 768, | |
| "initializer_range": 0.02, | |
| "intermediate_size": 3072, | |
| "layer_norm_eps": 1e-12, | |
| "layer_skip": 1, | |
| "max_position_embeddings": 512, | |
| "model_type": "bert", | |
| "num_attention_heads": 12, | |
| "num_hidden_layers": 12, | |
| "pad_token_id": 0, | |
| "position_embedding_type": "absolute", | |
| "sparsity": "0", | |
| "sparsity_map": { | |
| "0": { | |
| "head": {}, | |
| "hidden": { | |
| "-1": 0, | |
| "0": 0, | |
| "1": 0, | |
| "10": 0, | |
| "11": 0, | |
| "2": 0, | |
| "3": 0, | |
| "4": 0, | |
| "5": 0, | |
| "6": 0, | |
| "7": 0, | |
| "8": 0, | |
| "9": 0 | |
| }, | |
| "neuron": {} | |
| }, | |
| "10": { | |
| "head": { | |
| "1": 5, | |
| "11": 1, | |
| "3": 1 | |
| }, | |
| "hidden": { | |
| "-1": 38, | |
| "0": 38, | |
| "1": 38, | |
| "10": 38, | |
| "11": 38, | |
| "2": 38, | |
| "3": 38, | |
| "4": 38, | |
| "5": 38, | |
| "6": 38, | |
| "7": 38, | |
| "8": 38, | |
| "9": 38 | |
| }, | |
| "neuron": { | |
| "0": 190, | |
| "1": 298, | |
| "11": 1, | |
| "2": 1323, | |
| "3": 4, | |
| "4": 5, | |
| "5": 8, | |
| "6": 4, | |
| "7": 7, | |
| "8": 2, | |
| "9": 1 | |
| } | |
| }, | |
| "20": { | |
| "head": { | |
| "0": 1, | |
| "1": 7, | |
| "10": 1, | |
| "11": 4, | |
| "3": 2, | |
| "9": 1 | |
| }, | |
| "hidden": { | |
| "-1": 84, | |
| "0": 84, | |
| "1": 84, | |
| "10": 84, | |
| "11": 84, | |
| "2": 84, | |
| "3": 84, | |
| "4": 84, | |
| "5": 84, | |
| "6": 84, | |
| "7": 84, | |
| "8": 84, | |
| "9": 84 | |
| }, | |
| "neuron": { | |
| "0": 597, | |
| "1": 802, | |
| "11": 16, | |
| "2": 2294, | |
| "3": 48, | |
| "4": 78, | |
| "5": 123, | |
| "6": 22, | |
| "7": 47, | |
| "8": 23, | |
| "9": 5 | |
| } | |
| }, | |
| "30": { | |
| "head": { | |
| "0": 1, | |
| "1": 8, | |
| "10": 2, | |
| "11": 4, | |
| "2": 1, | |
| "3": 2, | |
| "6": 1, | |
| "7": 1, | |
| "8": 1, | |
| "9": 2 | |
| }, | |
| "hidden": { | |
| "-1": 123, | |
| "0": 123, | |
| "1": 123, | |
| "10": 123, | |
| "11": 123, | |
| "2": 123, | |
| "3": 123, | |
| "4": 123, | |
| "5": 123, | |
| "6": 123, | |
| "7": 123, | |
| "8": 123, | |
| "9": 123 | |
| }, | |
| "neuron": { | |
| "0": 980, | |
| "1": 1233, | |
| "10": 2, | |
| "11": 116, | |
| "2": 2512, | |
| "3": 132, | |
| "4": 233, | |
| "5": 386, | |
| "6": 61, | |
| "7": 146, | |
| "8": 73, | |
| "9": 24 | |
| } | |
| }, | |
| "40": { | |
| "head": { | |
| "0": 3, | |
| "1": 8, | |
| "10": 2, | |
| "11": 5, | |
| "2": 1, | |
| "3": 3, | |
| "4": 2, | |
| "5": 1, | |
| "6": 2, | |
| "7": 1, | |
| "8": 1, | |
| "9": 4 | |
| }, | |
| "hidden": { | |
| "-1": 177, | |
| "0": 177, | |
| "1": 177, | |
| "10": 177, | |
| "11": 177, | |
| "2": 177, | |
| "3": 177, | |
| "4": 177, | |
| "5": 177, | |
| "6": 177, | |
| "7": 177, | |
| "8": 177, | |
| "9": 177 | |
| }, | |
| "neuron": { | |
| "0": 1436, | |
| "1": 1664, | |
| "10": 6, | |
| "11": 518, | |
| "2": 2634, | |
| "3": 306, | |
| "4": 449, | |
| "5": 732, | |
| "6": 138, | |
| "7": 321, | |
| "8": 184, | |
| "9": 91 | |
| } | |
| }, | |
| "50": { | |
| "head": { | |
| "0": 5, | |
| "1": 8, | |
| "10": 3, | |
| "11": 5, | |
| "2": 2, | |
| "3": 3, | |
| "4": 3, | |
| "5": 2, | |
| "6": 3, | |
| "7": 2, | |
| "8": 2, | |
| "9": 4 | |
| }, | |
| "hidden": { | |
| "-1": 223, | |
| "0": 223, | |
| "1": 223, | |
| "10": 223, | |
| "11": 223, | |
| "2": 223, | |
| "3": 223, | |
| "4": 223, | |
| "5": 223, | |
| "6": 223, | |
| "7": 223, | |
| "8": 223, | |
| "9": 223 | |
| }, | |
| "neuron": { | |
| "0": 1749, | |
| "1": 1933, | |
| "10": 21, | |
| "11": 915, | |
| "2": 2699, | |
| "3": 519, | |
| "4": 664, | |
| "5": 976, | |
| "6": 252, | |
| "7": 469, | |
| "8": 307, | |
| "9": 187 | |
| } | |
| }, | |
| "60": { | |
| "head": { | |
| "0": 6, | |
| "1": 8, | |
| "10": 5, | |
| "11": 7, | |
| "2": 3, | |
| "3": 4, | |
| "4": 4, | |
| "5": 3, | |
| "6": 5, | |
| "7": 2, | |
| "8": 2, | |
| "9": 4 | |
| }, | |
| "hidden": { | |
| "-1": 284, | |
| "0": 284, | |
| "1": 284, | |
| "10": 284, | |
| "11": 284, | |
| "2": 284, | |
| "3": 284, | |
| "4": 284, | |
| "5": 284, | |
| "6": 284, | |
| "7": 284, | |
| "8": 284, | |
| "9": 284 | |
| }, | |
| "neuron": { | |
| "0": 2065, | |
| "1": 2200, | |
| "10": 67, | |
| "11": 1392, | |
| "2": 2762, | |
| "3": 817, | |
| "4": 991, | |
| "5": 1279, | |
| "6": 454, | |
| "7": 695, | |
| "8": 521, | |
| "9": 397 | |
| } | |
| }, | |
| "70": { | |
| "head": { | |
| "0": 6, | |
| "1": 8, | |
| "10": 6, | |
| "11": 7, | |
| "2": 4, | |
| "3": 6, | |
| "4": 4, | |
| "5": 5, | |
| "6": 6, | |
| "7": 3, | |
| "8": 5, | |
| "9": 5 | |
| }, | |
| "hidden": { | |
| "-1": 346, | |
| "0": 346, | |
| "1": 346, | |
| "10": 346, | |
| "11": 346, | |
| "2": 346, | |
| "3": 346, | |
| "4": 346, | |
| "5": 346, | |
| "6": 346, | |
| "7": 346, | |
| "8": 346, | |
| "9": 346 | |
| }, | |
| "neuron": { | |
| "0": 2266, | |
| "1": 2390, | |
| "10": 206, | |
| "11": 1745, | |
| "2": 2820, | |
| "3": 1173, | |
| "4": 1308, | |
| "5": 1537, | |
| "6": 694, | |
| "7": 951, | |
| "8": 791, | |
| "9": 708 | |
| } | |
| }, | |
| "80": { | |
| "head": { | |
| "0": 6, | |
| "1": 9, | |
| "10": 8, | |
| "11": 8, | |
| "2": 6, | |
| "3": 6, | |
| "4": 6, | |
| "5": 9, | |
| "6": 7, | |
| "7": 4, | |
| "8": 5, | |
| "9": 5 | |
| }, | |
| "hidden": { | |
| "-1": 422, | |
| "0": 422, | |
| "1": 422, | |
| "10": 422, | |
| "11": 422, | |
| "2": 422, | |
| "3": 422, | |
| "4": 422, | |
| "5": 422, | |
| "6": 422, | |
| "7": 422, | |
| "8": 422, | |
| "9": 422 | |
| }, | |
| "neuron": { | |
| "0": 2450, | |
| "1": 2541, | |
| "10": 574, | |
| "11": 2105, | |
| "2": 2863, | |
| "3": 1559, | |
| "4": 1676, | |
| "5": 1862, | |
| "6": 1071, | |
| "7": 1294, | |
| "8": 1154, | |
| "9": 1126 | |
| } | |
| }, | |
| "85": { | |
| "head": { | |
| "0": 6, | |
| "1": 9, | |
| "10": 10, | |
| "11": 8, | |
| "2": 6, | |
| "3": 6, | |
| "4": 7, | |
| "5": 9, | |
| "6": 8, | |
| "7": 7, | |
| "8": 5, | |
| "9": 7 | |
| }, | |
| "hidden": { | |
| "-1": 468, | |
| "0": 468, | |
| "1": 468, | |
| "10": 468, | |
| "11": 468, | |
| "2": 468, | |
| "3": 468, | |
| "4": 468, | |
| "5": 468, | |
| "6": 468, | |
| "7": 468, | |
| "8": 468, | |
| "9": 468 | |
| }, | |
| "neuron": { | |
| "0": 2554, | |
| "1": 2635, | |
| "10": 936, | |
| "11": 2278, | |
| "2": 2889, | |
| "3": 1780, | |
| "4": 1836, | |
| "5": 2037, | |
| "6": 1292, | |
| "7": 1489, | |
| "8": 1360, | |
| "9": 1401 | |
| } | |
| }, | |
| "90": { | |
| "head": { | |
| "0": 6, | |
| "1": 9, | |
| "10": 11, | |
| "11": 8, | |
| "2": 7, | |
| "3": 7, | |
| "4": 9, | |
| "5": 9, | |
| "6": 9, | |
| "7": 9, | |
| "8": 6, | |
| "9": 8 | |
| }, | |
| "hidden": { | |
| "-1": 522, | |
| "0": 522, | |
| "1": 522, | |
| "10": 522, | |
| "11": 522, | |
| "2": 522, | |
| "3": 522, | |
| "4": 522, | |
| "5": 522, | |
| "6": 522, | |
| "7": 522, | |
| "8": 522, | |
| "9": 522 | |
| }, | |
| "neuron": { | |
| "0": 2653, | |
| "1": 2713, | |
| "10": 1390, | |
| "11": 2433, | |
| "2": 2913, | |
| "3": 2013, | |
| "4": 2064, | |
| "5": 2243, | |
| "6": 1569, | |
| "7": 1741, | |
| "8": 1648, | |
| "9": 1688 | |
| } | |
| }, | |
| "95": { | |
| "head": { | |
| "0": 8, | |
| "1": 10, | |
| "10": 11, | |
| "11": 9, | |
| "2": 9, | |
| "3": 9, | |
| "4": 9, | |
| "5": 9, | |
| "6": 11, | |
| "7": 9, | |
| "8": 9, | |
| "9": 9 | |
| }, | |
| "hidden": { | |
| "-1": 599, | |
| "0": 599, | |
| "1": 599, | |
| "10": 599, | |
| "11": 599, | |
| "2": 599, | |
| "3": 599, | |
| "4": 599, | |
| "5": 599, | |
| "6": 599, | |
| "7": 599, | |
| "8": 599, | |
| "9": 599 | |
| }, | |
| "neuron": { | |
| "0": 2753, | |
| "1": 2799, | |
| "10": 2001, | |
| "11": 2654, | |
| "2": 2948, | |
| "3": 2337, | |
| "4": 2381, | |
| "5": 2519, | |
| "6": 1992, | |
| "7": 2148, | |
| "8": 2061, | |
| "9": 2161 | |
| } | |
| }, | |
| "96": { | |
| "head": { | |
| "0": 9, | |
| "1": 10, | |
| "10": 11, | |
| "11": 10, | |
| "2": 9, | |
| "3": 9, | |
| "4": 9, | |
| "5": 10, | |
| "6": 11, | |
| "7": 9, | |
| "8": 9, | |
| "9": 9 | |
| }, | |
| "hidden": { | |
| "-1": 614, | |
| "0": 614, | |
| "1": 614, | |
| "10": 614, | |
| "11": 614, | |
| "2": 614, | |
| "3": 614, | |
| "4": 614, | |
| "5": 614, | |
| "6": 614, | |
| "7": 614, | |
| "8": 614, | |
| "9": 614 | |
| }, | |
| "neuron": { | |
| "0": 2768, | |
| "1": 2822, | |
| "10": 2133, | |
| "11": 2689, | |
| "2": 2955, | |
| "3": 2392, | |
| "4": 2439, | |
| "5": 2579, | |
| "6": 2077, | |
| "7": 2223, | |
| "8": 2148, | |
| "9": 2266 | |
| } | |
| }, | |
| "97": { | |
| "head": { | |
| "0": 10, | |
| "1": 10, | |
| "10": 11, | |
| "11": 10, | |
| "2": 9, | |
| "3": 9, | |
| "4": 9, | |
| "5": 10, | |
| "6": 11, | |
| "7": 10, | |
| "8": 11, | |
| "9": 10 | |
| }, | |
| "hidden": { | |
| "-1": 637, | |
| "0": 637, | |
| "1": 637, | |
| "10": 637, | |
| "11": 637, | |
| "2": 637, | |
| "3": 637, | |
| "4": 637, | |
| "5": 637, | |
| "6": 637, | |
| "7": 637, | |
| "8": 637, | |
| "9": 637 | |
| }, | |
| "neuron": { | |
| "0": 2799, | |
| "1": 2846, | |
| "10": 2294, | |
| "11": 2746, | |
| "2": 2970, | |
| "3": 2487, | |
| "4": 2537, | |
| "5": 2656, | |
| "6": 2207, | |
| "7": 2355, | |
| "8": 2291, | |
| "9": 2409 | |
| } | |
| }, | |
| "98": { | |
| "head": { | |
| "0": 11, | |
| "1": 10, | |
| "10": 11, | |
| "11": 10, | |
| "2": 10, | |
| "3": 10, | |
| "4": 10, | |
| "5": 10, | |
| "6": 11, | |
| "7": 10, | |
| "8": 11, | |
| "9": 10 | |
| }, | |
| "hidden": { | |
| "-1": 660, | |
| "0": 660, | |
| "1": 660, | |
| "10": 660, | |
| "11": 660, | |
| "2": 660, | |
| "3": 660, | |
| "4": 660, | |
| "5": 660, | |
| "6": 660, | |
| "7": 660, | |
| "8": 660, | |
| "9": 660 | |
| }, | |
| "neuron": { | |
| "0": 2826, | |
| "1": 2870, | |
| "10": 2455, | |
| "11": 2794, | |
| "2": 2984, | |
| "3": 2588, | |
| "4": 2634, | |
| "5": 2726, | |
| "6": 2350, | |
| "7": 2501, | |
| "8": 2440, | |
| "9": 2535 | |
| } | |
| }, | |
| "99": { | |
| "head": { | |
| "0": 11, | |
| "1": 10, | |
| "10": 11, | |
| "11": 11, | |
| "2": 11, | |
| "3": 11, | |
| "4": 11, | |
| "5": 11, | |
| "6": 11, | |
| "7": 11, | |
| "8": 11, | |
| "9": 10 | |
| }, | |
| "hidden": { | |
| "-1": 691, | |
| "0": 691, | |
| "1": 691, | |
| "10": 691, | |
| "11": 691, | |
| "2": 691, | |
| "3": 691, | |
| "4": 691, | |
| "5": 691, | |
| "6": 691, | |
| "7": 691, | |
| "8": 691, | |
| "9": 691 | |
| }, | |
| "neuron": { | |
| "0": 2861, | |
| "1": 2915, | |
| "10": 2683, | |
| "11": 2862, | |
| "2": 2998, | |
| "3": 2709, | |
| "4": 2746, | |
| "5": 2845, | |
| "6": 2551, | |
| "7": 2678, | |
| "8": 2635, | |
| "9": 2695 | |
| } | |
| } | |
| }, | |
| "torch_dtype": "float32", | |
| "transformers_version": "4.12.0", | |
| "type_vocab_size": 2, | |
| "use_cache": true, | |
| "vocab_size": 30522 | |
| } | |