| { |
| "_name_or_path": "../plms/bert-base-uncased", |
| "architectures": [ |
| "SparseBertHidden" |
| ], |
| "attention_probs_dropout_prob": 0.1, |
| "classifier_dropout": null, |
| "gradient_checkpointing": false, |
| "hidden_act": "gelu", |
| "hidden_dropout_prob": 0.1, |
| "hidden_size": 768, |
| "initializer_range": 0.02, |
| "intermediate_size": 3072, |
| "layer_norm_eps": 1e-12, |
| "layer_skip": 1, |
| "max_position_embeddings": 512, |
| "model_type": "bert", |
| "num_attention_heads": 12, |
| "num_hidden_layers": 12, |
| "pad_token_id": 0, |
| "position_embedding_type": "absolute", |
| "sparsity": "0", |
| "sparsity_map": { |
| "0": { |
| "head": {}, |
| "hidden": { |
| "-1": 0, |
| "0": 0, |
| "1": 0, |
| "10": 0, |
| "11": 0, |
| "2": 0, |
| "3": 0, |
| "4": 0, |
| "5": 0, |
| "6": 0, |
| "7": 0, |
| "8": 0, |
| "9": 0 |
| }, |
| "neuron": {} |
| }, |
| "10": { |
| "head": { |
| "1": 5, |
| "11": 1, |
| "3": 1 |
| }, |
| "hidden": { |
| "-1": 38, |
| "0": 38, |
| "1": 38, |
| "10": 38, |
| "11": 38, |
| "2": 38, |
| "3": 38, |
| "4": 38, |
| "5": 38, |
| "6": 38, |
| "7": 38, |
| "8": 38, |
| "9": 38 |
| }, |
| "neuron": { |
| "0": 190, |
| "1": 298, |
| "11": 1, |
| "2": 1323, |
| "3": 4, |
| "4": 5, |
| "5": 8, |
| "6": 4, |
| "7": 7, |
| "8": 2, |
| "9": 1 |
| } |
| }, |
| "20": { |
| "head": { |
| "0": 1, |
| "1": 7, |
| "10": 1, |
| "11": 4, |
| "3": 2, |
| "9": 1 |
| }, |
| "hidden": { |
| "-1": 84, |
| "0": 84, |
| "1": 84, |
| "10": 84, |
| "11": 84, |
| "2": 84, |
| "3": 84, |
| "4": 84, |
| "5": 84, |
| "6": 84, |
| "7": 84, |
| "8": 84, |
| "9": 84 |
| }, |
| "neuron": { |
| "0": 597, |
| "1": 802, |
| "11": 16, |
| "2": 2294, |
| "3": 48, |
| "4": 78, |
| "5": 123, |
| "6": 22, |
| "7": 47, |
| "8": 23, |
| "9": 5 |
| } |
| }, |
| "30": { |
| "head": { |
| "0": 1, |
| "1": 8, |
| "10": 2, |
| "11": 4, |
| "2": 1, |
| "3": 2, |
| "6": 1, |
| "7": 1, |
| "8": 1, |
| "9": 2 |
| }, |
| "hidden": { |
| "-1": 123, |
| "0": 123, |
| "1": 123, |
| "10": 123, |
| "11": 123, |
| "2": 123, |
| "3": 123, |
| "4": 123, |
| "5": 123, |
| "6": 123, |
| "7": 123, |
| "8": 123, |
| "9": 123 |
| }, |
| "neuron": { |
| "0": 980, |
| "1": 1233, |
| "10": 2, |
| "11": 116, |
| "2": 2512, |
| "3": 132, |
| "4": 233, |
| "5": 386, |
| "6": 61, |
| "7": 146, |
| "8": 73, |
| "9": 24 |
| } |
| }, |
| "40": { |
| "head": { |
| "0": 3, |
| "1": 8, |
| "10": 2, |
| "11": 5, |
| "2": 1, |
| "3": 3, |
| "4": 2, |
| "5": 1, |
| "6": 2, |
| "7": 1, |
| "8": 1, |
| "9": 4 |
| }, |
| "hidden": { |
| "-1": 177, |
| "0": 177, |
| "1": 177, |
| "10": 177, |
| "11": 177, |
| "2": 177, |
| "3": 177, |
| "4": 177, |
| "5": 177, |
| "6": 177, |
| "7": 177, |
| "8": 177, |
| "9": 177 |
| }, |
| "neuron": { |
| "0": 1436, |
| "1": 1664, |
| "10": 6, |
| "11": 518, |
| "2": 2634, |
| "3": 306, |
| "4": 449, |
| "5": 732, |
| "6": 138, |
| "7": 321, |
| "8": 184, |
| "9": 91 |
| } |
| }, |
| "50": { |
| "head": { |
| "0": 5, |
| "1": 8, |
| "10": 3, |
| "11": 5, |
| "2": 2, |
| "3": 3, |
| "4": 3, |
| "5": 2, |
| "6": 3, |
| "7": 2, |
| "8": 2, |
| "9": 4 |
| }, |
| "hidden": { |
| "-1": 223, |
| "0": 223, |
| "1": 223, |
| "10": 223, |
| "11": 223, |
| "2": 223, |
| "3": 223, |
| "4": 223, |
| "5": 223, |
| "6": 223, |
| "7": 223, |
| "8": 223, |
| "9": 223 |
| }, |
| "neuron": { |
| "0": 1749, |
| "1": 1933, |
| "10": 21, |
| "11": 915, |
| "2": 2699, |
| "3": 519, |
| "4": 664, |
| "5": 976, |
| "6": 252, |
| "7": 469, |
| "8": 307, |
| "9": 187 |
| } |
| }, |
| "60": { |
| "head": { |
| "0": 6, |
| "1": 8, |
| "10": 5, |
| "11": 7, |
| "2": 3, |
| "3": 4, |
| "4": 4, |
| "5": 3, |
| "6": 5, |
| "7": 2, |
| "8": 2, |
| "9": 4 |
| }, |
| "hidden": { |
| "-1": 284, |
| "0": 284, |
| "1": 284, |
| "10": 284, |
| "11": 284, |
| "2": 284, |
| "3": 284, |
| "4": 284, |
| "5": 284, |
| "6": 284, |
| "7": 284, |
| "8": 284, |
| "9": 284 |
| }, |
| "neuron": { |
| "0": 2065, |
| "1": 2200, |
| "10": 67, |
| "11": 1392, |
| "2": 2762, |
| "3": 817, |
| "4": 991, |
| "5": 1279, |
| "6": 454, |
| "7": 695, |
| "8": 521, |
| "9": 397 |
| } |
| }, |
| "70": { |
| "head": { |
| "0": 6, |
| "1": 8, |
| "10": 6, |
| "11": 7, |
| "2": 4, |
| "3": 6, |
| "4": 4, |
| "5": 5, |
| "6": 6, |
| "7": 3, |
| "8": 5, |
| "9": 5 |
| }, |
| "hidden": { |
| "-1": 346, |
| "0": 346, |
| "1": 346, |
| "10": 346, |
| "11": 346, |
| "2": 346, |
| "3": 346, |
| "4": 346, |
| "5": 346, |
| "6": 346, |
| "7": 346, |
| "8": 346, |
| "9": 346 |
| }, |
| "neuron": { |
| "0": 2266, |
| "1": 2390, |
| "10": 206, |
| "11": 1745, |
| "2": 2820, |
| "3": 1173, |
| "4": 1308, |
| "5": 1537, |
| "6": 694, |
| "7": 951, |
| "8": 791, |
| "9": 708 |
| } |
| }, |
| "80": { |
| "head": { |
| "0": 6, |
| "1": 9, |
| "10": 8, |
| "11": 8, |
| "2": 6, |
| "3": 6, |
| "4": 6, |
| "5": 9, |
| "6": 7, |
| "7": 4, |
| "8": 5, |
| "9": 5 |
| }, |
| "hidden": { |
| "-1": 422, |
| "0": 422, |
| "1": 422, |
| "10": 422, |
| "11": 422, |
| "2": 422, |
| "3": 422, |
| "4": 422, |
| "5": 422, |
| "6": 422, |
| "7": 422, |
| "8": 422, |
| "9": 422 |
| }, |
| "neuron": { |
| "0": 2450, |
| "1": 2541, |
| "10": 574, |
| "11": 2105, |
| "2": 2863, |
| "3": 1559, |
| "4": 1676, |
| "5": 1862, |
| "6": 1071, |
| "7": 1294, |
| "8": 1154, |
| "9": 1126 |
| } |
| }, |
| "85": { |
| "head": { |
| "0": 6, |
| "1": 9, |
| "10": 10, |
| "11": 8, |
| "2": 6, |
| "3": 6, |
| "4": 7, |
| "5": 9, |
| "6": 8, |
| "7": 7, |
| "8": 5, |
| "9": 7 |
| }, |
| "hidden": { |
| "-1": 468, |
| "0": 468, |
| "1": 468, |
| "10": 468, |
| "11": 468, |
| "2": 468, |
| "3": 468, |
| "4": 468, |
| "5": 468, |
| "6": 468, |
| "7": 468, |
| "8": 468, |
| "9": 468 |
| }, |
| "neuron": { |
| "0": 2554, |
| "1": 2635, |
| "10": 936, |
| "11": 2278, |
| "2": 2889, |
| "3": 1780, |
| "4": 1836, |
| "5": 2037, |
| "6": 1292, |
| "7": 1489, |
| "8": 1360, |
| "9": 1401 |
| } |
| }, |
| "90": { |
| "head": { |
| "0": 6, |
| "1": 9, |
| "10": 11, |
| "11": 8, |
| "2": 7, |
| "3": 7, |
| "4": 9, |
| "5": 9, |
| "6": 9, |
| "7": 9, |
| "8": 6, |
| "9": 8 |
| }, |
| "hidden": { |
| "-1": 522, |
| "0": 522, |
| "1": 522, |
| "10": 522, |
| "11": 522, |
| "2": 522, |
| "3": 522, |
| "4": 522, |
| "5": 522, |
| "6": 522, |
| "7": 522, |
| "8": 522, |
| "9": 522 |
| }, |
| "neuron": { |
| "0": 2653, |
| "1": 2713, |
| "10": 1390, |
| "11": 2433, |
| "2": 2913, |
| "3": 2013, |
| "4": 2064, |
| "5": 2243, |
| "6": 1569, |
| "7": 1741, |
| "8": 1648, |
| "9": 1688 |
| } |
| }, |
| "95": { |
| "head": { |
| "0": 8, |
| "1": 10, |
| "10": 11, |
| "11": 9, |
| "2": 9, |
| "3": 9, |
| "4": 9, |
| "5": 9, |
| "6": 11, |
| "7": 9, |
| "8": 9, |
| "9": 9 |
| }, |
| "hidden": { |
| "-1": 599, |
| "0": 599, |
| "1": 599, |
| "10": 599, |
| "11": 599, |
| "2": 599, |
| "3": 599, |
| "4": 599, |
| "5": 599, |
| "6": 599, |
| "7": 599, |
| "8": 599, |
| "9": 599 |
| }, |
| "neuron": { |
| "0": 2753, |
| "1": 2799, |
| "10": 2001, |
| "11": 2654, |
| "2": 2948, |
| "3": 2337, |
| "4": 2381, |
| "5": 2519, |
| "6": 1992, |
| "7": 2148, |
| "8": 2061, |
| "9": 2161 |
| } |
| }, |
| "96": { |
| "head": { |
| "0": 9, |
| "1": 10, |
| "10": 11, |
| "11": 10, |
| "2": 9, |
| "3": 9, |
| "4": 9, |
| "5": 10, |
| "6": 11, |
| "7": 9, |
| "8": 9, |
| "9": 9 |
| }, |
| "hidden": { |
| "-1": 614, |
| "0": 614, |
| "1": 614, |
| "10": 614, |
| "11": 614, |
| "2": 614, |
| "3": 614, |
| "4": 614, |
| "5": 614, |
| "6": 614, |
| "7": 614, |
| "8": 614, |
| "9": 614 |
| }, |
| "neuron": { |
| "0": 2768, |
| "1": 2822, |
| "10": 2133, |
| "11": 2689, |
| "2": 2955, |
| "3": 2392, |
| "4": 2439, |
| "5": 2579, |
| "6": 2077, |
| "7": 2223, |
| "8": 2148, |
| "9": 2266 |
| } |
| }, |
| "97": { |
| "head": { |
| "0": 10, |
| "1": 10, |
| "10": 11, |
| "11": 10, |
| "2": 9, |
| "3": 9, |
| "4": 9, |
| "5": 10, |
| "6": 11, |
| "7": 10, |
| "8": 11, |
| "9": 10 |
| }, |
| "hidden": { |
| "-1": 637, |
| "0": 637, |
| "1": 637, |
| "10": 637, |
| "11": 637, |
| "2": 637, |
| "3": 637, |
| "4": 637, |
| "5": 637, |
| "6": 637, |
| "7": 637, |
| "8": 637, |
| "9": 637 |
| }, |
| "neuron": { |
| "0": 2799, |
| "1": 2846, |
| "10": 2294, |
| "11": 2746, |
| "2": 2970, |
| "3": 2487, |
| "4": 2537, |
| "5": 2656, |
| "6": 2207, |
| "7": 2355, |
| "8": 2291, |
| "9": 2409 |
| } |
| }, |
| "98": { |
| "head": { |
| "0": 11, |
| "1": 10, |
| "10": 11, |
| "11": 10, |
| "2": 10, |
| "3": 10, |
| "4": 10, |
| "5": 10, |
| "6": 11, |
| "7": 10, |
| "8": 11, |
| "9": 10 |
| }, |
| "hidden": { |
| "-1": 660, |
| "0": 660, |
| "1": 660, |
| "10": 660, |
| "11": 660, |
| "2": 660, |
| "3": 660, |
| "4": 660, |
| "5": 660, |
| "6": 660, |
| "7": 660, |
| "8": 660, |
| "9": 660 |
| }, |
| "neuron": { |
| "0": 2826, |
| "1": 2870, |
| "10": 2455, |
| "11": 2794, |
| "2": 2984, |
| "3": 2588, |
| "4": 2634, |
| "5": 2726, |
| "6": 2350, |
| "7": 2501, |
| "8": 2440, |
| "9": 2535 |
| } |
| }, |
| "99": { |
| "head": { |
| "0": 11, |
| "1": 10, |
| "10": 11, |
| "11": 11, |
| "2": 11, |
| "3": 11, |
| "4": 11, |
| "5": 11, |
| "6": 11, |
| "7": 11, |
| "8": 11, |
| "9": 10 |
| }, |
| "hidden": { |
| "-1": 691, |
| "0": 691, |
| "1": 691, |
| "10": 691, |
| "11": 691, |
| "2": 691, |
| "3": 691, |
| "4": 691, |
| "5": 691, |
| "6": 691, |
| "7": 691, |
| "8": 691, |
| "9": 691 |
| }, |
| "neuron": { |
| "0": 2861, |
| "1": 2915, |
| "10": 2683, |
| "11": 2862, |
| "2": 2998, |
| "3": 2709, |
| "4": 2746, |
| "5": 2845, |
| "6": 2551, |
| "7": 2678, |
| "8": 2635, |
| "9": 2695 |
| } |
| } |
| }, |
| "torch_dtype": "float32", |
| "transformers_version": "4.12.0", |
| "type_vocab_size": 2, |
| "use_cache": true, |
| "vocab_size": 30522 |
| } |
|
|