{
  "_name_or_path": "google/vivit-b-16x2-kinetics400",
  "architectures": [
    "VivitForVideoClassification"
  ],
  "attention_probs_dropout_prob": 0.0,
  "hidden_act": "gelu_fast",
  "hidden_dropout_prob": 0.0,
  "hidden_size": 768,
  "id2label": {
    "0": "W1",
    "1": "W10",
    "2": "W11",
    "3": "W12",
    "4": "W13",
    "5": "W14",
    "6": "W15",
    "7": "W16",
    "8": "W17",
    "9": "W18",
    "10": "W19",
    "11": "W2",
    "12": "W20",
    "13": "W21",
    "14": "W22",
    "15": "W23",
    "16": "W24",
    "17": "W25",
    "18": "W26",
    "19": "W27",
    "20": "W28",
    "21": "W29",
    "22": "W3",
    "23": "W30",
    "24": "W31",
    "25": "W32",
    "26": "W33",
    "27": "W34",
    "28": "W35",
    "29": "W36",
    "30": "W37",
    "31": "W38",
    "32": "W39",
    "33": "W4",
    "34": "W40",
    "35": "W41",
    "36": "W42",
    "37": "W43",
    "38": "W44",
    "39": "W45",
    "40": "W46",
    "41": "W47",
    "42": "W48",
    "43": "W49",
    "44": "W5",
    "45": "W50",
    "46": "W51",
    "47": "W52",
    "48": "W53",
    "49": "W54",
    "50": "W55",
    "51": "W56",
    "52": "W57",
    "53": "W58",
    "54": "W59",
    "55": "W6",
    "56": "W60",
    "57": "W61",
    "58": "W62",
    "59": "W63",
    "60": "W64",
    "61": "W7",
    "62": "W8",
    "63": "W9"
  },
  "image_size": 224,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "W1": 0,
    "W10": 1,
    "W11": 2,
    "W12": 3,
    "W13": 4,
    "W14": 5,
    "W15": 6,
    "W16": 7,
    "W17": 8,
    "W18": 9,
    "W19": 10,
    "W2": 11,
    "W20": 12,
    "W21": 13,
    "W22": 14,
    "W23": 15,
    "W24": 16,
    "W25": 17,
    "W26": 18,
    "W27": 19,
    "W28": 20,
    "W29": 21,
    "W3": 22,
    "W30": 23,
    "W31": 24,
    "W32": 25,
    "W33": 26,
    "W34": 27,
    "W35": 28,
    "W36": 29,
    "W37": 30,
    "W38": 31,
    "W39": 32,
    "W4": 33,
    "W40": 34,
    "W41": 35,
    "W42": 36,
    "W43": 37,
    "W44": 38,
    "W45": 39,
    "W46": 40,
    "W47": 41,
    "W48": 42,
    "W49": 43,
    "W5": 44,
    "W50": 45,
    "W51": 46,
    "W52": 47,
    "W53": 48,
    "W54": 49,
    "W55": 50,
    "W56": 51,
    "W57": 52,
    "W58": 53,
    "W59": 54,
    "W6": 55,
    "W60": 56,
    "W61": 57,
    "W62": 58,
    "W63": 59,
    "W64": 60,
    "W7": 61,
    "W8": 62,
    "W9": 63
  },
  "layer_norm_eps": 1e-06,
  "model_type": "vivit",
  "num_attention_heads": 12,
  "num_channels": 3,
  "num_frames": 32,
  "num_hidden_layers": 12,
  "qkv_bias": true,
  "torch_dtype": "float32",
  "transformers_version": "4.46.1",
  "tubelet_size": [
    2,
    16,
    16
  ],
  "video_size": [
    32,
    224,
    224
  ]
}