ViViT_lsa64_coR / config.json
Shawon16's picture
Training in progress, epoch 0
cc99ded verified
{
"_name_or_path": "google/vivit-b-16x2-kinetics400",
"architectures": [
"VivitForVideoClassification"
],
"attention_probs_dropout_prob": 0.0,
"hidden_act": "gelu_fast",
"hidden_dropout_prob": 0.0,
"hidden_size": 768,
"id2label": {
"0": "W1",
"1": "W10",
"2": "W11",
"3": "W12",
"4": "W13",
"5": "W14",
"6": "W15",
"7": "W16",
"8": "W17",
"9": "W18",
"10": "W19",
"11": "W2",
"12": "W20",
"13": "W21",
"14": "W22",
"15": "W23",
"16": "W24",
"17": "W25",
"18": "W26",
"19": "W27",
"20": "W28",
"21": "W29",
"22": "W3",
"23": "W30",
"24": "W31",
"25": "W32",
"26": "W33",
"27": "W34",
"28": "W35",
"29": "W36",
"30": "W37",
"31": "W38",
"32": "W39",
"33": "W4",
"34": "W40",
"35": "W41",
"36": "W42",
"37": "W43",
"38": "W44",
"39": "W45",
"40": "W46",
"41": "W47",
"42": "W48",
"43": "W49",
"44": "W5",
"45": "W50",
"46": "W51",
"47": "W52",
"48": "W53",
"49": "W54",
"50": "W55",
"51": "W56",
"52": "W57",
"53": "W58",
"54": "W59",
"55": "W6",
"56": "W60",
"57": "W61",
"58": "W62",
"59": "W63",
"60": "W64",
"61": "W7",
"62": "W8",
"63": "W9"
},
"image_size": 224,
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"W1": 0,
"W10": 1,
"W11": 2,
"W12": 3,
"W13": 4,
"W14": 5,
"W15": 6,
"W16": 7,
"W17": 8,
"W18": 9,
"W19": 10,
"W2": 11,
"W20": 12,
"W21": 13,
"W22": 14,
"W23": 15,
"W24": 16,
"W25": 17,
"W26": 18,
"W27": 19,
"W28": 20,
"W29": 21,
"W3": 22,
"W30": 23,
"W31": 24,
"W32": 25,
"W33": 26,
"W34": 27,
"W35": 28,
"W36": 29,
"W37": 30,
"W38": 31,
"W39": 32,
"W4": 33,
"W40": 34,
"W41": 35,
"W42": 36,
"W43": 37,
"W44": 38,
"W45": 39,
"W46": 40,
"W47": 41,
"W48": 42,
"W49": 43,
"W5": 44,
"W50": 45,
"W51": 46,
"W52": 47,
"W53": 48,
"W54": 49,
"W55": 50,
"W56": 51,
"W57": 52,
"W58": 53,
"W59": 54,
"W6": 55,
"W60": 56,
"W61": 57,
"W62": 58,
"W63": 59,
"W64": 60,
"W7": 61,
"W8": 62,
"W9": 63
},
"layer_norm_eps": 1e-06,
"model_type": "vivit",
"num_attention_heads": 12,
"num_channels": 3,
"num_frames": 32,
"num_hidden_layers": 12,
"qkv_bias": true,
"torch_dtype": "float32",
"transformers_version": "4.46.1",
"tubelet_size": [
2,
16,
16
],
"video_size": [
32,
224,
224
]
}