vit-food-classifier / config.json
Nav772's picture
Upload ViTForImageClassification
edad6a6 verified
{
"architectures": [
"ViTForImageClassification"
],
"attention_probs_dropout_prob": 0.0,
"dtype": "float32",
"encoder_stride": 16,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.0,
"hidden_size": 768,
"id2label": {
"0": "pizza",
"1": "sushi",
"2": "hamburger",
"3": "ice_cream",
"4": "steak",
"5": "baklava",
"6": "cheesecake",
"7": "pancakes",
"8": "tacos",
"9": "ramen"
},
"image_size": 224,
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"baklava": 5,
"cheesecake": 6,
"hamburger": 2,
"ice_cream": 3,
"pancakes": 7,
"pizza": 0,
"ramen": 9,
"steak": 4,
"sushi": 1,
"tacos": 8
},
"layer_norm_eps": 1e-12,
"model_type": "vit",
"num_attention_heads": 12,
"num_channels": 3,
"num_hidden_layers": 12,
"patch_size": 16,
"pooler_act": "tanh",
"pooler_output_size": 768,
"problem_type": "single_label_classification",
"qkv_bias": true,
"transformers_version": "4.57.3"
}