Upload model_metadata.json with huggingface_hub
Browse files- model_metadata.json +20 -12
model_metadata.json
CHANGED
|
@@ -1,14 +1,18 @@
|
|
| 1 |
{
|
| 2 |
-
"version": "clean-baseline-
|
| 3 |
"model": "vit_base_patch16_224",
|
| 4 |
-
"num_classes":
|
| 5 |
"class_names": [
|
| 6 |
"call",
|
| 7 |
"dislike",
|
| 8 |
"fist",
|
| 9 |
"four",
|
|
|
|
|
|
|
| 10 |
"like",
|
|
|
|
| 11 |
"mute",
|
|
|
|
| 12 |
"ok",
|
| 13 |
"one",
|
| 14 |
"palm",
|
|
@@ -19,22 +23,25 @@
|
|
| 19 |
"stop_inverted",
|
| 20 |
"three",
|
| 21 |
"three2",
|
|
|
|
| 22 |
"two_up",
|
| 23 |
"two_up_inverted"
|
| 24 |
],
|
| 25 |
"img_size": 224,
|
| 26 |
-
"test_accuracy": 0.
|
| 27 |
-
"confusion_matrix_diagonality":
|
| 28 |
"best_epoch": 15,
|
| 29 |
-
"best_val_acc":
|
| 30 |
-
"best_val_f1": 0.
|
| 31 |
"train_acc": 100.0,
|
| 32 |
"dataset": {
|
| 33 |
-
"name": "HaGRID
|
| 34 |
-
"source": "
|
| 35 |
-
"
|
| 36 |
-
"
|
| 37 |
-
"
|
|
|
|
|
|
|
| 38 |
},
|
| 39 |
"training_config": {
|
| 40 |
"batch_size": 32,
|
|
@@ -59,6 +66,7 @@
|
|
| 59 |
0.225
|
| 60 |
],
|
| 61 |
"augmentation": "none",
|
|
|
|
| 62 |
"tta": false
|
| 63 |
},
|
| 64 |
"architecture": {
|
|
@@ -67,5 +75,5 @@
|
|
| 67 |
"hidden_dim": null,
|
| 68 |
"dropout": 0.0
|
| 69 |
},
|
| 70 |
-
"timestamp": "2026-01-
|
| 71 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"version": "clean-baseline-v2.0-hf",
|
| 3 |
"model": "vit_base_patch16_224",
|
| 4 |
+
"num_classes": 23,
|
| 5 |
"class_names": [
|
| 6 |
"call",
|
| 7 |
"dislike",
|
| 8 |
"fist",
|
| 9 |
"four",
|
| 10 |
+
"grabbing",
|
| 11 |
+
"grip",
|
| 12 |
"like",
|
| 13 |
+
"middle_finger",
|
| 14 |
"mute",
|
| 15 |
+
"no_gesture",
|
| 16 |
"ok",
|
| 17 |
"one",
|
| 18 |
"palm",
|
|
|
|
| 23 |
"stop_inverted",
|
| 24 |
"three",
|
| 25 |
"three2",
|
| 26 |
+
"three3",
|
| 27 |
"two_up",
|
| 28 |
"two_up_inverted"
|
| 29 |
],
|
| 30 |
"img_size": 224,
|
| 31 |
+
"test_accuracy": 0.9248953459738981,
|
| 32 |
+
"confusion_matrix_diagonality": 92.4895345973898,
|
| 33 |
"best_epoch": 15,
|
| 34 |
+
"best_val_acc": 89.87750372454892,
|
| 35 |
+
"best_val_f1": 0.9248777400191369,
|
| 36 |
"train_acc": 100.0,
|
| 37 |
"dataset": {
|
| 38 |
+
"name": "HaGRID Subset",
|
| 39 |
+
"source": "local",
|
| 40 |
+
"path": "data/hagrid_subset",
|
| 41 |
+
"train_size": 103171,
|
| 42 |
+
"val_size": 12082,
|
| 43 |
+
"test_size": 20305,
|
| 44 |
+
"splits": "fixed"
|
| 45 |
},
|
| 46 |
"training_config": {
|
| 47 |
"batch_size": 32,
|
|
|
|
| 66 |
0.225
|
| 67 |
],
|
| 68 |
"augmentation": "none",
|
| 69 |
+
"rationale": "augmentation corrupts gesture semantics",
|
| 70 |
"tta": false
|
| 71 |
},
|
| 72 |
"architecture": {
|
|
|
|
| 75 |
"hidden_dim": null,
|
| 76 |
"dropout": 0.0
|
| 77 |
},
|
| 78 |
+
"timestamp": "2026-01-14T22:44:08.208470"
|
| 79 |
}
|