End of training
Browse files- README.md +24 -5
- all_results.json +6 -6
- config.json +1 -0
- eval_results.json +3 -3
- runs/Mar02_14-41-50_04f752329dca/events.out.tfevents.1709390811.04f752329dca.283.1 +3 -0
- train_results.json +3 -3
- trainer_state.json +3 -3
README.md
CHANGED
|
@@ -2,23 +2,42 @@
|
|
| 2 |
license: apache-2.0
|
| 3 |
base_model: facebook/deit-base-distilled-patch16-224
|
| 4 |
tags:
|
|
|
|
|
|
|
| 5 |
- generated_from_trainer
|
| 6 |
metrics:
|
| 7 |
- accuracy
|
| 8 |
model-index:
|
| 9 |
-
- name: base
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
results: []
|
| 11 |
---
|
| 12 |
|
| 13 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
| 14 |
should probably proofread and complete it, then remove this comment. -->
|
| 15 |
|
| 16 |
-
# base
|
| 17 |
-
|
| 18 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 19 |
It achieves the following results on the evaluation set:
|
| 20 |
-
- Accuracy: 0.906
|
| 21 |
- Loss: 0.3054
|
|
|
|
| 22 |
|
| 23 |
## Model description
|
| 24 |
|
|
|
|
| 2 |
license: apache-2.0
|
| 3 |
base_model: facebook/deit-base-distilled-patch16-224
|
| 4 |
tags:
|
| 5 |
+
- image-classification
|
| 6 |
+
- vision
|
| 7 |
- generated_from_trainer
|
| 8 |
metrics:
|
| 9 |
- accuracy
|
| 10 |
model-index:
|
| 11 |
+
- name: "DeiT-base-DatasetDict({\n train: Dataset({\n features: ['img',\
|
| 12 |
+
\ 'fine_label', 'coarse_label'],\n num_rows: 50000\n })\n test: Dataset({\n\
|
| 13 |
+
\ features: ['img', 'fine_label', 'coarse_label'],\n num_rows: 10000\n\
|
| 14 |
+
\ })\n validation: Dataset({\n features: ['img', 'fine_label', 'coarse_label'],\n\
|
| 15 |
+
\ num_rows: 10000\n })\n})"
|
| 16 |
results: []
|
| 17 |
---
|
| 18 |
|
| 19 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
| 20 |
should probably proofread and complete it, then remove this comment. -->
|
| 21 |
|
| 22 |
+
# DeiT-base-DatasetDict({
|
| 23 |
+
train: Dataset({
|
| 24 |
+
features: ['img', 'fine_label', 'coarse_label'],
|
| 25 |
+
num_rows: 50000
|
| 26 |
+
})
|
| 27 |
+
test: Dataset({
|
| 28 |
+
features: ['img', 'fine_label', 'coarse_label'],
|
| 29 |
+
num_rows: 10000
|
| 30 |
+
})
|
| 31 |
+
validation: Dataset({
|
| 32 |
+
features: ['img', 'fine_label', 'coarse_label'],
|
| 33 |
+
num_rows: 10000
|
| 34 |
+
})
|
| 35 |
+
})
|
| 36 |
+
|
| 37 |
+
This model is a fine-tuned version of [facebook/deit-base-distilled-patch16-224](https://huggingface.co/facebook/deit-base-distilled-patch16-224) on the cifar100 dataset.
|
| 38 |
It achieves the following results on the evaluation set:
|
|
|
|
| 39 |
- Loss: 0.3054
|
| 40 |
+
- Accuracy: 0.906
|
| 41 |
|
| 42 |
## Model description
|
| 43 |
|
all_results.json
CHANGED
|
@@ -2,12 +2,12 @@
|
|
| 2 |
"epoch": 10.0,
|
| 3 |
"eval_accuracy": 0.906,
|
| 4 |
"eval_loss": 0.3053509294986725,
|
| 5 |
-
"eval_runtime":
|
| 6 |
-
"eval_samples_per_second":
|
| 7 |
-
"eval_steps_per_second":
|
| 8 |
"total_flos": 3.8815447523328e+19,
|
| 9 |
"train_loss": 0.0,
|
| 10 |
-
"train_runtime":
|
| 11 |
-
"train_samples_per_second":
|
| 12 |
-
"train_steps_per_second":
|
| 13 |
}
|
|
|
|
| 2 |
"epoch": 10.0,
|
| 3 |
"eval_accuracy": 0.906,
|
| 4 |
"eval_loss": 0.3053509294986725,
|
| 5 |
+
"eval_runtime": 175.7662,
|
| 6 |
+
"eval_samples_per_second": 56.894,
|
| 7 |
+
"eval_steps_per_second": 56.894,
|
| 8 |
"total_flos": 3.8815447523328e+19,
|
| 9 |
"train_loss": 0.0,
|
| 10 |
+
"train_runtime": 36.1375,
|
| 11 |
+
"train_samples_per_second": 13836.038,
|
| 12 |
+
"train_steps_per_second": 216.396
|
| 13 |
}
|
config.json
CHANGED
|
@@ -222,6 +222,7 @@
|
|
| 222 |
"num_channels": 3,
|
| 223 |
"num_hidden_layers": 12,
|
| 224 |
"patch_size": 16,
|
|
|
|
| 225 |
"qkv_bias": true,
|
| 226 |
"torch_dtype": "float32",
|
| 227 |
"transformers_version": "4.38.1"
|
|
|
|
| 222 |
"num_channels": 3,
|
| 223 |
"num_hidden_layers": 12,
|
| 224 |
"patch_size": 16,
|
| 225 |
+
"problem_type": "single_label_classification",
|
| 226 |
"qkv_bias": true,
|
| 227 |
"torch_dtype": "float32",
|
| 228 |
"transformers_version": "4.38.1"
|
eval_results.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"epoch": 10.0,
|
| 3 |
"eval_accuracy": 0.906,
|
| 4 |
"eval_loss": 0.3053509294986725,
|
| 5 |
-
"eval_runtime":
|
| 6 |
-
"eval_samples_per_second":
|
| 7 |
-
"eval_steps_per_second":
|
| 8 |
}
|
|
|
|
| 2 |
"epoch": 10.0,
|
| 3 |
"eval_accuracy": 0.906,
|
| 4 |
"eval_loss": 0.3053509294986725,
|
| 5 |
+
"eval_runtime": 175.7662,
|
| 6 |
+
"eval_samples_per_second": 56.894,
|
| 7 |
+
"eval_steps_per_second": 56.894
|
| 8 |
}
|
runs/Mar02_14-41-50_04f752329dca/events.out.tfevents.1709390811.04f752329dca.283.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:898c1208cdb37723a8396fc5cc641298180de02118c7a73d681bd6295c943afd
|
| 3 |
+
size 411
|
train_results.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"epoch": 10.0,
|
| 3 |
"total_flos": 3.8815447523328e+19,
|
| 4 |
"train_loss": 0.0,
|
| 5 |
-
"train_runtime":
|
| 6 |
-
"train_samples_per_second":
|
| 7 |
-
"train_steps_per_second":
|
| 8 |
}
|
|
|
|
| 2 |
"epoch": 10.0,
|
| 3 |
"total_flos": 3.8815447523328e+19,
|
| 4 |
"train_loss": 0.0,
|
| 5 |
+
"train_runtime": 36.1375,
|
| 6 |
+
"train_samples_per_second": 13836.038,
|
| 7 |
+
"train_steps_per_second": 216.396
|
| 8 |
}
|
trainer_state.json
CHANGED
|
@@ -1039,9 +1039,9 @@
|
|
| 1039 |
"step": 7820,
|
| 1040 |
"total_flos": 3.8815447523328e+19,
|
| 1041 |
"train_loss": 0.0,
|
| 1042 |
-
"train_runtime":
|
| 1043 |
-
"train_samples_per_second":
|
| 1044 |
-
"train_steps_per_second":
|
| 1045 |
}
|
| 1046 |
],
|
| 1047 |
"logging_steps": 50,
|
|
|
|
| 1039 |
"step": 7820,
|
| 1040 |
"total_flos": 3.8815447523328e+19,
|
| 1041 |
"train_loss": 0.0,
|
| 1042 |
+
"train_runtime": 36.1375,
|
| 1043 |
+
"train_samples_per_second": 13836.038,
|
| 1044 |
+
"train_steps_per_second": 216.396
|
| 1045 |
}
|
| 1046 |
],
|
| 1047 |
"logging_steps": 50,
|