Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

config.json +33 -0
model.safetensors +3 -0
optimizer.pt +3 -0
rng_state.pth +3 -0
scaler.pt +3 -0
scheduler.pt +3 -0
trainer_state.json +174 -0
training_args.bin +3 -0

config.json ADDED Viewed

	@@ -0,0 +1,33 @@

+{
+  "architectures": [
+    "ViTForImageClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "encoder_stride": 16,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "None",
+    "1": "Roadwork"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "None": 0,
+    "Roadwork": 1
+  },
+  "layer_norm_eps": 1e-12,
+  "model_type": "vit",
+  "num_attention_heads": 12,
+  "num_channels": 3,
+  "num_hidden_layers": 12,
+  "patch_size": 16,
+  "pooler_act": "tanh",
+  "pooler_output_size": 768,
+  "problem_type": "single_label_classification",
+  "qkv_bias": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.54.1"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8843c350d99104da5899e9c27ac3380dd82fcc187c2ed546d6f0226b97b0ce05
+size 343223968

optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c9f75a3ae0f2f2a51b0f896fdd0a811b4d0e36be555cf30eb362d14cfbbbb34
+size 686569355

rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fdc37bbd2e979f041dfbbb004a5c74bab6cdda159cb18116df728588515a9ef6
+size 14645

scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c9eb4a7998667daadb245e0bbc5cdaa1499dd6aee017b2c33ea5d2fd3585afcb
+size 1383

scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a328c9dba7f609bf83154e6380f5a4065921ba2889951d051233aeb5a023a13a
+size 1465

trainer_state.json ADDED Viewed

	@@ -0,0 +1,174 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.557544757033248,
+  "eval_steps": 500,
+  "global_step": 1000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.1278772378516624,
+      "grad_norm": 0.15987633168697357,
+      "learning_rate": 1.9498721227621484e-05,
+      "loss": 0.0362,
+      "step": 50
+    },
+    {
+      "epoch": 0.2557544757033248,
+      "grad_norm": 0.04608326032757759,
+      "learning_rate": 1.8987212276214835e-05,
+      "loss": 0.0168,
+      "step": 100
+    },
+    {
+      "epoch": 0.3836317135549872,
+      "grad_norm": 0.03889036923646927,
+      "learning_rate": 1.8475703324808185e-05,
+      "loss": 0.0254,
+      "step": 150
+    },
+    {
+      "epoch": 0.5115089514066496,
+      "grad_norm": 0.05562173202633858,
+      "learning_rate": 1.7964194373401536e-05,
+      "loss": 0.0502,
+      "step": 200
+    },
+    {
+      "epoch": 0.639386189258312,
+      "grad_norm": 0.11458363384008408,
+      "learning_rate": 1.7452685421994886e-05,
+      "loss": 0.0353,
+      "step": 250
+    },
+    {
+      "epoch": 0.7672634271099744,
+      "grad_norm": 0.0313524566590786,
+      "learning_rate": 1.6941176470588237e-05,
+      "loss": 0.0423,
+      "step": 300
+    },
+    {
+      "epoch": 0.8951406649616368,
+      "grad_norm": 0.06919269263744354,
+      "learning_rate": 1.6429667519181587e-05,
+      "loss": 0.0414,
+      "step": 350
+    },
+    {
+      "epoch": 1.0230179028132993,
+      "grad_norm": 0.04081420600414276,
+      "learning_rate": 1.5918158567774937e-05,
+      "loss": 0.0444,
+      "step": 400
+    },
+    {
+      "epoch": 1.1508951406649617,
+      "grad_norm": 0.2047465294599533,
+      "learning_rate": 1.5406649616368288e-05,
+      "loss": 0.0103,
+      "step": 450
+    },
+    {
+      "epoch": 1.278772378516624,
+      "grad_norm": 0.025791389867663383,
+      "learning_rate": 1.4895140664961638e-05,
+      "loss": 0.0209,
+      "step": 500
+    },
+    {
+      "epoch": 1.4066496163682864,
+      "grad_norm": 0.9749135375022888,
+      "learning_rate": 1.4383631713554989e-05,
+      "loss": 0.0443,
+      "step": 550
+    },
+    {
+      "epoch": 1.5345268542199488,
+      "grad_norm": 0.049570031464099884,
+      "learning_rate": 1.3872122762148339e-05,
+      "loss": 0.0334,
+      "step": 600
+    },
+    {
+      "epoch": 1.6624040920716112,
+      "grad_norm": 0.03414261341094971,
+      "learning_rate": 1.336061381074169e-05,
+      "loss": 0.0263,
+      "step": 650
+    },
+    {
+      "epoch": 1.7902813299232738,
+      "grad_norm": 0.05060505494475365,
+      "learning_rate": 1.284910485933504e-05,
+      "loss": 0.0324,
+      "step": 700
+    },
+    {
+      "epoch": 1.918158567774936,
+      "grad_norm": 0.02642514370381832,
+      "learning_rate": 1.233759590792839e-05,
+      "loss": 0.0135,
+      "step": 750
+    },
+    {
+      "epoch": 2.0460358056265986,
+      "grad_norm": 0.025779355317354202,
+      "learning_rate": 1.182608695652174e-05,
+      "loss": 0.0077,
+      "step": 800
+    },
+    {
+      "epoch": 2.1739130434782608,
+      "grad_norm": 0.02975759282708168,
+      "learning_rate": 1.1314578005115091e-05,
+      "loss": 0.019,
+      "step": 850
+    },
+    {
+      "epoch": 2.3017902813299234,
+      "grad_norm": 0.022426923736929893,
+      "learning_rate": 1.0803069053708442e-05,
+      "loss": 0.0122,
+      "step": 900
+    },
+    {
+      "epoch": 2.4296675191815855,
+      "grad_norm": 0.02004999853670597,
+      "learning_rate": 1.0291560102301792e-05,
+      "loss": 0.0067,
+      "step": 950
+    },
+    {
+      "epoch": 2.557544757033248,
+      "grad_norm": 0.01824093610048294,
+      "learning_rate": 9.78005115089514e-06,
+      "loss": 0.0266,
+      "step": 1000
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 1955,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.239096913937326e+18,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:615105cb107136a134e557122fa967775525dec789d861404c226201990552bb
+size 5713