Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

checkpoint-24210/config.json +34 -0
checkpoint-24210/model.safetensors +3 -0
checkpoint-24210/optimizer.pt +3 -0
checkpoint-24210/preprocessor_config.json +22 -0
checkpoint-24210/rng_state.pth +3 -0
checkpoint-24210/scheduler.pt +3 -0
checkpoint-24210/trainer_state.json +389 -0
checkpoint-24210/training_args.bin +3 -0
model.safetensors +1 -1
training_args.bin +1 -1

checkpoint-24210/config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "_name_or_path": "google/vit-base-patch16-224-in21k",
+  "architectures": [
+    "ViTForImageClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "encoder_stride": 16,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "E",
+    "1": "S",
+    "2": "SB"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "E": 0,
+    "S": 1,
+    "SB": 2
+  },
+  "layer_norm_eps": 1e-12,
+  "model_type": "vit",
+  "num_attention_heads": 12,
+  "num_channels": 3,
+  "num_hidden_layers": 12,
+  "patch_size": 16,
+  "problem_type": "single_label_classification",
+  "qkv_bias": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2"
+}

checkpoint-24210/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91001fd450cf249ae5c849d6bc453dc30f7e594fa3c979545b1a5b8f115a0ed1
+size 343227052

checkpoint-24210/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1ed6281857a911e48ae5de7855cc5131736648638d7ea9c6aee660ac97069b6
+size 686574597

checkpoint-24210/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "image_processor_type": "ViTImageProcessor",
+  "image_std": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  }
+}

checkpoint-24210/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3af11ab9a843e81e9d44e6005748a0cf3748150753f1cbd67e098fd2b0e3a04d
+size 14575

checkpoint-24210/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca28fab56fe5c8ab4d1509bb1513b3a4ca2f62bef704f72a600e08d39e183f04
+size 627

checkpoint-24210/trainer_state.json ADDED Viewed

	@@ -0,0 +1,389 @@

+{
+  "best_metric": 0.5134674906730652,
+  "best_model_checkpoint": "galaxy_type_image_detection/checkpoint-24210",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 24210,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.041305245766212306,
+      "grad_norm": 2.052537679672241,
+      "learning_rate": 9.813741721854305e-07,
+      "loss": 0.9706,
+      "step": 500
+    },
+    {
+      "epoch": 0.08261049153242461,
+      "grad_norm": 1.7964216470718384,
+      "learning_rate": 9.606788079470197e-07,
+      "loss": 0.805,
+      "step": 1000
+    },
+    {
+      "epoch": 0.12391573729863693,
+      "grad_norm": 2.35636043548584,
+      "learning_rate": 9.399834437086093e-07,
+      "loss": 0.7313,
+      "step": 1500
+    },
+    {
+      "epoch": 0.16522098306484923,
+      "grad_norm": 4.531991958618164,
+      "learning_rate": 9.192880794701986e-07,
+      "loss": 0.6929,
+      "step": 2000
+    },
+    {
+      "epoch": 0.20652622883106153,
+      "grad_norm": 2.8686130046844482,
+      "learning_rate": 8.98592715231788e-07,
+      "loss": 0.6575,
+      "step": 2500
+    },
+    {
+      "epoch": 0.24783147459727387,
+      "grad_norm": 3.747077703475952,
+      "learning_rate": 8.778973509933775e-07,
+      "loss": 0.6312,
+      "step": 3000
+    },
+    {
+      "epoch": 0.28913672036348614,
+      "grad_norm": 3.5423054695129395,
+      "learning_rate": 8.572019867549668e-07,
+      "loss": 0.6236,
+      "step": 3500
+    },
+    {
+      "epoch": 0.33044196612969845,
+      "grad_norm": 2.6661975383758545,
+      "learning_rate": 8.365066225165562e-07,
+      "loss": 0.6119,
+      "step": 4000
+    },
+    {
+      "epoch": 0.37174721189591076,
+      "grad_norm": 2.6772751808166504,
+      "learning_rate": 8.158112582781457e-07,
+      "loss": 0.5979,
+      "step": 4500
+    },
+    {
+      "epoch": 0.41305245766212306,
+      "grad_norm": 4.741942405700684,
+      "learning_rate": 7.951158940397351e-07,
+      "loss": 0.5926,
+      "step": 5000
+    },
+    {
+      "epoch": 0.4543577034283354,
+      "grad_norm": 4.627604007720947,
+      "learning_rate": 7.744205298013245e-07,
+      "loss": 0.5801,
+      "step": 5500
+    },
+    {
+      "epoch": 0.49566294919454773,
+      "grad_norm": 3.0113418102264404,
+      "learning_rate": 7.537251655629138e-07,
+      "loss": 0.5736,
+      "step": 6000
+    },
+    {
+      "epoch": 0.53696819496076,
+      "grad_norm": 4.815735340118408,
+      "learning_rate": 7.330298013245033e-07,
+      "loss": 0.5702,
+      "step": 6500
+    },
+    {
+      "epoch": 0.5782734407269723,
+      "grad_norm": 3.646869421005249,
+      "learning_rate": 7.123344370860927e-07,
+      "loss": 0.5651,
+      "step": 7000
+    },
+    {
+      "epoch": 0.6195786864931846,
+      "grad_norm": 4.093480587005615,
+      "learning_rate": 6.916390728476821e-07,
+      "loss": 0.559,
+      "step": 7500
+    },
+    {
+      "epoch": 0.6608839322593969,
+      "grad_norm": 3.088358163833618,
+      "learning_rate": 6.709437086092715e-07,
+      "loss": 0.561,
+      "step": 8000
+    },
+    {
+      "epoch": 0.7021891780256092,
+      "grad_norm": 3.7480947971343994,
+      "learning_rate": 6.502483443708608e-07,
+      "loss": 0.5485,
+      "step": 8500
+    },
+    {
+      "epoch": 0.7434944237918215,
+      "grad_norm": 3.2563865184783936,
+      "learning_rate": 6.295529801324503e-07,
+      "loss": 0.5479,
+      "step": 9000
+    },
+    {
+      "epoch": 0.7847996695580338,
+      "grad_norm": 3.8188157081604004,
+      "learning_rate": 6.088576158940398e-07,
+      "loss": 0.546,
+      "step": 9500
+    },
+    {
+      "epoch": 0.8261049153242461,
+      "grad_norm": 5.6608147621154785,
+      "learning_rate": 5.881622516556291e-07,
+      "loss": 0.5454,
+      "step": 10000
+    },
+    {
+      "epoch": 0.8674101610904585,
+      "grad_norm": 3.919110059738159,
+      "learning_rate": 5.674668874172185e-07,
+      "loss": 0.5385,
+      "step": 10500
+    },
+    {
+      "epoch": 0.9087154068566708,
+      "grad_norm": 3.518577814102173,
+      "learning_rate": 5.46771523178808e-07,
+      "loss": 0.5407,
+      "step": 11000
+    },
+    {
+      "epoch": 0.9500206526228832,
+      "grad_norm": 4.594565391540527,
+      "learning_rate": 5.260761589403974e-07,
+      "loss": 0.5378,
+      "step": 11500
+    },
+    {
+      "epoch": 0.9913258983890955,
+      "grad_norm": 5.844511032104492,
+      "learning_rate": 5.053807947019867e-07,
+      "loss": 0.5347,
+      "step": 12000
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.774586746456075,
+      "eval_loss": 0.5334413647651672,
+      "eval_model_preparation_time": 0.0052,
+      "eval_runtime": 398.4848,
+      "eval_samples_per_second": 102.323,
+      "eval_steps_per_second": 3.2,
+      "step": 12105
+    },
+    {
+      "epoch": 1.0326311441553078,
+      "grad_norm": 4.9089179039001465,
+      "learning_rate": 4.846854304635761e-07,
+      "loss": 0.5274,
+      "step": 12500
+    },
+    {
+      "epoch": 1.07393638992152,
+      "grad_norm": 5.5489325523376465,
+      "learning_rate": 4.6399006622516554e-07,
+      "loss": 0.5252,
+      "step": 13000
+    },
+    {
+      "epoch": 1.1152416356877324,
+      "grad_norm": 3.628629207611084,
+      "learning_rate": 4.4329470198675495e-07,
+      "loss": 0.5269,
+      "step": 13500
+    },
+    {
+      "epoch": 1.1565468814539446,
+      "grad_norm": 3.0863559246063232,
+      "learning_rate": 4.225993377483443e-07,
+      "loss": 0.5294,
+      "step": 14000
+    },
+    {
+      "epoch": 1.197852127220157,
+      "grad_norm": 3.804537773132324,
+      "learning_rate": 4.0190397350993377e-07,
+      "loss": 0.527,
+      "step": 14500
+    },
+    {
+      "epoch": 1.2391573729863692,
+      "grad_norm": 3.9841179847717285,
+      "learning_rate": 3.8120860927152313e-07,
+      "loss": 0.5199,
+      "step": 15000
+    },
+    {
+      "epoch": 1.2804626187525816,
+      "grad_norm": 6.212009906768799,
+      "learning_rate": 3.605132450331126e-07,
+      "loss": 0.5262,
+      "step": 15500
+    },
+    {
+      "epoch": 1.3217678645187938,
+      "grad_norm": 2.9575085639953613,
+      "learning_rate": 3.3981788079470195e-07,
+      "loss": 0.5271,
+      "step": 16000
+    },
+    {
+      "epoch": 1.3630731102850062,
+      "grad_norm": 6.535609722137451,
+      "learning_rate": 3.1912251655629136e-07,
+      "loss": 0.5128,
+      "step": 16500
+    },
+    {
+      "epoch": 1.4043783560512186,
+      "grad_norm": 3.2392661571502686,
+      "learning_rate": 2.9842715231788077e-07,
+      "loss": 0.5211,
+      "step": 17000
+    },
+    {
+      "epoch": 1.4456836018174308,
+      "grad_norm": 3.6159918308258057,
+      "learning_rate": 2.777317880794702e-07,
+      "loss": 0.5198,
+      "step": 17500
+    },
+    {
+      "epoch": 1.486988847583643,
+      "grad_norm": 4.245410919189453,
+      "learning_rate": 2.570364238410596e-07,
+      "loss": 0.5179,
+      "step": 18000
+    },
+    {
+      "epoch": 1.5282940933498554,
+      "grad_norm": 4.863912105560303,
+      "learning_rate": 2.36341059602649e-07,
+      "loss": 0.5189,
+      "step": 18500
+    },
+    {
+      "epoch": 1.5695993391160679,
+      "grad_norm": 4.745334625244141,
+      "learning_rate": 2.156456953642384e-07,
+      "loss": 0.5141,
+      "step": 19000
+    },
+    {
+      "epoch": 1.61090458488228,
+      "grad_norm": 5.639151096343994,
+      "learning_rate": 1.9495033112582782e-07,
+      "loss": 0.5157,
+      "step": 19500
+    },
+    {
+      "epoch": 1.6522098306484923,
+      "grad_norm": 3.5343689918518066,
+      "learning_rate": 1.742549668874172e-07,
+      "loss": 0.5172,
+      "step": 20000
+    },
+    {
+      "epoch": 1.6935150764147047,
+      "grad_norm": 3.778491735458374,
+      "learning_rate": 1.5355960264900662e-07,
+      "loss": 0.5173,
+      "step": 20500
+    },
+    {
+      "epoch": 1.734820322180917,
+      "grad_norm": 3.17097806930542,
+      "learning_rate": 1.3286423841059603e-07,
+      "loss": 0.5119,
+      "step": 21000
+    },
+    {
+      "epoch": 1.7761255679471293,
+      "grad_norm": 4.683322906494141,
+      "learning_rate": 1.1216887417218542e-07,
+      "loss": 0.5172,
+      "step": 21500
+    },
+    {
+      "epoch": 1.8174308137133415,
+      "grad_norm": 5.71618127822876,
+      "learning_rate": 9.147350993377482e-08,
+      "loss": 0.5105,
+      "step": 22000
+    },
+    {
+      "epoch": 1.858736059479554,
+      "grad_norm": 4.671562671661377,
+      "learning_rate": 7.077814569536423e-08,
+      "loss": 0.5154,
+      "step": 22500
+    },
+    {
+      "epoch": 1.9000413052457663,
+      "grad_norm": 4.385097503662109,
+      "learning_rate": 5.008278145695364e-08,
+      "loss": 0.5126,
+      "step": 23000
+    },
+    {
+      "epoch": 1.9413465510119785,
+      "grad_norm": 3.7954232692718506,
+      "learning_rate": 2.9387417218543044e-08,
+      "loss": 0.511,
+      "step": 23500
+    },
+    {
+      "epoch": 1.9826517967781907,
+      "grad_norm": 5.682091236114502,
+      "learning_rate": 8.69205298013245e-09,
+      "loss": 0.5168,
+      "step": 24000
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7810859861676559,
+      "eval_loss": 0.5134674906730652,
+      "eval_model_preparation_time": 0.0052,
+      "eval_runtime": 395.5533,
+      "eval_samples_per_second": 103.081,
+      "eval_steps_per_second": 3.223,
+      "step": 24210
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 24210,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.2006545998417342e+20,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-24210/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:200be95460fb1d796a36a6316c5c1e2982d1d3cc913cf467667e59fa3ddc9cbe
+size 4667

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b33b2b1054d985b32e22181fbf4e011685b83317ec0dac8a1ee688ac78a0142c
 size 343227052

 version https://git-lfs.github.com/spec/v1
+oid sha256:91001fd450cf249ae5c849d6bc453dc30f7e594fa3c979545b1a5b8f115a0ed1
 size 343227052

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b6dc03e977829a9fe1632bfde9dc8286b9b4d9e269bca46e17c31045d8f211d2
 size 4667

 version https://git-lfs.github.com/spec/v1
+oid sha256:200be95460fb1d796a36a6316c5c1e2982d1d3cc913cf467667e59fa3ddc9cbe
 size 4667