Mandour-101 committed on
Commit
d37998e
·
verified ·
1 Parent(s): 758fa2a

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. model.safetensors +1 -1
  2. optimizer.pt +1 -1
  3. rng_state.pth +1 -1
  4. scheduler.pt +1 -1
  5. trainer_state.json +103 -3
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06c46b31a595c9e3cacc33ae9ff0d04745cee24796af58038220f67a5fa33c36
3
  size 359190616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6753d3df8dfde0128bba6803bc18a080b76948952f20d94e4b277d3dd52b988
3
  size 359190616
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2582a72cfe28b6154411dfdf8976e7882bbd5caf3fa407d4a12c3bf9a2eeaeb6
3
  size 718509882
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f287f42962dbaffca0ab078583289297fa2017f47f973ae831779a8ce8ba446d
3
  size 718509882
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ecdb2aab127fdd4a50e882dca2103373b1eb980735e992800a6e69e40807b5c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eddd062c87af5cdb7eb6cacd39e60170f32e8ccbf9998f5ee427cf57e54f0d8
3
  size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53c92f011cd3caa037f9d6a8e340e59b8a7fe10331eb357c4ea4d3f3cdba14fb
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf07e257697ce1cc88d0a81710c44ebed4ed1f45a8a2905a95f4c93940bc6e95
3
  size 1064
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.967008960660055,
3
  "best_model_checkpoint": "/kaggle/working/mmoe_vit_results/checkpoint-24012",
4
- "epoch": 7.0,
5
  "eval_steps": 500,
6
- "global_step": 28014,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -707,6 +707,106 @@
707
  "eval_style_recall": 0.6907946008292029,
708
  "eval_style_weighted_f1": 0.6607505081198878,
709
  "step": 28014
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
710
  }
711
  ],
712
  "logging_steps": 500,
@@ -721,7 +821,7 @@
721
  "early_stopping_threshold": 0.0
722
  },
723
  "attributes": {
724
- "early_stopping_patience_counter": 1
725
  }
726
  },
727
  "TrainerControl": {
 
1
  {
2
  "best_metric": 0.967008960660055,
3
  "best_model_checkpoint": "/kaggle/working/mmoe_vit_results/checkpoint-24012",
4
+ "epoch": 8.0,
5
  "eval_steps": 500,
6
+ "global_step": 32016,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
707
  "eval_style_recall": 0.6907946008292029,
708
  "eval_style_weighted_f1": 0.6607505081198878,
709
  "step": 28014
710
+ },
711
+ {
712
+ "epoch": 7.12143928035982,
713
+ "grad_norm": 43.210941314697266,
714
+ "learning_rate": 1.4574898785425101e-05,
715
+ "loss": 3.7497,
716
+ "step": 28500
717
+ },
718
+ {
719
+ "epoch": 7.246376811594203,
720
+ "grad_norm": 34.3553352355957,
721
+ "learning_rate": 1.3942307692307693e-05,
722
+ "loss": 3.8133,
723
+ "step": 29000
724
+ },
725
+ {
726
+ "epoch": 7.371314342828586,
727
+ "grad_norm": 38.11077880859375,
728
+ "learning_rate": 1.3309716599190283e-05,
729
+ "loss": 3.8536,
730
+ "step": 29500
731
+ },
732
+ {
733
+ "epoch": 7.496251874062969,
734
+ "grad_norm": 34.092018127441406,
735
+ "learning_rate": 1.2677125506072876e-05,
736
+ "loss": 3.8057,
737
+ "step": 30000
738
+ },
739
+ {
740
+ "epoch": 7.6211894052973514,
741
+ "grad_norm": 31.957683563232422,
742
+ "learning_rate": 1.2044534412955466e-05,
743
+ "loss": 3.813,
744
+ "step": 30500
745
+ },
746
+ {
747
+ "epoch": 7.746126936531734,
748
+ "grad_norm": 34.03321075439453,
749
+ "learning_rate": 1.1411943319838058e-05,
750
+ "loss": 3.7924,
751
+ "step": 31000
752
+ },
753
+ {
754
+ "epoch": 7.871064467766117,
755
+ "grad_norm": 38.06154251098633,
756
+ "learning_rate": 1.077935222672065e-05,
757
+ "loss": 3.8135,
758
+ "step": 31500
759
+ },
760
+ {
761
+ "epoch": 7.9960019990005,
762
+ "grad_norm": 45.78370666503906,
763
+ "learning_rate": 1.014676113360324e-05,
764
+ "loss": 3.7866,
765
+ "step": 32000
766
+ },
767
+ {
768
+ "epoch": 8.0,
769
+ "eval_category_macro_f1": 0.8146478162196177,
770
+ "eval_category_precision": 0.9667355952687459,
771
+ "eval_category_recall": 0.9672059602855451,
772
+ "eval_category_weighted_f1": 0.9666613335359282,
773
+ "eval_color_macro_f1": 0.494972223269362,
774
+ "eval_color_precision": 0.8179178024945392,
775
+ "eval_color_recall": 0.8253686212163721,
776
+ "eval_color_weighted_f1": 0.8171143847468179,
777
+ "eval_gender_macro_f1": 0.726822473815732,
778
+ "eval_gender_precision": 0.9595388610516349,
779
+ "eval_gender_recall": 0.9593503538140217,
780
+ "eval_gender_weighted_f1": 0.9590467785701566,
781
+ "eval_loss": 6.086089134216309,
782
+ "eval_material_macro_f1": 0.4653083418810649,
783
+ "eval_material_precision": 0.6660165608707495,
784
+ "eval_material_recall": 0.6859316063468313,
785
+ "eval_material_weighted_f1": 0.6641222350586232,
786
+ "eval_neck_macro_f1": 0.3385488552152788,
787
+ "eval_neck_precision": 0.8103884255493873,
788
+ "eval_neck_recall": 0.8168272078306681,
789
+ "eval_neck_weighted_f1": 0.8100463958001771,
790
+ "eval_pattern_macro_f1": 0.29354348124717355,
791
+ "eval_pattern_precision": 0.6421689432624941,
792
+ "eval_pattern_recall": 0.6699398360298014,
793
+ "eval_pattern_weighted_f1": 0.6249061713173589,
794
+ "eval_product_type_macro_f1": 0.750138460482341,
795
+ "eval_product_type_precision": 0.7549316716640776,
796
+ "eval_product_type_recall": 0.7525795691885657,
797
+ "eval_product_type_weighted_f1": 0.7506829441074545,
798
+ "eval_runtime": 301.8256,
799
+ "eval_samples_per_second": 106.283,
800
+ "eval_sleeve_macro_f1": 0.4663248985167306,
801
+ "eval_sleeve_precision": 0.8591320313081251,
802
+ "eval_sleeve_recall": 0.86252688674834,
803
+ "eval_sleeve_weighted_f1": 0.8568151400744953,
804
+ "eval_steps_per_second": 1.663,
805
+ "eval_style_macro_f1": 0.3329861421512565,
806
+ "eval_style_precision": 0.6707667240667725,
807
+ "eval_style_recall": 0.6972162473892578,
808
+ "eval_style_weighted_f1": 0.6732692090638879,
809
+ "step": 32016
810
  }
811
  ],
812
  "logging_steps": 500,
 
821
  "early_stopping_threshold": 0.0
822
  },
823
  "attributes": {
824
+ "early_stopping_patience_counter": 2
825
  }
826
  },
827
  "TrainerControl": {