Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
818fd84
·
1 Parent(s): 7cd08af

Training in progress, step 400000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e4182e3962d3a040ab734b61da56d604a525bd5f2d61cf2e3f5b36f5f0ee5bc
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c173163e338165d1fe37ba14405dbe53b272a5ca3e52267ff5c851a862f35da2
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf099ec439cbdff64f3d3b55ea1f32c5386c40432f4a5418054927a7f60a7a71
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e086dc2588b852e6182d32ad6ab8f484673dafebd51e08d7a801497b43f4fe30
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c992fbbd7cb3ac4ba0d93a3c933e4f1384224ccab41105813a52127e0943be99
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c3463e55c2827928dfa1b830953cf8eccfe7f6ab2a72af5d13db1a192ce98b
3
+ size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a56d30c04eda66f1451428a4a1783f0e0b3c6401e9dc47a22a9a23c6f9d71d1c
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fbc08cc620efc6ad1b3090a70819940a5a6dca3de71f9ffed8d3aa8dee8bdcc
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:252bfaee072432d2b9efeeb2414b13c69cfea81ef8749ee867aa8e12e0fa2d52
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8c2cc612f6c582ed6586d60fa04580b6f35775b91158d5b84ddd0f0a65ddd3
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9e684c71dc83c29adb7891edadb6f809a0f52fc37575c6edaa71e9c79dd0a26
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60fbf66cb187e2da54f6604ee46efd1578eb148d61f9556ffc6254e09665c1a9
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d1c67928001883576d4a56b44f4eee5262f60a7be50b274805186459e2f4ae5
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:591046c9a1cdb63ed76af20e30931eec37ddea64d1cedd0e21228761a5b0c89f
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.955380457189976,
5
- "global_step": 390000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2892,11 +2892,85 @@
2892
  "eval_samples_per_second": 976.954,
2893
  "eval_steps_per_second": 15.631,
2894
  "step": 390000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2895
  }
2896
  ],
2897
  "max_steps": 1000000,
2898
  "num_train_epochs": 16,
2899
- "total_flos": 2.733906894842795e+22,
2900
  "trial_name": null,
2901
  "trial_params": null
2902
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 6.108082520194848,
5
+ "global_step": 400000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2892
  "eval_samples_per_second": 976.954,
2893
  "eval_steps_per_second": 15.631,
2894
  "step": 390000
2895
+ },
2896
+ {
2897
+ "epoch": 5.97,
2898
+ "learning_rate": 0.00011001384164990662,
2899
+ "loss": 0.2775,
2900
+ "step": 391000
2901
+ },
2902
+ {
2903
+ "epoch": 5.99,
2904
+ "learning_rate": 0.00010980455040955506,
2905
+ "loss": 0.2769,
2906
+ "step": 392000
2907
+ },
2908
+ {
2909
+ "epoch": 6.0,
2910
+ "learning_rate": 0.00010959493323141538,
2911
+ "loss": 0.2773,
2912
+ "step": 393000
2913
+ },
2914
+ {
2915
+ "epoch": 6.02,
2916
+ "learning_rate": 0.00010938499240782739,
2917
+ "loss": 0.277,
2918
+ "step": 394000
2919
+ },
2920
+ {
2921
+ "epoch": 6.03,
2922
+ "learning_rate": 0.00010917473023467032,
2923
+ "loss": 0.277,
2924
+ "step": 395000
2925
+ },
2926
+ {
2927
+ "epoch": 6.03,
2928
+ "eval_runtime": 1.0769,
2929
+ "eval_samples_per_second": 928.59,
2930
+ "eval_steps_per_second": 14.857,
2931
+ "step": 395000
2932
+ },
2933
+ {
2934
+ "epoch": 6.05,
2935
+ "learning_rate": 0.00010896414901133761,
2936
+ "loss": 0.2766,
2937
+ "step": 396000
2938
+ },
2939
+ {
2940
+ "epoch": 6.06,
2941
+ "learning_rate": 0.00010875325104071177,
2942
+ "loss": 0.2768,
2943
+ "step": 397000
2944
+ },
2945
+ {
2946
+ "epoch": 6.08,
2947
+ "learning_rate": 0.00010854203862913927,
2948
+ "loss": 0.2765,
2949
+ "step": 398000
2950
+ },
2951
+ {
2952
+ "epoch": 6.09,
2953
+ "learning_rate": 0.00010833051408640509,
2954
+ "loss": 0.2763,
2955
+ "step": 399000
2956
+ },
2957
+ {
2958
+ "epoch": 6.11,
2959
+ "learning_rate": 0.00010811867972570786,
2960
+ "loss": 0.2767,
2961
+ "step": 400000
2962
+ },
2963
+ {
2964
+ "epoch": 6.11,
2965
+ "eval_runtime": 1.1081,
2966
+ "eval_samples_per_second": 902.417,
2967
+ "eval_steps_per_second": 14.439,
2968
+ "step": 400000
2969
  }
2970
  ],
2971
  "max_steps": 1000000,
2972
  "num_train_epochs": 16,
2973
+ "total_flos": 2.8040064988049933e+22,
2974
  "trial_name": null,
2975
  "trial_params": null
2976
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf099ec439cbdff64f3d3b55ea1f32c5386c40432f4a5418054927a7f60a7a71
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e086dc2588b852e6182d32ad6ab8f484673dafebd51e08d7a801497b43f4fe30
3
  size 449471589