rootxhacker commited on
Commit
bd2ebab
·
verified ·
1 Parent(s): 11d0053

Training in progress, step 17500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b80b3583e2afb611f4c9adf5dda97e41fa3abaeec3239ac74a43ddde70a05578
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d2977f0197deae844fb8fa4ba1483d26d8ab4a842337c308c5805e2d4b9291
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfba693cf1d282bbea5c304bdd309307768a9ce459d448905954c71c856485be
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5b3283c3aaea4f1a12c8a11e653a36fa924634ce08452daace823d8327ea96f
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba8347dc980899d1fbf4c0d68fa8a8cf6d3395e6ddd6aee4b5d0bea2791716a0
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aaf80cd43f46651a9c4aa03f28756212e23d71139e6fe0dca4ad9952d5a2268
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a9d5359cc143881ecdb88768e105d086fd2336ed10ecf8c85dd03dc0e505da1
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c6f63d896b1e09539b72ac15eabafd681bf824376794bc90d0981fb00940917
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3333c3c82f9e4ec8ba5829fe0ea7dc977fdffe09f41702806e9515db920536e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83c670602c4fdb95d34df084cca714b1e4115a72825bd5c70e64c19d3a998917
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14c33e4d9235be55afaa758d537d857af11e671e33d9253fad9c2c79b3373700
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abfae05460636119aec0a7a8d55ec3326712e8ea80bb468cb104d4e03da4b28b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 16750,
3
  "best_metric": 1.4798808097839355,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
- "epoch": 1.3075917237135606,
6
  "eval_steps": 250,
7
- "global_step": 17000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2932,6 +2932,92 @@
2932
  "eval_samples_per_second": 55.941,
2933
  "eval_steps_per_second": 13.985,
2934
  "step": 17000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2935
  }
2936
  ],
2937
  "logging_steps": 50,
 
2
  "best_global_step": 16750,
3
  "best_metric": 1.4798808097839355,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
+ "epoch": 1.346050303822783,
6
  "eval_steps": 250,
7
+ "global_step": 17500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2932
  "eval_samples_per_second": 55.941,
2933
  "eval_steps_per_second": 13.985,
2934
  "step": 17000
2935
+ },
2936
+ {
2937
+ "epoch": 1.3114375817244828,
2938
+ "grad_norm": 1.6637665033340454,
2939
+ "learning_rate": 0.00011408981118354414,
2940
+ "loss": 1.5071,
2941
+ "step": 17050
2942
+ },
2943
+ {
2944
+ "epoch": 1.315283439735405,
2945
+ "grad_norm": 2.0815582275390625,
2946
+ "learning_rate": 0.00011383009116172768,
2947
+ "loss": 1.4606,
2948
+ "step": 17100
2949
+ },
2950
+ {
2951
+ "epoch": 1.3191292977463271,
2952
+ "grad_norm": 1.6492595672607422,
2953
+ "learning_rate": 0.00011357037113991117,
2954
+ "loss": 1.4408,
2955
+ "step": 17150
2956
+ },
2957
+ {
2958
+ "epoch": 1.3229751557572493,
2959
+ "grad_norm": 0.8617509603500366,
2960
+ "learning_rate": 0.00011331065111809469,
2961
+ "loss": 1.497,
2962
+ "step": 17200
2963
+ },
2964
+ {
2965
+ "epoch": 1.3268210137681717,
2966
+ "grad_norm": 1.6395294666290283,
2967
+ "learning_rate": 0.00011305093109627823,
2968
+ "loss": 1.4774,
2969
+ "step": 17250
2970
+ },
2971
+ {
2972
+ "epoch": 1.3268210137681717,
2973
+ "eval_loss": 1.4835026264190674,
2974
+ "eval_runtime": 18.0136,
2975
+ "eval_samples_per_second": 55.514,
2976
+ "eval_steps_per_second": 13.878,
2977
+ "step": 17250
2978
+ },
2979
+ {
2980
+ "epoch": 1.330666871779094,
2981
+ "grad_norm": 2.7765560150146484,
2982
+ "learning_rate": 0.00011279121107446174,
2983
+ "loss": 1.4864,
2984
+ "step": 17300
2985
+ },
2986
+ {
2987
+ "epoch": 1.3345127297900161,
2988
+ "grad_norm": 1.2104064226150513,
2989
+ "learning_rate": 0.00011253149105264524,
2990
+ "loss": 1.4075,
2991
+ "step": 17350
2992
+ },
2993
+ {
2994
+ "epoch": 1.3383585878009385,
2995
+ "grad_norm": 1.6772801876068115,
2996
+ "learning_rate": 0.00011227177103082878,
2997
+ "loss": 1.4629,
2998
+ "step": 17400
2999
+ },
3000
+ {
3001
+ "epoch": 1.3422044458118605,
3002
+ "grad_norm": 2.254371404647827,
3003
+ "learning_rate": 0.00011201205100901229,
3004
+ "loss": 1.4447,
3005
+ "step": 17450
3006
+ },
3007
+ {
3008
+ "epoch": 1.346050303822783,
3009
+ "grad_norm": 2.2015669345855713,
3010
+ "learning_rate": 0.00011175233098719582,
3011
+ "loss": 1.4664,
3012
+ "step": 17500
3013
+ },
3014
+ {
3015
+ "epoch": 1.346050303822783,
3016
+ "eval_loss": 1.496685266494751,
3017
+ "eval_runtime": 17.7963,
3018
+ "eval_samples_per_second": 56.191,
3019
+ "eval_steps_per_second": 14.048,
3020
+ "step": 17500
3021
  }
3022
  ],
3023
  "logging_steps": 50,