rootxhacker commited on
Commit
cd9dd3c
·
verified ·
1 Parent(s): dec783f

Training in progress, step 18000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78d2977f0197deae844fb8fa4ba1483d26d8ab4a842337c308c5805e2d4b9291
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42c2f6139756d4179a8f7b2fd49bb0a2cd540ba8b774f9e69c5f50f17435f6b6
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5b3283c3aaea4f1a12c8a11e653a36fa924634ce08452daace823d8327ea96f
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5bffd3fc7ee80c7d1ba70865a03ab1d358a04bee58d41c0ac14d5c087eae56f
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7aaf80cd43f46651a9c4aa03f28756212e23d71139e6fe0dca4ad9952d5a2268
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b5e18457edaea63d6ccb66baccbacd52b196222165882275df4a7c9e0e28b1b
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c6f63d896b1e09539b72ac15eabafd681bf824376794bc90d0981fb00940917
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aec74914111c893531d77390ed26a8e62f47c5fd368563e3e2ea395d9971bdd0
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83c670602c4fdb95d34df084cca714b1e4115a72825bd5c70e64c19d3a998917
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d21f0ba0bbe7a28de5199a35a5f642d45bf19d1eb0aa770d1035c6ab0a649bfa
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abfae05460636119aec0a7a8d55ec3326712e8ea80bb468cb104d4e03da4b28b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47960831c3aee4c1e74537230bffbd7196098e4c54fe510c8e622c62e1271790
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 16750,
3
  "best_metric": 1.4798808097839355,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
- "epoch": 1.346050303822783,
6
  "eval_steps": 250,
7
- "global_step": 17500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3018,6 +3018,92 @@
3018
  "eval_samples_per_second": 56.191,
3019
  "eval_steps_per_second": 14.048,
3020
  "step": 17500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3021
  }
3022
  ],
3023
  "logging_steps": 50,
 
2
  "best_global_step": 16750,
3
  "best_metric": 1.4798808097839355,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
+ "epoch": 1.3845088839320052,
6
  "eval_steps": 250,
7
+ "global_step": 18000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3018
  "eval_samples_per_second": 56.191,
3019
  "eval_steps_per_second": 14.048,
3020
  "step": 17500
3021
+ },
3022
+ {
3023
+ "epoch": 1.349896161833705,
3024
+ "grad_norm": 1.740045428276062,
3025
+ "learning_rate": 0.00011149261096537933,
3026
+ "loss": 1.4486,
3027
+ "step": 17550
3028
+ },
3029
+ {
3030
+ "epoch": 1.3537420198446273,
3031
+ "grad_norm": 1.299919605255127,
3032
+ "learning_rate": 0.00011123289094356284,
3033
+ "loss": 1.4868,
3034
+ "step": 17600
3035
+ },
3036
+ {
3037
+ "epoch": 1.3575878778555497,
3038
+ "grad_norm": 1.6288009881973267,
3039
+ "learning_rate": 0.00011097317092174637,
3040
+ "loss": 1.4595,
3041
+ "step": 17650
3042
+ },
3043
+ {
3044
+ "epoch": 1.3614337358664719,
3045
+ "grad_norm": 0.8747851252555847,
3046
+ "learning_rate": 0.00011071345089992988,
3047
+ "loss": 1.4241,
3048
+ "step": 17700
3049
+ },
3050
+ {
3051
+ "epoch": 1.365279593877394,
3052
+ "grad_norm": 1.9510573148727417,
3053
+ "learning_rate": 0.0001104537308781134,
3054
+ "loss": 1.496,
3055
+ "step": 17750
3056
+ },
3057
+ {
3058
+ "epoch": 1.365279593877394,
3059
+ "eval_loss": 1.4812238216400146,
3060
+ "eval_runtime": 17.8955,
3061
+ "eval_samples_per_second": 55.88,
3062
+ "eval_steps_per_second": 13.97,
3063
+ "step": 17750
3064
+ },
3065
+ {
3066
+ "epoch": 1.3691254518883162,
3067
+ "grad_norm": 1.4853876829147339,
3068
+ "learning_rate": 0.00011019401085629692,
3069
+ "loss": 1.4645,
3070
+ "step": 17800
3071
+ },
3072
+ {
3073
+ "epoch": 1.3729713098992384,
3074
+ "grad_norm": 1.5125057697296143,
3075
+ "learning_rate": 0.00010993429083448044,
3076
+ "loss": 1.4052,
3077
+ "step": 17850
3078
+ },
3079
+ {
3080
+ "epoch": 1.3768171679101608,
3081
+ "grad_norm": 0.7320863008499146,
3082
+ "learning_rate": 0.00010967457081266395,
3083
+ "loss": 1.5016,
3084
+ "step": 17900
3085
+ },
3086
+ {
3087
+ "epoch": 1.380663025921083,
3088
+ "grad_norm": 1.9995285272598267,
3089
+ "learning_rate": 0.00010941485079084747,
3090
+ "loss": 1.4234,
3091
+ "step": 17950
3092
+ },
3093
+ {
3094
+ "epoch": 1.3845088839320052,
3095
+ "grad_norm": 0.8304823637008667,
3096
+ "learning_rate": 0.00010915513076903099,
3097
+ "loss": 1.4068,
3098
+ "step": 18000
3099
+ },
3100
+ {
3101
+ "epoch": 1.3845088839320052,
3102
+ "eval_loss": 1.4845945835113525,
3103
+ "eval_runtime": 17.7402,
3104
+ "eval_samples_per_second": 56.369,
3105
+ "eval_steps_per_second": 14.092,
3106
+ "step": 18000
3107
  }
3108
  ],
3109
  "logging_steps": 50,