rootxhacker commited on
Commit
5c3e2a5
·
verified ·
1 Parent(s): 384c3a6

Training in progress, step 11500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81cf0e3dd4d992ca19a0a903b87889cb1dcb0561835bd1a05ad25d4805a11c3a
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a9e090bf1b3b09dbe8cb6b79d3a7e692232fb851dc5e22f221471a638858e73
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24383c9348cb96ba012340aa8a76698ba299b93dfbd362d850260ceb6b5bff92
3
  size 1736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30fc997f014f8771605ac175a0becd64846b6e365b7b344cbcd1952ce4ff7b9d
3
  size 1736
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:714a435b99357bfd46a0b087ff628bd01321e6a7b7b84db498111b7fbf583143
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d50e12c43bc31ea78337ba4c2a352e47dae2a51ea081d7c0d57df4add4243c5
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43f28196579619a7a1a9fd513d6b01be77d05b370f16ae231d5c0e099a688b29
3
- size 14180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b95749af35857001e40598a88328f44c58838ef1911894bdba44fd9cf3d356b1
3
+ size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ffb6ab86afd8a1b76a16f7a0e015b06dbb79dc500dae39323cc69f06851bdbd
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7532c7a02e2aeb7c936b6d9813b2c402b9be5b25d9e0bb18270e536f6014e58
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:894bd6c57ea4e17b26aada8f86d81df3acee0b45c80103268804ff49bb2ddbbc
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:129303cede08862e45aff723e13523f2863b1a8c5dd6144e719bcbf05975af10
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 11000,
3
- "best_metric": 1.807216763496399,
4
- "best_model_checkpoint": "./ar-diffusion-checkpoints-progressive-attention/checkpoint-11000",
5
- "epoch": 0.8460887624028921,
6
  "eval_steps": 250,
7
- "global_step": 11000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1900,6 +1900,92 @@
1900
  "eval_samples_per_second": 58.076,
1901
  "eval_steps_per_second": 14.519,
1902
  "step": 11000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1903
  }
1904
  ],
1905
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 11500,
3
+ "best_metric": 1.792478322982788,
4
+ "best_model_checkpoint": "./ar-diffusion-checkpoints-progressive-attention/checkpoint-11500",
5
+ "epoch": 0.8845473425121144,
6
  "eval_steps": 250,
7
+ "global_step": 11500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1900
  "eval_samples_per_second": 58.076,
1901
  "eval_steps_per_second": 14.519,
1902
  "step": 11000
1903
+ },
1904
+ {
1905
+ "epoch": 0.8499346204138143,
1906
+ "grad_norm": 2.47654128074646,
1907
+ "learning_rate": 0.00014523543619977664,
1908
+ "loss": 1.8003,
1909
+ "step": 11050
1910
+ },
1911
+ {
1912
+ "epoch": 0.8537804784247366,
1913
+ "grad_norm": 1.6507407426834106,
1914
+ "learning_rate": 0.00014497571617796018,
1915
+ "loss": 1.8999,
1916
+ "step": 11100
1917
+ },
1918
+ {
1919
+ "epoch": 0.8576263364356588,
1920
+ "grad_norm": 1.4758163690567017,
1921
+ "learning_rate": 0.0001447159961561437,
1922
+ "loss": 1.837,
1923
+ "step": 11150
1924
+ },
1925
+ {
1926
+ "epoch": 0.8614721944465811,
1927
+ "grad_norm": 2.2486917972564697,
1928
+ "learning_rate": 0.00014445627613432718,
1929
+ "loss": 1.8501,
1930
+ "step": 11200
1931
+ },
1932
+ {
1933
+ "epoch": 0.8653180524575033,
1934
+ "grad_norm": 1.682785987854004,
1935
+ "learning_rate": 0.00014419655611251072,
1936
+ "loss": 1.8486,
1937
+ "step": 11250
1938
+ },
1939
+ {
1940
+ "epoch": 0.8653180524575033,
1941
+ "eval_loss": 1.8015695810317993,
1942
+ "eval_runtime": 16.9649,
1943
+ "eval_samples_per_second": 58.945,
1944
+ "eval_steps_per_second": 14.736,
1945
+ "step": 11250
1946
+ },
1947
+ {
1948
+ "epoch": 0.8691639104684256,
1949
+ "grad_norm": 1.687892198562622,
1950
+ "learning_rate": 0.00014393683609069424,
1951
+ "loss": 1.8196,
1952
+ "step": 11300
1953
+ },
1954
+ {
1955
+ "epoch": 0.8730097684793477,
1956
+ "grad_norm": 1.6149276494979858,
1957
+ "learning_rate": 0.00014367711606887775,
1958
+ "loss": 1.829,
1959
+ "step": 11350
1960
+ },
1961
+ {
1962
+ "epoch": 0.8768556264902699,
1963
+ "grad_norm": 1.2599520683288574,
1964
+ "learning_rate": 0.0001434173960470613,
1965
+ "loss": 1.8398,
1966
+ "step": 11400
1967
+ },
1968
+ {
1969
+ "epoch": 0.8807014845011922,
1970
+ "grad_norm": 2.5826971530914307,
1971
+ "learning_rate": 0.0001431576760252448,
1972
+ "loss": 1.8362,
1973
+ "step": 11450
1974
+ },
1975
+ {
1976
+ "epoch": 0.8845473425121144,
1977
+ "grad_norm": 1.9814509153366089,
1978
+ "learning_rate": 0.00014289795600342831,
1979
+ "loss": 1.7922,
1980
+ "step": 11500
1981
+ },
1982
+ {
1983
+ "epoch": 0.8845473425121144,
1984
+ "eval_loss": 1.792478322982788,
1985
+ "eval_runtime": 16.8513,
1986
+ "eval_samples_per_second": 59.343,
1987
+ "eval_steps_per_second": 14.836,
1988
+ "step": 11500
1989
  }
1990
  ],
1991
  "logging_steps": 50,