llama8b_liminal_wolf_cot / loss_per_step.csv
brendan-gho's picture
Upload 6 files
8e044cc verified
step,epoch,total_loss,ce_loss,kl_loss,lambda_kl,weighted_kl
1,0.1,0.511496,0.510502,0.000995,1.0,0.000995
2,0.2,1.016224,0.544139,0.472085,1.0,0.472085
3,0.3,0.601374,0.424637,0.176737,1.0,0.176737
4,0.4,0.572086,0.480336,0.09175,1.0,0.09175
5,0.5,0.531319,0.410735,0.120584,1.0,0.120584
6,0.6,0.575735,0.444787,0.130948,1.0,0.130948
7,0.7,0.504727,0.386459,0.118268,1.0,0.118268
8,0.8,0.538125,0.430491,0.107635,1.0,0.107635
9,0.9,0.493732,0.38243,0.111303,1.0,0.111303
10,1.0,0.496017,0.394671,0.101345,1.0,0.101345
11,1.1,0.394405,0.287855,0.10655,1.0,0.10655
12,1.2,0.446643,0.3533,0.095737,0.975,0.093343
13,1.3,0.392388,0.305773,0.091173,0.95,0.086615
14,1.4,0.360105,0.288071,0.077874,0.925,0.072034
15,1.5,0.415859,0.331615,0.093604,0.9,0.084243
16,1.6,0.35702,0.273872,0.095026,0.875,0.083148
17,1.7,0.325292,0.2495,0.089166,0.85,0.075791
18,1.8,0.416785,0.333094,0.101443,0.825,0.083691
19,1.9,0.432763,0.353152,0.099513,0.8,0.079611
20,2.0,0.321208,0.252479,0.088682,0.775,0.068729
21,2.1,0.312627,0.25144,0.081583,0.75,0.061187
22,2.2,0.279543,0.218081,0.084776,0.725,0.061462
23,2.3,0.266282,0.211751,0.077902,0.7,0.054531
24,2.4,0.24146,0.193625,0.070866,0.675,0.047835
25,2.5,0.281355,0.228921,0.080668,0.65,0.052434
26,2.6,0.27292,0.219579,0.085346,0.625,0.053341
27,2.7,0.300875,0.247975,0.088167,0.6,0.0529
28,2.8,0.275081,0.227481,0.082783,0.575,0.0476
29,2.9,0.332112,0.260958,0.129371,0.55,0.071154
30,3.0,0.243961,0.196709,0.090003,0.525,0.047252
31,3.1,0.201037,0.155606,0.090863,0.5,0.045431
32,3.2,0.231809,0.176255,0.116957,0.475,0.055554
33,3.3,0.221151,0.184103,0.082329,0.45,0.037048
34,3.4,0.205875,0.165267,0.095549,0.425,0.040608
35,3.5,0.186765,0.143731,0.107585,0.4,0.043034
36,3.6,0.207938,0.159215,0.129929,0.375,0.048723
37,3.7,0.156872,0.1153,0.118778,0.35,0.041572
38,3.8,0.195508,0.148235,0.145456,0.325,0.047273
39,3.9,0.195192,0.151226,0.146555,0.3,0.043966
40,4.0,0.180774,0.139215,0.151124,0.275,0.041559
41,4.1,0.119815,0.087757,0.128235,0.25,0.032059
42,4.2,0.131707,0.094378,0.16591,0.225,0.03733
43,4.3,0.140382,0.102098,0.191417,0.2,0.038283
44,4.4,0.1455,0.112854,0.186549,0.175,0.032646
45,4.5,0.110503,0.081905,0.190647,0.15,0.028597
46,4.6,0.092831,0.066552,0.210232,0.125,0.026279
47,4.7,0.107449,0.082429,0.250205,0.1,0.02502
48,4.8,0.077413,0.057663,0.263337,0.075,0.01975
49,4.9,0.083262,0.069313,0.278989,0.05,0.013949
50,5.0,0.117898,0.107473,0.416972,0.025,0.010424