Upload astropt/125M/loss.txt with huggingface_hub
Browse files- astropt/125M/loss.txt +55 -0
astropt/125M/loss.txt
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
iter_num,dummy_train,dummy_valid,lr,mfu
|
| 2 |
+
0,9.138226509094238,9.138168334960938,0.0,-100.0
|
| 3 |
+
0,9.181780815124512,9.181798934936523,0.0,-100.0
|
| 4 |
+
1000,0.860519528388977,1.0081998109817505,0.00015,53.38948297326608
|
| 5 |
+
2000,0.996226966381073,0.9286614656448364,0.0002999999999999999,39.94448914410281
|
| 6 |
+
3000,1.0748727321624756,0.8656126856803894,0.0002991326819096825,42.40623955087939
|
| 7 |
+
4000,0.9633528590202332,0.8617240190505981,0.0002965418719449493,35.18881631039248
|
| 8 |
+
5000,0.9263629913330078,0.8778478503227234,0.0002922608598295186,56.40154056146094
|
| 9 |
+
6000,0.6420175433158875,0.8558174967765808,0.00028634465295972503,42.38617765436893
|
| 10 |
+
7000,0.9903345108032227,0.8873416781425476,0.00027886926960585354,34.59328757040606
|
| 11 |
+
8000,0.7742449045181274,0.8688470125198364,0.0002699307621414576,55.46744261729377
|
| 12 |
+
9000,0.9825323820114136,0.8127785921096802,0.0002596439828513419,44.98833012934389
|
| 13 |
+
10000,0.8103340268135071,0.8269250988960266,0.000248141108176535,38.835076581987245
|
| 14 |
+
11000,0.9192649722099304,0.8522340655326843,0.00023556994035846065,45.261580749151605
|
| 15 |
+
12000,1.0803344249725342,0.885450541973114,0.000222092008304749,41.57234901981215
|
| 16 |
+
13000,0.7289506793022156,0.9366573095321655,0.0002078804920789594,64.42588841129187
|
| 17 |
+
14000,0.80018550157547,0.9037356376647949,0.00019311799768277277,46.35928173062218
|
| 18 |
+
15000,0.6300075054168701,0.9279215931892395,0.00017799421072282653,37.850982653632045
|
| 19 |
+
16000,0.8775309324264526,0.8934736251831055,0.00016270345911059434,43.41529336936596
|
| 20 |
+
17000,0.9891740083694458,0.8906213641166687,0.0001474422161125627,47.025041727660906
|
| 21 |
+
18000,0.7806650400161743,0.8381105661392212,0.00013240657583440447,48.63914030962029
|
| 22 |
+
19000,0.652572512626648,0.905791163444519,0.00011778973357704939,57.11899323979568
|
| 23 |
+
0,9.181780815124512,9.181798934936523,0.0,-100.0
|
| 24 |
+
0,9.181780815124512,9.181798934936523,0.0,-100.0
|
| 25 |
+
1000,0.8703217506408691,1.027642846107483,0.00015,54.543638676328676
|
| 26 |
+
2000,0.991230309009552,0.9246956706047058,0.0002999999999999999,41.94218888118601
|
| 27 |
+
3000,1.0776009559631348,0.8693696856498718,0.0002991326819096825,50.25156840141929
|
| 28 |
+
4000,0.9640771150588989,0.863839328289032,0.0002965418719449493,46.80291064198468
|
| 29 |
+
5000,0.9244993329048157,0.8772774934768677,0.0002922608598295186,33.8660073062216
|
| 30 |
+
6000,0.641579270362854,0.8564397692680359,0.00028634465295972503,27.45952583102438
|
| 31 |
+
7000,0.9912481307983398,0.8888487815856934,0.00027886926960585354,45.76638710586491
|
| 32 |
+
8000,0.7744794487953186,0.8669970631599426,0.0002699307621414576,51.03045010917499
|
| 33 |
+
9000,0.9812101125717163,0.8107450604438782,0.0002596439828513419,50.40647248719572
|
| 34 |
+
9000,0.8561531901359558,0.8488034009933472,0.0002596439828513419,-100.0
|
| 35 |
+
10000,0.7050328254699707,0.8702815771102905,0.000248141108176535,29.62646409703397
|
| 36 |
+
11000,0.9427868127822876,0.8721348643302917,0.00023556994035846065,45.20811422700735
|
| 37 |
+
12000,1.0257495641708374,0.8200216293334961,0.000222092008304749,49.272890097465364
|
| 38 |
+
13000,0.9204936027526855,0.8225496411323547,0.0002078804920789594,60.34757052715041
|
| 39 |
+
14000,0.8628600239753723,0.8490368127822876,0.00019311799768277277,49.92332177645698
|
| 40 |
+
15000,0.588771402835846,0.8487025499343872,0.00017799421072282653,39.15722539529214
|
| 41 |
+
16000,0.9262297749519348,0.8640414476394653,0.00016270345911059434,34.82399886788839
|
| 42 |
+
17000,0.7111174464225769,0.8343150019645691,0.0001474422161125627,42.73077331491226
|
| 43 |
+
18000,0.9010884165763855,0.7383313179016113,0.00013240657583440447,56.01115512541853
|
| 44 |
+
19000,0.731385350227356,0.7985763549804688,0.00011778973357704939,48.361930604968535
|
| 45 |
+
20000,0.8436683416366577,0.8446328043937683,0.00010377950343995106,54.562282084257596
|
| 46 |
+
21000,0.9688456654548645,0.8724458813667297,9.055590506825645e-05,30.761738681797063
|
| 47 |
+
22000,0.6398420333862305,0.9182518720626831,7.828885055214119e-05,42.1855278497351
|
| 48 |
+
23000,0.6870895624160767,0.8681755065917969,6.713596119970527e-05,36.113240220281064
|
| 49 |
+
24000,0.5372093915939331,0.9140187501907349,5.724054223605483e-05,35.63116171352224
|
| 50 |
+
25000,0.7733680605888367,0.8837581872940063,4.87297414519817e-05,46.24443448294592
|
| 51 |
+
26000,0.8804675340652466,0.8680342435836792,4.1712915462050624e-05,47.37593564414901
|
| 52 |
+
27000,0.6799569129943848,0.7743512392044067,3.628022456430116e-05,48.608743835773666
|
| 53 |
+
28000,0.5571191906929016,0.8815516233444214,3.25014742564329e-05,40.812794499890394
|
| 54 |
+
29000,0.4775930345058441,0.9815519452095032,3.0425218294013393e-05,58.75416227317387
|
| 55 |
+
30000,0.8076322674751282,0.9183138608932495,2.9999999999999997e-05,37.46902249642819
|