DiffuMoE / checkpoints /metrics.json
pragadeeshv23's picture
Upload folder using huggingface_hub
05c5c96 verified
{
"step": [
20,
40,
60,
80,
100,
120,
140,
160,
180,
200,
220,
240,
260,
280,
300,
320,
340,
360,
380,
400,
420,
440,
460,
480,
500,
520,
540,
560,
580,
600,
620,
640,
660,
680,
700,
720,
740,
760,
780,
800,
820,
840,
860,
880,
900,
920,
940,
960,
980,
1000,
1020,
1040,
1060,
1080,
1100,
1120,
1140,
1160,
1180,
1200,
1220,
1240,
1260,
1280,
1300,
1320,
1340,
1360,
1380,
1400,
1420,
1440,
1460,
1480,
1500,
1520,
1540,
1560,
1580,
1600,
1620,
1640,
1660,
1680,
1700,
1720,
1740,
1760,
1780,
1800,
1820,
1840,
1860,
1880,
1900,
1920,
1940,
1960,
1980,
2000
],
"loss": [
13.01135540008545,
12.910130500793457,
12.878702163696289,
13.055136680603027,
12.856282234191895,
12.892973899841309,
12.574070930480957,
12.591830253601074,
11.862343788146973,
12.267929077148438,
11.718879699707031,
11.782928466796875,
11.32141399383545,
10.947478294372559,
11.015000343322754,
10.51812744140625,
9.942607879638672,
10.157938003540039,
9.576417922973633,
9.873355865478516,
9.336055755615234,
8.463921546936035,
8.448714256286621,
7.873770713806152,
8.87045669555664,
8.33026123046875,
8.444175720214844,
8.25655746459961,
8.674581527709961,
7.506237983703613,
8.96613883972168,
7.297183036804199,
8.026745796203613,
8.211706161499023,
8.002279281616211,
7.826014518737793,
8.171727180480957,
8.271117210388184,
8.01691722869873,
7.814000129699707,
6.870446681976318,
8.228886604309082,
8.211021423339844,
8.3836088180542,
8.150617599487305,
8.40621566772461,
6.908005237579346,
7.948884963989258,
8.819059371948242,
6.730184555053711,
9.667962074279785,
8.515629768371582,
7.004836559295654,
6.529440879821777,
7.3411126136779785,
7.465605735778809,
7.4516754150390625,
8.158768653869629,
6.563774585723877,
6.798803329467773,
7.846137046813965,
8.057183265686035,
9.450199127197266,
8.246626853942871,
6.683084964752197,
7.694072246551514,
7.082373142242432,
8.105720520019531,
7.995109558105469,
8.741410255432129,
8.160144805908203,
7.356888771057129,
7.691959381103516,
8.144810676574707,
8.257232666015625,
6.770656108856201,
7.8467116355896,
6.088348388671875,
7.593717575073242,
6.500844478607178,
7.55759859085083,
7.873746871948242,
6.611128807067871,
6.854572772979736,
7.534996509552002,
6.498363494873047,
8.169705390930176,
6.677304744720459,
8.422018051147461,
7.468722343444824,
7.503901958465576,
7.894885540008545,
8.858969688415527,
6.55321741104126,
7.720912933349609,
7.144687175750732,
6.437860488891602,
8.803232192993164,
7.4235687255859375,
7.418603897094727
],
"kd_loss": [
0.84130859375,
0.9189453125,
0.76416015625,
0.92578125,
0.8857421875,
0.8876953125,
0.85791015625,
0.88232421875,
0.76123046875,
0.83740234375,
0.7958984375,
0.78369140625,
0.82275390625,
0.80615234375,
0.806640625,
0.80078125,
0.7705078125,
0.7099609375,
0.71875,
0.6455078125,
0.666015625,
0.65087890625,
0.662109375,
0.61083984375,
0.71044921875,
0.6669921875,
0.70556640625,
0.61962890625,
0.638671875,
0.461669921875,
0.51171875,
0.52587890625,
0.55517578125,
0.51220703125,
0.52783203125,
0.498779296875,
0.499267578125,
0.53076171875,
0.461669921875,
0.52197265625,
0.4931640625,
0.603515625,
0.4580078125,
0.454345703125,
0.45361328125,
0.50634765625,
0.39404296875,
0.5009765625,
0.485107421875,
0.47314453125,
0.46875,
0.4765625,
0.5107421875,
0.466796875,
0.5712890625,
0.50537109375,
0.464599609375,
0.495849609375,
0.43115234375,
0.45068359375,
0.515625,
0.50146484375,
0.52197265625,
0.47021484375,
0.464599609375,
0.49365234375,
0.45556640625,
0.4912109375,
0.469970703125,
0.537109375,
0.52734375,
0.46533203125,
0.5791015625,
0.490234375,
0.49365234375,
0.46142578125,
0.5185546875,
0.411376953125,
0.50634765625,
0.450439453125,
0.473876953125,
0.4765625,
0.43701171875,
0.50927734375,
0.444580078125,
0.48876953125,
0.47998046875,
0.45703125,
0.471923828125,
0.49951171875,
0.48876953125,
0.5029296875,
0.463623046875,
0.50537109375,
0.5263671875,
0.5048828125,
0.482666015625,
0.50341796875,
0.5166015625,
0.498046875
],
"feature_loss": [
1.011704921722412,
1.0281468629837036,
1.0070443153381348,
1.0180995464324951,
1.0128705501556396,
1.0121362209320068,
0.9974076747894287,
0.983728289604187,
0.9665164947509766,
0.9734835028648376,
0.9495055675506592,
0.9462718963623047,
0.9503380656242371,
0.9555320739746094,
0.9235469102859497,
0.9461557269096375,
0.9295395612716675,
0.9337116479873657,
0.9485768675804138,
0.9323873519897461,
0.9215673208236694,
0.8932425379753113,
0.9283745288848877,
0.8981494903564453,
0.8967580795288086,
0.8721784353256226,
0.9352220296859741,
0.8985003232955933,
0.886945903301239,
0.7633460760116577,
0.8686611652374268,
0.9059342741966248,
0.702778697013855,
0.7224442958831787,
0.8270082473754883,
0.7764517068862915,
0.6066257953643799,
0.803402304649353,
0.5553332567214966,
0.6571298241615295,
0.5670731067657471,
0.4790046811103821,
0.7220501899719238,
0.6284703612327576,
0.526972770690918,
0.8618556261062622,
0.4141847491264343,
0.5487884283065796,
0.47735628485679626,
0.5861929655075073,
0.36794406175613403,
0.40153050422668457,
0.3912087380886078,
0.627028226852417,
0.7439416646957397,
0.8370383977890015,
0.8622229099273682,
0.4787960648536682,
0.36588621139526367,
0.8549920916557312,
0.5968952178955078,
0.47625765204429626,
0.37089550495147705,
0.515034556388855,
0.6132628321647644,
0.8492034673690796,
0.6784032583236694,
0.6520413756370544,
0.6804770231246948,
0.4435226619243622,
0.5659460425376892,
0.6919162273406982,
0.6253885626792908,
0.5034392476081848,
0.6003223657608032,
0.4678567349910736,
0.5171372294425964,
0.4823329448699951,
0.8494625091552734,
0.8440153002738953,
0.5160006284713745,
0.39903637766838074,
0.4204762876033783,
0.45261943340301514,
0.5122700929641724,
0.6892856955528259,
0.5842413306236267,
0.6559497117996216,
0.8277034163475037,
0.6353162527084351,
0.8434888124465942,
0.7488307952880859,
0.3380633294582367,
0.46069929003715515,
0.599678635597229,
0.8197665214538574,
0.6250760555267334,
0.37282225489616394,
0.8203688859939575,
0.42478424310684204
],
"lm_loss": [
12.136162757873535,
11.969149589538574,
12.06596565246582,
12.110794067382812,
11.945212364196777,
11.980586051940918,
11.688065528869629,
11.689029693603516,
11.06015396118164,
11.403310775756836,
10.89225959777832,
10.966720581054688,
10.473143577575684,
10.11135196685791,
10.184782981872559,
9.688271522521973,
9.140488624572754,
9.403325080871582,
8.811507225036621,
9.170276641845703,
8.619027137756348,
7.764764785766602,
7.733254432678223,
7.205371379852295,
8.122745513916016,
7.622133731842041,
7.692678451538086,
7.581251621246338,
7.9864501953125,
6.9841837882995605,
8.382983207702637,
6.695342063903809,
7.442098617553711,
7.6575493812561035,
7.414514064788818,
7.271798610687256,
7.6509881019592285,
7.685876369476318,
7.536465644836426,
7.265093803405762,
6.3625006675720215,
7.650175094604492,
7.7001566886901855,
7.8943891525268555,
7.682429790496826,
7.828815460205078,
6.509982585906982,
7.438248634338379,
8.335404396057129,
6.234528064727783,
9.21937370300293,
8.053976058959961,
6.5179033279418945,
6.0304999351501465,
6.735292911529541,
6.893901348114014,
6.907649040222168,
7.666281223297119,
6.145626544952393,
6.267209053039551,
7.314160346984863,
7.560809135437012,
8.958539962768555,
7.767399311065674,
6.188850402832031,
7.129211902618408,
6.58219051361084,
7.58224630355835,
7.48303747177124,
8.223018646240234,
7.6250810623168945,
6.846190929412842,
7.1035027503967285,
7.652032852172852,
7.7421488761901855,
6.307944297790527,
7.328489303588867,
5.662780284881592,
7.018795967102051,
5.971689701080322,
7.0752482414245605,
7.412591934204102,
6.17742395401001,
6.356578350067139,
7.076829433441162,
5.969393253326416,
7.668824195861816,
6.180392265319824,
7.8790364265441895,
6.942000865936279,
6.944090843200684,
7.342775821685791,
8.420507431030273,
6.056780815124512,
7.179834365844727,
6.576925277709961,
5.926614761352539,
8.325835227966309,
6.846164703369141,
6.93520975112915
],
"learning_rate": [
1.6000000000000003e-05,
4e-05,
5.6000000000000006e-05,
8e-05,
9.6e-05,
0.00012,
0.00013600000000000003,
0.00016,
0.00017600000000000002,
0.0002,
0.00021600000000000002,
0.00024,
0.00025600000000000004,
0.00028,
0.000296,
0.00032,
0.000336,
0.00036,
0.000376,
0.0004,
0.00041600000000000003,
0.00044000000000000007,
0.00045599999999999997,
0.00048,
0.000496,
0.0005200000000000001,
0.000536,
0.00056,
0.000576,
0.0006000000000000001,
0.000616,
0.00064,
0.000656,
0.00068,
0.000696,
0.00072,
0.0007360000000000001,
0.00076,
0.000776,
0.0008,
0.0007999978128320429,
0.0007999863302656699,
0.0007999732074672132,
0.0007999453219969876,
0.0007999212644649572,
0.000799876977996814,
0.00079984198737551,
0.0007997813029363705,
0.0007997353816173558,
0.0007996583033549204,
0.000799601454476856,
0.0007995079876593219,
0.000799440215107753,
0.0007993303661234531,
0.0007992516745305437,
0.0007991254508875099,
0.0007990358456317257,
0.0007988932559571764,
0.0007987927431629178,
0.000798633797202668,
0.0007985223837398507,
0.0007983470923576455,
0.0007982247858412321,
0.0007980331610180046,
0.0007978999698074827,
0.0007976920246405352,
0.000797547957839347,
0.0007973237065414553,
0.0007971687739963757,
0.000796928231894818,
0.0007967624441952804,
0.0007965056277307901,
0.0007963289962081636,
0.0007960559229338047,
0.0007958684596606193,
0.0007955791482405875,
0.0007953808660297086,
0.0007950753362380551,
0.0007948662486418088,
0.000794544521361089,
0.0007943246426703345,
0.0007939867398901808,
0.0007937560851333347,
0.000793402029948953,
0.0007931606148909615,
0.0007927904315015536,
0.0007925382726428152,
0.0007921519863499238,
0.0007918891009251616,
0.0007914867381309418,
0.0007912131441080255,
0.0007907947323134398,
0.0007905104483921571,
0.000790076016195096,
0.0007897810618058754,
0.0007893306388992024,
0.0007890250342017847,
0.0007885586513713071,
0.0007882424172533675,
0.0007877601063757322
]
}