icarus112 commited on
Commit
4100e0f
·
verified ·
1 Parent(s): 5087576

Upload v14p14/ckpt_034000.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. v14p14/ckpt_034000.json +1 -0
v14p14/ckpt_034000.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"sent": 34000, "total_steps": 637934, "eval_results": [{"sent": 2000, "train_loss": 2.085123744664439, "train_acc": 0.4408124704770902, "eval_loss": 1.5152359620462006, "eval_acc": 0.44594594594594594, "ppl": 4.55049474422526, "w_freq": 0.001069752044629863, "w_bigram": 0.017389398230965417, "w_trigram": 0.07154396580765796, "w_skip_bi": 0.23805648573810956, "w_skip_tri": 0.465205430367037, "w_neural_phoneme": 0.3555831372188447, "w_neural_word": 0.3540519218134524, "word_vocab": 1593, "elapsed_s": 22.99993133544922, "steps_per_sec": 1380.6562957454057}, {"sent": 4000, "train_loss": 2.015406930693783, "train_acc": 0.449146110056926, "eval_loss": 1.5451346801541017, "eval_acc": 0.524390243902439, "ppl": 4.688603046282032, "w_freq": 0.003511844702708052, "w_bigram": 0.02321205769493682, "w_trigram": 0.0931775383776142, "w_skip_bi": 0.1623459701262452, "w_skip_tri": 0.4805304250923348, "w_neural_phoneme": 0.3684824684955725, "w_neural_word": 0.36741944722849984, "word_vocab": 2198, "elapsed_s": 40.84769368171692, "steps_per_sec": 1422.479331458738}, {"sent": 6000, "train_loss": 2.0513120565987895, "train_acc": 0.4426420659144689, "eval_loss": 2.385693284711908, "eval_acc": 0.37755102040816324, "ppl": 10.866593697324928, "w_freq": 0.0038737517974814202, "w_bigram": 0.042317026166645025, "w_trigram": 0.07485745911932162, "w_skip_bi": 0.16210056927329614, "w_skip_tri": 0.4859366519149216, "w_neural_phoneme": 0.35027883460856923, "w_neural_word": 0.3608633910216888, "word_vocab": 2819, "elapsed_s": 60.424288749694824, "steps_per_sec": 1444.1874584819293}, {"sent": 8000, "train_loss": 2.048645793655169, "train_acc": 0.4365337183420562, "eval_loss": 1.598692538850994, "eval_acc": 0.423728813559322, "ppl": 4.946560758578182, "w_freq": 0.00032966983389561694, "w_bigram": 0.0002418866251740584, "w_trigram": 0.1405691853149911, "w_skip_bi": 0.1781139578091503, "w_skip_tri": 0.53065518561347, "w_neural_phoneme": 0.3518465404687118, "w_neural_word": 0.35171821085490185, "word_vocab": 3459, "elapsed_s": 82.65294742584229, "steps_per_sec": 1458.0242296637243}, {"sent": 10000, "train_loss": 2.0392960710502033, "train_acc": 0.4366373172928835, "eval_loss": 1.5101141782385703, "eval_acc": 0.4852941176470588, "ppl": 4.5272476779707, "w_freq": 0.0005806880985354682, "w_bigram": 0.00650279613709746, "w_trigram": 0.05842327539161242, "w_skip_bi": 0.3587923930954613, "w_skip_tri": 0.55, "w_neural_phoneme": 0.3528922903222367, "w_neural_word": 0.35288160843142014, "word_vocab": 4067, "elapsed_s": 105.56567192077637, "steps_per_sec": 1467.5509299676955}, {"sent": 12000, "train_loss": 1.9055074628648694, "train_acc": 0.4613161614575153, "eval_loss": 1.6948638109062797, "eval_acc": 0.47368421052631576, "ppl": 5.4459042419434365, "w_freq": 0.0028678857932047954, "w_bigram": 0.01396978335657545, "w_trigram": 0.018171927977086527, "w_skip_bi": 0.4, "w_skip_tri": 0.55, "w_neural_phoneme": 0.3501947007286266, "w_neural_word": 0.35327151723764794, "word_vocab": 4455, "elapsed_s": 126.81924510002136, "steps_per_sec": 1472.6313806134503}, {"sent": 14000, "train_loss": 1.988357764454176, "train_acc": 0.44365667322606783, "eval_loss": 2.019602058013299, "eval_acc": 0.4647887323943662, "ppl": 7.535325714458626, "w_freq": 0.0012078577103194924, "w_bigram": 0.0018435259292709206, "w_trigram": 0.0021833600088577193, "w_skip_bi": 0.21387570596017932, "w_skip_tri": 0.5215356352951087, "w_neural_phoneme": 0.353403763158099, "w_neural_word": 0.35306716376230435, "word_vocab": 4946, "elapsed_s": 149.80217838287354, "steps_per_sec": 1477.3750448031014}, {"sent": 16000, "train_loss": 1.8859793216408223, "train_acc": 0.46099375900144024, "eval_loss": 1.8679316252331395, "eval_acc": 0.4805194805194805, "ppl": 6.474890040201499, "w_freq": 0.001179423340823594, "w_bigram": 0.012159731056554247, "w_trigram": 0.0169469737566637, "w_skip_bi": 0.2567323738435507, "w_skip_tri": 0.5097042745823981, "w_neural_phoneme": 0.35950514245749043, "w_neural_word": 0.3580844852439058, "word_vocab": 5338, "elapsed_s": 172.0545299053192, "steps_per_sec": 1480.0075309852539}, {"sent": 18000, "train_loss": 1.888715130293185, "train_acc": 0.4616469417099878, "eval_loss": 1.7267277988732628, "eval_acc": 0.46153846153846156, "ppl": 5.622226719529882, "w_freq": 0.00038247254425608033, "w_bigram": 0.0004838296631879124, "w_trigram": 0.00031333466511156654, "w_skip_bi": 0.38464589601824545, "w_skip_tri": 0.55, "w_neural_phoneme": 0.3507923324885186, "w_neural_word": 0.3507842421818335, "word_vocab": 5752, "elapsed_s": 196.0739209651947, "steps_per_sec": 1483.1447168928769}, {"sent": 20000, "train_loss": 1.8248699290471841, "train_acc": 0.4760111493298541, "eval_loss": 1.4147613475506724, "eval_acc": 0.5585585585585585, "ppl": 4.115504173613433, "w_freq": 0.000288660021262548, "w_bigram": 0.013234249848771156, "w_trigram": 0.04723915440803704, "w_skip_bi": 0.21981749405887852, "w_skip_tri": 0.5492620941688723, "w_neural_phoneme": 0.3508149228116177, "w_neural_word": 0.350867933031737, "word_vocab": 6098, "elapsed_s": 218.57639145851135, "steps_per_sec": 1484.74406515033}, {"sent": 22000, "train_loss": 1.859303542487796, "train_acc": 0.4664312020769184, "eval_loss": 1.9223074086263836, "eval_acc": 0.37681159420289856, "ppl": 6.836715379527306, "w_freq": 0.0004853969397382425, "w_bigram": 0.0022979376559019654, "w_trigram": 0.03038502034964991, "w_skip_bi": 0.321226650084887, "w_skip_tri": 0.55, "w_neural_phoneme": 0.3528267656705988, "w_neural_word": 0.35324112850123973, "word_vocab": 6393, "elapsed_s": 240.77224731445312, "steps_per_sec": 1485.4535935484894}, {"sent": 24000, "train_loss": 1.8658042247479767, "train_acc": 0.4647563340015116, "eval_loss": 1.571835950298054, "eval_acc": 0.4606741573033708, "ppl": 4.815481066836054, "w_freq": 0.0003947745855737373, "w_bigram": 0.0021288640814372695, "w_trigram": 0.008892850994688641, "w_skip_bi": 0.2151799741193014, "w_skip_tri": 0.5494586444588437, "w_neural_phoneme": 0.35164240574284245, "w_neural_word": 0.35154536242438766, "word_vocab": 6673, "elapsed_s": 261.119859457016, "steps_per_sec": 1486.2408428336512}, {"sent": 26000, "train_loss": 1.9037415796300843, "train_acc": 0.4523525999206131, "eval_loss": 1.9425843992588354, "eval_acc": 0.45161290322580644, "ppl": 6.976758420685662, "w_freq": 0.0006006081329066348, "w_bigram": 0.0005690353716866797, "w_trigram": 0.0013654439743136914, "w_skip_bi": 0.2776214065459763, "w_skip_tri": 0.5499870923599193, "w_neural_phoneme": 0.351135376628905, "w_neural_word": 0.35107115587949034, "word_vocab": 6984, "elapsed_s": 282.8300018310547, "steps_per_sec": 1487.9538849325568}, {"sent": 28000, "train_loss": 2.082350984559117, "train_acc": 0.4174616482744556, "eval_loss": 1.81444532469722, "eval_acc": 0.4539877300613497, "ppl": 6.137670818678332, "w_freq": 0.0004568467129081488, "w_bigram": 0.0013958726076375811, "w_trigram": 0.1025999549684254, "w_skip_bi": 0.0898673705321814, "w_skip_tri": 0.5449725158155078, "w_neural_phoneme": 0.3510743381651484, "w_neural_word": 0.3508859956298796, "word_vocab": 7648, "elapsed_s": 311.79852175712585, "steps_per_sec": 1491.2482502472724}, {"sent": 30000, "train_loss": 2.1732246622767892, "train_acc": 0.39509158067095695, "eval_loss": 1.8401622981332397, "eval_acc": 0.40397350993377484, "ppl": 6.297560260364343, "w_freq": 0.0007952189097450425, "w_bigram": 0.0036082508640084884, "w_trigram": 0.06551654636633653, "w_skip_bi": 0.08166040334936842, "w_skip_tri": 0.5358785756164435, "w_neural_phoneme": 0.3499206204808939, "w_neural_word": 0.3499055848770112, "word_vocab": 8515, "elapsed_s": 346.07197523117065, "steps_per_sec": 1495.3276689172076}, {"sent": 32000, "train_loss": 2.1405475605529576, "train_acc": 0.3960335077855372, "eval_loss": 1.631776288293821, "eval_acc": 0.49572649572649574, "ppl": 5.112948728095009, "w_freq": 0.00017931807862246708, "w_bigram": 0.0003158384002599147, "w_trigram": 0.03999761261350022, "w_skip_bi": 0.1859542926743709, "w_skip_tri": 0.5764628643819252, "w_neural_phoneme": 0.34240172448767076, "w_neural_word": 0.3423426166280084, "word_vocab": 9486, "elapsed_s": 386.3890173435211, "steps_per_sec": 1499.0281141584628}, {"sent": 34000, "train_loss": 2.1376852612836825, "train_acc": 0.39764329257909614, "eval_loss": 1.742513397956904, "eval_acc": 0.44155844155844154, "ppl": 5.711681124617898, "w_freq": 0.0001245063290761764, "w_bigram": 0.00016668010508834847, "w_trigram": 0.04930964258637601, "w_skip_bi": 0.12497648242560751, "w_skip_tri": 0.5939806870363084, "w_neural_phoneme": 0.33643750059565924, "w_neural_word": 0.3364241947052025, "word_vocab": 10546, "elapsed_s": 424.8360140323639, "steps_per_sec": 1501.6005680521293}], "mixing_weights": {"w_freq": 0.0001245063290761764, "w_bigram": 0.00016668010508834847, "w_trigram": 0.04930964258637601, "w_skip_bi": 0.12497648242560751, "w_skip_tri": 0.5939806870363084, "w_neural_phoneme": 0.33643750059565924, "w_neural_word": 0.3364241947052025}, "word_vocab": 10546, "elapsed_s": 424.8360140323639, "steps_per_sec": 1501.6005680521293}