Invalid JSON: Unexpected token 'I', ..."ad_norm": Infinity,
"... is not valid JSON
| { | |
| "best_global_step": null, | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 1.6502057613168724, | |
| "eval_steps": 200, | |
| "global_step": 200, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.00823045267489712, | |
| "grad_norm": null, | |
| "learning_rate": 0.0, | |
| "loss": 4.3088, | |
| "step": 1 | |
| }, | |
| { | |
| "epoch": 0.823045267489712, | |
| "grad_norm": 3.1721928119659424, | |
| "learning_rate": 4.4163763066202094e-05, | |
| "loss": 1.9026, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 1.6502057613168724, | |
| "grad_norm": 2.9604015350341797, | |
| "learning_rate": 3.5452961672473864e-05, | |
| "loss": 0.9336, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 1.6502057613168724, | |
| "eval_full_de_cosine_accuracy@1": 0.2955665024630542, | |
| "eval_full_de_cosine_accuracy@100": 0.9901477832512315, | |
| "eval_full_de_cosine_accuracy@150": 0.9901477832512315, | |
| "eval_full_de_cosine_accuracy@20": 0.9852216748768473, | |
| "eval_full_de_cosine_accuracy@200": 0.9901477832512315, | |
| "eval_full_de_cosine_accuracy@50": 0.9852216748768473, | |
| "eval_full_de_cosine_map@1": 0.2955665024630542, | |
| "eval_full_de_cosine_map@100": 0.3618162919366333, | |
| "eval_full_de_cosine_map@150": 0.37673093284239206, | |
| "eval_full_de_cosine_map@20": 0.3952556219642319, | |
| "eval_full_de_cosine_map@200": 0.3850375691141728, | |
| "eval_full_de_cosine_map@50": 0.3565895386599598, | |
| "eval_full_de_cosine_map@500": 0.3976475131909832, | |
| "eval_full_de_cosine_mrr@1": 0.2955665024630542, | |
| "eval_full_de_cosine_mrr@100": 0.5141580130059386, | |
| "eval_full_de_cosine_mrr@150": 0.5141580130059386, | |
| "eval_full_de_cosine_mrr@20": 0.5140785596450613, | |
| "eval_full_de_cosine_mrr@200": 0.5141580130059386, | |
| "eval_full_de_cosine_mrr@50": 0.5140785596450613, | |
| "eval_full_de_cosine_ndcg@1": 0.2955665024630542, | |
| "eval_full_de_cosine_ndcg@100": 0.5568512483442096, | |
| "eval_full_de_cosine_ndcg@150": 0.5891923427833955, | |
| "eval_full_de_cosine_ndcg@20": 0.5342874353496432, | |
| "eval_full_de_cosine_ndcg@200": 0.6108910915140433, | |
| "eval_full_de_cosine_ndcg@50": 0.5251712513704461, | |
| "eval_full_de_cosine_precision@1": 0.2955665024630542, | |
| "eval_full_de_cosine_precision@100": 0.24177339901477832, | |
| "eval_full_de_cosine_precision@150": 0.18187192118226603, | |
| "eval_full_de_cosine_precision@20": 0.5073891625615764, | |
| "eval_full_de_cosine_precision@200": 0.1470689655172414, | |
| "eval_full_de_cosine_precision@50": 0.3681773399014779, | |
| "eval_full_de_cosine_recall@1": 0.01108543831680986, | |
| "eval_full_de_cosine_recall@100": 0.6244233924508789, | |
| "eval_full_de_cosine_recall@150": 0.687486468465792, | |
| "eval_full_de_cosine_recall@20": 0.31887986522832873, | |
| "eval_full_de_cosine_recall@200": 0.7334854348170513, | |
| "eval_full_de_cosine_recall@50": 0.5004342335550164, | |
| "eval_full_en_cosine_accuracy@1": 0.6571428571428571, | |
| "eval_full_en_cosine_accuracy@100": 0.9904761904761905, | |
| "eval_full_en_cosine_accuracy@150": 0.9904761904761905, | |
| "eval_full_en_cosine_accuracy@20": 0.9904761904761905, | |
| "eval_full_en_cosine_accuracy@200": 0.9904761904761905, | |
| "eval_full_en_cosine_accuracy@50": 0.9904761904761905, | |
| "eval_full_en_cosine_map@1": 0.6571428571428571, | |
| "eval_full_en_cosine_map@100": 0.5799091076338031, | |
| "eval_full_en_cosine_map@150": 0.5895042547793764, | |
| "eval_full_en_cosine_map@20": 0.5516314386214587, | |
| "eval_full_en_cosine_map@200": 0.5930550248640567, | |
| "eval_full_en_cosine_map@50": 0.5474217433291914, | |
| "eval_full_en_cosine_map@500": 0.5967311945998978, | |
| "eval_full_en_cosine_mrr@1": 0.6571428571428571, | |
| "eval_full_en_cosine_mrr@100": 0.8111111111111111, | |
| "eval_full_en_cosine_mrr@150": 0.8111111111111111, | |
| "eval_full_en_cosine_mrr@20": 0.8111111111111111, | |
| "eval_full_en_cosine_mrr@200": 0.8111111111111111, | |
| "eval_full_en_cosine_mrr@50": 0.8111111111111111, | |
| "eval_full_en_cosine_ndcg@1": 0.6571428571428571, | |
| "eval_full_en_cosine_ndcg@100": 0.7690946845916871, | |
| "eval_full_en_cosine_ndcg@150": 0.7923061459636489, | |
| "eval_full_en_cosine_ndcg@20": 0.6923506957704934, | |
| "eval_full_en_cosine_ndcg@200": 0.8023952171736648, | |
| "eval_full_en_cosine_ndcg@50": 0.7170311913169547, | |
| "eval_full_en_cosine_precision@1": 0.6571428571428571, | |
| "eval_full_en_cosine_precision@100": 0.18971428571428572, | |
| "eval_full_en_cosine_precision@150": 0.13619047619047617, | |
| "eval_full_en_cosine_precision@20": 0.5133333333333332, | |
| "eval_full_en_cosine_precision@200": 0.10561904761904761, | |
| "eval_full_en_cosine_precision@50": 0.3169523809523809, | |
| "eval_full_en_cosine_recall@1": 0.06695957251887064, | |
| "eval_full_en_cosine_recall@100": 0.8467073011936345, | |
| "eval_full_en_cosine_recall@150": 0.9010846211520122, | |
| "eval_full_en_cosine_recall@20": 0.5478306503729546, | |
| "eval_full_en_cosine_recall@200": 0.9256595392715059, | |
| "eval_full_en_cosine_recall@50": 0.7470276357469449, | |
| "eval_full_es_cosine_accuracy@1": 0.11891891891891893, | |
| "eval_full_es_cosine_accuracy@100": 1.0, | |
| "eval_full_es_cosine_accuracy@150": 1.0, | |
| "eval_full_es_cosine_accuracy@20": 1.0, | |
| "eval_full_es_cosine_accuracy@200": 1.0, | |
| "eval_full_es_cosine_accuracy@50": 1.0, | |
| "eval_full_es_cosine_map@1": 0.11891891891891893, | |
| "eval_full_es_cosine_map@100": 0.43522297182400527, | |
| "eval_full_es_cosine_map@150": 0.4511056582755023, | |
| "eval_full_es_cosine_map@20": 0.4839539531842883, | |
| "eval_full_es_cosine_map@200": 0.45802493743471273, | |
| "eval_full_es_cosine_map@50": 0.4288206349412292, | |
| "eval_full_es_cosine_map@500": 0.47075604946048677, | |
| "eval_full_es_cosine_mrr@1": 0.11891891891891893, | |
| "eval_full_es_cosine_mrr@100": 0.5554054054054054, | |
| "eval_full_es_cosine_mrr@150": 0.5554054054054054, | |
| "eval_full_es_cosine_mrr@20": 0.5554054054054054, | |
| "eval_full_es_cosine_mrr@200": 0.5554054054054054, | |
| "eval_full_es_cosine_mrr@50": 0.5554054054054054, | |
| "eval_full_es_cosine_ndcg@1": 0.11891891891891893, | |
| "eval_full_es_cosine_ndcg@100": 0.6196114606257926, | |
| "eval_full_es_cosine_ndcg@150": 0.6530674955405338, | |
| "eval_full_es_cosine_ndcg@20": 0.6158554243812342, | |
| "eval_full_es_cosine_ndcg@200": 0.670287400819268, | |
| "eval_full_es_cosine_ndcg@50": 0.5886857089260162, | |
| "eval_full_es_cosine_precision@1": 0.11891891891891893, | |
| "eval_full_es_cosine_precision@100": 0.2541621621621622, | |
| "eval_full_es_cosine_precision@150": 0.19225225225225226, | |
| "eval_full_es_cosine_precision@20": 0.5767567567567567, | |
| "eval_full_es_cosine_precision@200": 0.15264864864864866, | |
| "eval_full_es_cosine_precision@50": 0.3907027027027027, | |
| "eval_full_es_cosine_recall@1": 0.0035436931012884127, | |
| "eval_full_es_cosine_recall@100": 0.6836436316189977, | |
| "eval_full_es_cosine_recall@150": 0.7496865406970199, | |
| "eval_full_es_cosine_recall@20": 0.3862419782331355, | |
| "eval_full_es_cosine_recall@200": 0.7852629043380305, | |
| "eval_full_es_cosine_recall@50": 0.5625768407738393, | |
| "eval_full_zh_cosine_accuracy@1": 0.6601941747572816, | |
| "eval_full_zh_cosine_accuracy@100": 0.9902912621359223, | |
| "eval_full_zh_cosine_accuracy@150": 0.9902912621359223, | |
| "eval_full_zh_cosine_accuracy@20": 0.9902912621359223, | |
| "eval_full_zh_cosine_accuracy@200": 0.9902912621359223, | |
| "eval_full_zh_cosine_accuracy@50": 0.9902912621359223, | |
| "eval_full_zh_cosine_map@1": 0.6601941747572816, | |
| "eval_full_zh_cosine_map@100": 0.5346277197767966, | |
| "eval_full_zh_cosine_map@150": 0.5441006347287816, | |
| "eval_full_zh_cosine_map@20": 0.5176817014415404, | |
| "eval_full_zh_cosine_map@200": 0.547804939644668, | |
| "eval_full_zh_cosine_map@50": 0.5050961591489588, | |
| "eval_full_zh_cosine_map@500": 0.5524877228701637, | |
| "eval_full_zh_cosine_mrr@1": 0.6601941747572816, | |
| "eval_full_zh_cosine_mrr@100": 0.8068423485899215, | |
| "eval_full_zh_cosine_mrr@150": 0.8068423485899215, | |
| "eval_full_zh_cosine_mrr@20": 0.8068423485899215, | |
| "eval_full_zh_cosine_mrr@200": 0.8068423485899215, | |
| "eval_full_zh_cosine_mrr@50": 0.8068423485899215, | |
| "eval_full_zh_cosine_ndcg@1": 0.6601941747572816, | |
| "eval_full_zh_cosine_ndcg@100": 0.7344118850318737, | |
| "eval_full_zh_cosine_ndcg@150": 0.7580048379992059, | |
| "eval_full_zh_cosine_ndcg@20": 0.6629898844211244, | |
| "eval_full_zh_cosine_ndcg@200": 0.769464510105362, | |
| "eval_full_zh_cosine_ndcg@50": 0.682216395408567, | |
| "eval_full_zh_cosine_precision@1": 0.6601941747572816, | |
| "eval_full_zh_cosine_precision@100": 0.17902912621359218, | |
| "eval_full_zh_cosine_precision@150": 0.12912621359223303, | |
| "eval_full_zh_cosine_precision@20": 0.4868932038834952, | |
| "eval_full_zh_cosine_precision@200": 0.10063106796116503, | |
| "eval_full_zh_cosine_precision@50": 0.2959223300970874, | |
| "eval_full_zh_cosine_recall@1": 0.06669332811942774, | |
| "eval_full_zh_cosine_recall@100": 0.813864097315397, | |
| "eval_full_zh_cosine_recall@150": 0.8683619147921042, | |
| "eval_full_zh_cosine_recall@20": 0.52040897323663, | |
| "eval_full_zh_cosine_recall@200": 0.8964210248615742, | |
| "eval_full_zh_cosine_recall@50": 0.7067236634036261, | |
| "eval_mix_de_cosine_accuracy@1": 0.642225689027561, | |
| "eval_mix_de_cosine_accuracy@100": 0.9771190847633905, | |
| "eval_mix_de_cosine_accuracy@150": 0.984919396775871, | |
| "eval_mix_de_cosine_accuracy@20": 0.9240769630785232, | |
| "eval_mix_de_cosine_accuracy@200": 0.9901196047841914, | |
| "eval_mix_de_cosine_accuracy@50": 0.9635985439417577, | |
| "eval_mix_de_cosine_map@1": 0.642225689027561, | |
| "eval_mix_de_cosine_map@100": 0.6570111325791598, | |
| "eval_mix_de_cosine_map@150": 0.6572712744212402, | |
| "eval_mix_de_cosine_map@20": 0.6521189972338849, | |
| "eval_mix_de_cosine_map@200": 0.6574012324541948, | |
| "eval_mix_de_cosine_map@50": 0.6561813596290409, | |
| "eval_mix_de_cosine_map@500": 0.6575399010277455, | |
| "eval_mix_de_cosine_mrr@1": 0.642225689027561, | |
| "eval_mix_de_cosine_mrr@100": 0.7262168772880452, | |
| "eval_mix_de_cosine_mrr@150": 0.7262822017289415, | |
| "eval_mix_de_cosine_mrr@20": 0.7246816496840639, | |
| "eval_mix_de_cosine_mrr@200": 0.7263128860080087, | |
| "eval_mix_de_cosine_mrr@50": 0.7260235454700952, | |
| "eval_mix_de_cosine_ndcg@1": 0.642225689027561, | |
| "eval_mix_de_cosine_ndcg@100": 0.7547612967303503, | |
| "eval_mix_de_cosine_ndcg@150": 0.7575184392863841, | |
| "eval_mix_de_cosine_ndcg@20": 0.7332013199323174, | |
| "eval_mix_de_cosine_ndcg@200": 0.7593986816807992, | |
| "eval_mix_de_cosine_ndcg@50": 0.7490333180034867, | |
| "eval_mix_de_cosine_precision@1": 0.642225689027561, | |
| "eval_mix_de_cosine_precision@100": 0.0261622464898596, | |
| "eval_mix_de_cosine_precision@150": 0.01770844167100017, | |
| "eval_mix_de_cosine_precision@20": 0.11911076443057722, | |
| "eval_mix_de_cosine_precision@200": 0.013424336973478942, | |
| "eval_mix_de_cosine_precision@50": 0.05086843473738951, | |
| "eval_mix_de_cosine_recall@1": 0.2405616224648986, | |
| "eval_mix_de_cosine_recall@100": 0.9480412549835328, | |
| "eval_mix_de_cosine_recall@150": 0.9618651412723176, | |
| "eval_mix_de_cosine_recall@20": 0.8650459351707401, | |
| "eval_mix_de_cosine_recall@200": 0.9720922170220142, | |
| "eval_mix_de_cosine_recall@50": 0.9226295718495406, | |
| "eval_mix_es_cosine_accuracy@1": 0.7009880395215808, | |
| "eval_mix_es_cosine_accuracy@100": 0.9885595423816953, | |
| "eval_mix_es_cosine_accuracy@150": 0.9921996879875195, | |
| "eval_mix_es_cosine_accuracy@20": 0.9474778991159646, | |
| "eval_mix_es_cosine_accuracy@200": 0.9932397295891836, | |
| "eval_mix_es_cosine_accuracy@50": 0.9776391055642226, | |
| "eval_mix_es_cosine_map@1": 0.7009880395215808, | |
| "eval_mix_es_cosine_map@100": 0.6984889579958145, | |
| "eval_mix_es_cosine_map@150": 0.6986621032108891, | |
| "eval_mix_es_cosine_map@20": 0.6938173897965141, | |
| "eval_mix_es_cosine_map@200": 0.6987465392575996, | |
| "eval_mix_es_cosine_map@50": 0.6978248868009254, | |
| "eval_mix_es_cosine_map@500": 0.6988876342368443, | |
| "eval_mix_es_cosine_mrr@1": 0.7009880395215808, | |
| "eval_mix_es_cosine_mrr@100": 0.7724347923967887, | |
| "eval_mix_es_cosine_mrr@150": 0.7724644404043258, | |
| "eval_mix_es_cosine_mrr@20": 0.7712491671812917, | |
| "eval_mix_es_cosine_mrr@200": 0.7724705526191206, | |
| "eval_mix_es_cosine_mrr@50": 0.7722842539435679, | |
| "eval_mix_es_cosine_ndcg@1": 0.7009880395215808, | |
| "eval_mix_es_cosine_ndcg@100": 0.7884317468596705, | |
| "eval_mix_es_cosine_ndcg@150": 0.7902844804245556, | |
| "eval_mix_es_cosine_ndcg@20": 0.7690336236998598, | |
| "eval_mix_es_cosine_ndcg@200": 0.7913994944724545, | |
| "eval_mix_es_cosine_ndcg@50": 0.7838732562697655, | |
| "eval_mix_es_cosine_precision@1": 0.7009880395215808, | |
| "eval_mix_es_cosine_precision@100": 0.02598543941757671, | |
| "eval_mix_es_cosine_precision@150": 0.017493499739989597, | |
| "eval_mix_es_cosine_precision@20": 0.11968278731149247, | |
| "eval_mix_es_cosine_precision@200": 0.013198127925117008, | |
| "eval_mix_es_cosine_precision@50": 0.05085803432137287, | |
| "eval_mix_es_cosine_recall@1": 0.27067577941212884, | |
| "eval_mix_es_cosine_recall@100": 0.9599497313225862, | |
| "eval_mix_es_cosine_recall@150": 0.9695527821112844, | |
| "eval_mix_es_cosine_recall@20": 0.8850840700294678, | |
| "eval_mix_es_cosine_recall@200": 0.9758970358814353, | |
| "eval_mix_es_cosine_recall@50": 0.9390968972092216, | |
| "eval_mix_zh_cosine_accuracy@1": 0.7713987473903967, | |
| "eval_mix_zh_cosine_accuracy@100": 0.9947807933194155, | |
| "eval_mix_zh_cosine_accuracy@150": 0.9963465553235908, | |
| "eval_mix_zh_cosine_accuracy@20": 0.9806889352818372, | |
| "eval_mix_zh_cosine_accuracy@200": 0.9973903966597077, | |
| "eval_mix_zh_cosine_accuracy@50": 0.9916492693110647, | |
| "eval_mix_zh_cosine_map@1": 0.7713987473903967, | |
| "eval_mix_zh_cosine_map@100": 0.6981100717727863, | |
| "eval_mix_zh_cosine_map@150": 0.6982601227257159, | |
| "eval_mix_zh_cosine_map@20": 0.6929147114308428, | |
| "eval_mix_zh_cosine_map@200": 0.6983171494463136, | |
| "eval_mix_zh_cosine_map@50": 0.6972607407491801, | |
| "eval_mix_zh_cosine_map@500": 0.6984116893552017, | |
| "eval_mix_zh_cosine_mrr@1": 0.7713987473903967, | |
| "eval_mix_zh_cosine_mrr@100": 0.8436803457907981, | |
| "eval_mix_zh_cosine_mrr@150": 0.8436922193976949, | |
| "eval_mix_zh_cosine_mrr@20": 0.8432785828350186, | |
| "eval_mix_zh_cosine_mrr@200": 0.8436986631082636, | |
| "eval_mix_zh_cosine_mrr@50": 0.8436385628906108, | |
| "eval_mix_zh_cosine_ndcg@1": 0.7713987473903967, | |
| "eval_mix_zh_cosine_ndcg@100": 0.8115576206060865, | |
| "eval_mix_zh_cosine_ndcg@150": 0.8129087269558002, | |
| "eval_mix_zh_cosine_ndcg@20": 0.7926986810043013, | |
| "eval_mix_zh_cosine_ndcg@200": 0.8135973837485255, | |
| "eval_mix_zh_cosine_ndcg@50": 0.8066848794942646, | |
| "eval_mix_zh_cosine_precision@1": 0.7713987473903967, | |
| "eval_mix_zh_cosine_precision@100": 0.02944676409185805, | |
| "eval_mix_zh_cosine_precision@150": 0.0197633959638135, | |
| "eval_mix_zh_cosine_precision@20": 0.13656054279749477, | |
| "eval_mix_zh_cosine_precision@200": 0.014877348643006268, | |
| "eval_mix_zh_cosine_precision@50": 0.05762004175365346, | |
| "eval_mix_zh_cosine_recall@1": 0.2585731683069888, | |
| "eval_mix_zh_cosine_recall@100": 0.9715031315240084, | |
| "eval_mix_zh_cosine_recall@150": 0.9781576200417537, | |
| "eval_mix_zh_cosine_recall@20": 0.9014352818371607, | |
| "eval_mix_zh_cosine_recall@200": 0.9818110647181629, | |
| "eval_mix_zh_cosine_recall@50": 0.950347947112039, | |
| "eval_runtime": 11.3241, | |
| "eval_samples_per_second": 0.0, | |
| "eval_sequential_score": 0.8135973837485255, | |
| "eval_steps_per_second": 0.0, | |
| "step": 200 | |
| } | |
| ], | |
| "logging_steps": 100, | |
| "max_steps": 605, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 5, | |
| "save_steps": 200, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": false | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 4.5625697398559293e+18, | |
| "train_batch_size": 128, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |