pj-mathematician's picture
Add files using upload-large-folder tool
8fd808f verified
Invalid JSON: Unexpected token 'I', ..."ad_norm": Infinity, "... is not valid JSON
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 1.6502057613168724,
"eval_steps": 200,
"global_step": 200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.00823045267489712,
"grad_norm": null,
"learning_rate": 0.0,
"loss": 4.3088,
"step": 1
},
{
"epoch": 0.823045267489712,
"grad_norm": 3.1721928119659424,
"learning_rate": 4.4163763066202094e-05,
"loss": 1.9026,
"step": 100
},
{
"epoch": 1.6502057613168724,
"grad_norm": 2.9604015350341797,
"learning_rate": 3.5452961672473864e-05,
"loss": 0.9336,
"step": 200
},
{
"epoch": 1.6502057613168724,
"eval_full_de_cosine_accuracy@1": 0.2955665024630542,
"eval_full_de_cosine_accuracy@100": 0.9901477832512315,
"eval_full_de_cosine_accuracy@150": 0.9901477832512315,
"eval_full_de_cosine_accuracy@20": 0.9852216748768473,
"eval_full_de_cosine_accuracy@200": 0.9901477832512315,
"eval_full_de_cosine_accuracy@50": 0.9852216748768473,
"eval_full_de_cosine_map@1": 0.2955665024630542,
"eval_full_de_cosine_map@100": 0.3618162919366333,
"eval_full_de_cosine_map@150": 0.37673093284239206,
"eval_full_de_cosine_map@20": 0.3952556219642319,
"eval_full_de_cosine_map@200": 0.3850375691141728,
"eval_full_de_cosine_map@50": 0.3565895386599598,
"eval_full_de_cosine_map@500": 0.3976475131909832,
"eval_full_de_cosine_mrr@1": 0.2955665024630542,
"eval_full_de_cosine_mrr@100": 0.5141580130059386,
"eval_full_de_cosine_mrr@150": 0.5141580130059386,
"eval_full_de_cosine_mrr@20": 0.5140785596450613,
"eval_full_de_cosine_mrr@200": 0.5141580130059386,
"eval_full_de_cosine_mrr@50": 0.5140785596450613,
"eval_full_de_cosine_ndcg@1": 0.2955665024630542,
"eval_full_de_cosine_ndcg@100": 0.5568512483442096,
"eval_full_de_cosine_ndcg@150": 0.5891923427833955,
"eval_full_de_cosine_ndcg@20": 0.5342874353496432,
"eval_full_de_cosine_ndcg@200": 0.6108910915140433,
"eval_full_de_cosine_ndcg@50": 0.5251712513704461,
"eval_full_de_cosine_precision@1": 0.2955665024630542,
"eval_full_de_cosine_precision@100": 0.24177339901477832,
"eval_full_de_cosine_precision@150": 0.18187192118226603,
"eval_full_de_cosine_precision@20": 0.5073891625615764,
"eval_full_de_cosine_precision@200": 0.1470689655172414,
"eval_full_de_cosine_precision@50": 0.3681773399014779,
"eval_full_de_cosine_recall@1": 0.01108543831680986,
"eval_full_de_cosine_recall@100": 0.6244233924508789,
"eval_full_de_cosine_recall@150": 0.687486468465792,
"eval_full_de_cosine_recall@20": 0.31887986522832873,
"eval_full_de_cosine_recall@200": 0.7334854348170513,
"eval_full_de_cosine_recall@50": 0.5004342335550164,
"eval_full_en_cosine_accuracy@1": 0.6571428571428571,
"eval_full_en_cosine_accuracy@100": 0.9904761904761905,
"eval_full_en_cosine_accuracy@150": 0.9904761904761905,
"eval_full_en_cosine_accuracy@20": 0.9904761904761905,
"eval_full_en_cosine_accuracy@200": 0.9904761904761905,
"eval_full_en_cosine_accuracy@50": 0.9904761904761905,
"eval_full_en_cosine_map@1": 0.6571428571428571,
"eval_full_en_cosine_map@100": 0.5799091076338031,
"eval_full_en_cosine_map@150": 0.5895042547793764,
"eval_full_en_cosine_map@20": 0.5516314386214587,
"eval_full_en_cosine_map@200": 0.5930550248640567,
"eval_full_en_cosine_map@50": 0.5474217433291914,
"eval_full_en_cosine_map@500": 0.5967311945998978,
"eval_full_en_cosine_mrr@1": 0.6571428571428571,
"eval_full_en_cosine_mrr@100": 0.8111111111111111,
"eval_full_en_cosine_mrr@150": 0.8111111111111111,
"eval_full_en_cosine_mrr@20": 0.8111111111111111,
"eval_full_en_cosine_mrr@200": 0.8111111111111111,
"eval_full_en_cosine_mrr@50": 0.8111111111111111,
"eval_full_en_cosine_ndcg@1": 0.6571428571428571,
"eval_full_en_cosine_ndcg@100": 0.7690946845916871,
"eval_full_en_cosine_ndcg@150": 0.7923061459636489,
"eval_full_en_cosine_ndcg@20": 0.6923506957704934,
"eval_full_en_cosine_ndcg@200": 0.8023952171736648,
"eval_full_en_cosine_ndcg@50": 0.7170311913169547,
"eval_full_en_cosine_precision@1": 0.6571428571428571,
"eval_full_en_cosine_precision@100": 0.18971428571428572,
"eval_full_en_cosine_precision@150": 0.13619047619047617,
"eval_full_en_cosine_precision@20": 0.5133333333333332,
"eval_full_en_cosine_precision@200": 0.10561904761904761,
"eval_full_en_cosine_precision@50": 0.3169523809523809,
"eval_full_en_cosine_recall@1": 0.06695957251887064,
"eval_full_en_cosine_recall@100": 0.8467073011936345,
"eval_full_en_cosine_recall@150": 0.9010846211520122,
"eval_full_en_cosine_recall@20": 0.5478306503729546,
"eval_full_en_cosine_recall@200": 0.9256595392715059,
"eval_full_en_cosine_recall@50": 0.7470276357469449,
"eval_full_es_cosine_accuracy@1": 0.11891891891891893,
"eval_full_es_cosine_accuracy@100": 1.0,
"eval_full_es_cosine_accuracy@150": 1.0,
"eval_full_es_cosine_accuracy@20": 1.0,
"eval_full_es_cosine_accuracy@200": 1.0,
"eval_full_es_cosine_accuracy@50": 1.0,
"eval_full_es_cosine_map@1": 0.11891891891891893,
"eval_full_es_cosine_map@100": 0.43522297182400527,
"eval_full_es_cosine_map@150": 0.4511056582755023,
"eval_full_es_cosine_map@20": 0.4839539531842883,
"eval_full_es_cosine_map@200": 0.45802493743471273,
"eval_full_es_cosine_map@50": 0.4288206349412292,
"eval_full_es_cosine_map@500": 0.47075604946048677,
"eval_full_es_cosine_mrr@1": 0.11891891891891893,
"eval_full_es_cosine_mrr@100": 0.5554054054054054,
"eval_full_es_cosine_mrr@150": 0.5554054054054054,
"eval_full_es_cosine_mrr@20": 0.5554054054054054,
"eval_full_es_cosine_mrr@200": 0.5554054054054054,
"eval_full_es_cosine_mrr@50": 0.5554054054054054,
"eval_full_es_cosine_ndcg@1": 0.11891891891891893,
"eval_full_es_cosine_ndcg@100": 0.6196114606257926,
"eval_full_es_cosine_ndcg@150": 0.6530674955405338,
"eval_full_es_cosine_ndcg@20": 0.6158554243812342,
"eval_full_es_cosine_ndcg@200": 0.670287400819268,
"eval_full_es_cosine_ndcg@50": 0.5886857089260162,
"eval_full_es_cosine_precision@1": 0.11891891891891893,
"eval_full_es_cosine_precision@100": 0.2541621621621622,
"eval_full_es_cosine_precision@150": 0.19225225225225226,
"eval_full_es_cosine_precision@20": 0.5767567567567567,
"eval_full_es_cosine_precision@200": 0.15264864864864866,
"eval_full_es_cosine_precision@50": 0.3907027027027027,
"eval_full_es_cosine_recall@1": 0.0035436931012884127,
"eval_full_es_cosine_recall@100": 0.6836436316189977,
"eval_full_es_cosine_recall@150": 0.7496865406970199,
"eval_full_es_cosine_recall@20": 0.3862419782331355,
"eval_full_es_cosine_recall@200": 0.7852629043380305,
"eval_full_es_cosine_recall@50": 0.5625768407738393,
"eval_full_zh_cosine_accuracy@1": 0.6601941747572816,
"eval_full_zh_cosine_accuracy@100": 0.9902912621359223,
"eval_full_zh_cosine_accuracy@150": 0.9902912621359223,
"eval_full_zh_cosine_accuracy@20": 0.9902912621359223,
"eval_full_zh_cosine_accuracy@200": 0.9902912621359223,
"eval_full_zh_cosine_accuracy@50": 0.9902912621359223,
"eval_full_zh_cosine_map@1": 0.6601941747572816,
"eval_full_zh_cosine_map@100": 0.5346277197767966,
"eval_full_zh_cosine_map@150": 0.5441006347287816,
"eval_full_zh_cosine_map@20": 0.5176817014415404,
"eval_full_zh_cosine_map@200": 0.547804939644668,
"eval_full_zh_cosine_map@50": 0.5050961591489588,
"eval_full_zh_cosine_map@500": 0.5524877228701637,
"eval_full_zh_cosine_mrr@1": 0.6601941747572816,
"eval_full_zh_cosine_mrr@100": 0.8068423485899215,
"eval_full_zh_cosine_mrr@150": 0.8068423485899215,
"eval_full_zh_cosine_mrr@20": 0.8068423485899215,
"eval_full_zh_cosine_mrr@200": 0.8068423485899215,
"eval_full_zh_cosine_mrr@50": 0.8068423485899215,
"eval_full_zh_cosine_ndcg@1": 0.6601941747572816,
"eval_full_zh_cosine_ndcg@100": 0.7344118850318737,
"eval_full_zh_cosine_ndcg@150": 0.7580048379992059,
"eval_full_zh_cosine_ndcg@20": 0.6629898844211244,
"eval_full_zh_cosine_ndcg@200": 0.769464510105362,
"eval_full_zh_cosine_ndcg@50": 0.682216395408567,
"eval_full_zh_cosine_precision@1": 0.6601941747572816,
"eval_full_zh_cosine_precision@100": 0.17902912621359218,
"eval_full_zh_cosine_precision@150": 0.12912621359223303,
"eval_full_zh_cosine_precision@20": 0.4868932038834952,
"eval_full_zh_cosine_precision@200": 0.10063106796116503,
"eval_full_zh_cosine_precision@50": 0.2959223300970874,
"eval_full_zh_cosine_recall@1": 0.06669332811942774,
"eval_full_zh_cosine_recall@100": 0.813864097315397,
"eval_full_zh_cosine_recall@150": 0.8683619147921042,
"eval_full_zh_cosine_recall@20": 0.52040897323663,
"eval_full_zh_cosine_recall@200": 0.8964210248615742,
"eval_full_zh_cosine_recall@50": 0.7067236634036261,
"eval_mix_de_cosine_accuracy@1": 0.642225689027561,
"eval_mix_de_cosine_accuracy@100": 0.9771190847633905,
"eval_mix_de_cosine_accuracy@150": 0.984919396775871,
"eval_mix_de_cosine_accuracy@20": 0.9240769630785232,
"eval_mix_de_cosine_accuracy@200": 0.9901196047841914,
"eval_mix_de_cosine_accuracy@50": 0.9635985439417577,
"eval_mix_de_cosine_map@1": 0.642225689027561,
"eval_mix_de_cosine_map@100": 0.6570111325791598,
"eval_mix_de_cosine_map@150": 0.6572712744212402,
"eval_mix_de_cosine_map@20": 0.6521189972338849,
"eval_mix_de_cosine_map@200": 0.6574012324541948,
"eval_mix_de_cosine_map@50": 0.6561813596290409,
"eval_mix_de_cosine_map@500": 0.6575399010277455,
"eval_mix_de_cosine_mrr@1": 0.642225689027561,
"eval_mix_de_cosine_mrr@100": 0.7262168772880452,
"eval_mix_de_cosine_mrr@150": 0.7262822017289415,
"eval_mix_de_cosine_mrr@20": 0.7246816496840639,
"eval_mix_de_cosine_mrr@200": 0.7263128860080087,
"eval_mix_de_cosine_mrr@50": 0.7260235454700952,
"eval_mix_de_cosine_ndcg@1": 0.642225689027561,
"eval_mix_de_cosine_ndcg@100": 0.7547612967303503,
"eval_mix_de_cosine_ndcg@150": 0.7575184392863841,
"eval_mix_de_cosine_ndcg@20": 0.7332013199323174,
"eval_mix_de_cosine_ndcg@200": 0.7593986816807992,
"eval_mix_de_cosine_ndcg@50": 0.7490333180034867,
"eval_mix_de_cosine_precision@1": 0.642225689027561,
"eval_mix_de_cosine_precision@100": 0.0261622464898596,
"eval_mix_de_cosine_precision@150": 0.01770844167100017,
"eval_mix_de_cosine_precision@20": 0.11911076443057722,
"eval_mix_de_cosine_precision@200": 0.013424336973478942,
"eval_mix_de_cosine_precision@50": 0.05086843473738951,
"eval_mix_de_cosine_recall@1": 0.2405616224648986,
"eval_mix_de_cosine_recall@100": 0.9480412549835328,
"eval_mix_de_cosine_recall@150": 0.9618651412723176,
"eval_mix_de_cosine_recall@20": 0.8650459351707401,
"eval_mix_de_cosine_recall@200": 0.9720922170220142,
"eval_mix_de_cosine_recall@50": 0.9226295718495406,
"eval_mix_es_cosine_accuracy@1": 0.7009880395215808,
"eval_mix_es_cosine_accuracy@100": 0.9885595423816953,
"eval_mix_es_cosine_accuracy@150": 0.9921996879875195,
"eval_mix_es_cosine_accuracy@20": 0.9474778991159646,
"eval_mix_es_cosine_accuracy@200": 0.9932397295891836,
"eval_mix_es_cosine_accuracy@50": 0.9776391055642226,
"eval_mix_es_cosine_map@1": 0.7009880395215808,
"eval_mix_es_cosine_map@100": 0.6984889579958145,
"eval_mix_es_cosine_map@150": 0.6986621032108891,
"eval_mix_es_cosine_map@20": 0.6938173897965141,
"eval_mix_es_cosine_map@200": 0.6987465392575996,
"eval_mix_es_cosine_map@50": 0.6978248868009254,
"eval_mix_es_cosine_map@500": 0.6988876342368443,
"eval_mix_es_cosine_mrr@1": 0.7009880395215808,
"eval_mix_es_cosine_mrr@100": 0.7724347923967887,
"eval_mix_es_cosine_mrr@150": 0.7724644404043258,
"eval_mix_es_cosine_mrr@20": 0.7712491671812917,
"eval_mix_es_cosine_mrr@200": 0.7724705526191206,
"eval_mix_es_cosine_mrr@50": 0.7722842539435679,
"eval_mix_es_cosine_ndcg@1": 0.7009880395215808,
"eval_mix_es_cosine_ndcg@100": 0.7884317468596705,
"eval_mix_es_cosine_ndcg@150": 0.7902844804245556,
"eval_mix_es_cosine_ndcg@20": 0.7690336236998598,
"eval_mix_es_cosine_ndcg@200": 0.7913994944724545,
"eval_mix_es_cosine_ndcg@50": 0.7838732562697655,
"eval_mix_es_cosine_precision@1": 0.7009880395215808,
"eval_mix_es_cosine_precision@100": 0.02598543941757671,
"eval_mix_es_cosine_precision@150": 0.017493499739989597,
"eval_mix_es_cosine_precision@20": 0.11968278731149247,
"eval_mix_es_cosine_precision@200": 0.013198127925117008,
"eval_mix_es_cosine_precision@50": 0.05085803432137287,
"eval_mix_es_cosine_recall@1": 0.27067577941212884,
"eval_mix_es_cosine_recall@100": 0.9599497313225862,
"eval_mix_es_cosine_recall@150": 0.9695527821112844,
"eval_mix_es_cosine_recall@20": 0.8850840700294678,
"eval_mix_es_cosine_recall@200": 0.9758970358814353,
"eval_mix_es_cosine_recall@50": 0.9390968972092216,
"eval_mix_zh_cosine_accuracy@1": 0.7713987473903967,
"eval_mix_zh_cosine_accuracy@100": 0.9947807933194155,
"eval_mix_zh_cosine_accuracy@150": 0.9963465553235908,
"eval_mix_zh_cosine_accuracy@20": 0.9806889352818372,
"eval_mix_zh_cosine_accuracy@200": 0.9973903966597077,
"eval_mix_zh_cosine_accuracy@50": 0.9916492693110647,
"eval_mix_zh_cosine_map@1": 0.7713987473903967,
"eval_mix_zh_cosine_map@100": 0.6981100717727863,
"eval_mix_zh_cosine_map@150": 0.6982601227257159,
"eval_mix_zh_cosine_map@20": 0.6929147114308428,
"eval_mix_zh_cosine_map@200": 0.6983171494463136,
"eval_mix_zh_cosine_map@50": 0.6972607407491801,
"eval_mix_zh_cosine_map@500": 0.6984116893552017,
"eval_mix_zh_cosine_mrr@1": 0.7713987473903967,
"eval_mix_zh_cosine_mrr@100": 0.8436803457907981,
"eval_mix_zh_cosine_mrr@150": 0.8436922193976949,
"eval_mix_zh_cosine_mrr@20": 0.8432785828350186,
"eval_mix_zh_cosine_mrr@200": 0.8436986631082636,
"eval_mix_zh_cosine_mrr@50": 0.8436385628906108,
"eval_mix_zh_cosine_ndcg@1": 0.7713987473903967,
"eval_mix_zh_cosine_ndcg@100": 0.8115576206060865,
"eval_mix_zh_cosine_ndcg@150": 0.8129087269558002,
"eval_mix_zh_cosine_ndcg@20": 0.7926986810043013,
"eval_mix_zh_cosine_ndcg@200": 0.8135973837485255,
"eval_mix_zh_cosine_ndcg@50": 0.8066848794942646,
"eval_mix_zh_cosine_precision@1": 0.7713987473903967,
"eval_mix_zh_cosine_precision@100": 0.02944676409185805,
"eval_mix_zh_cosine_precision@150": 0.0197633959638135,
"eval_mix_zh_cosine_precision@20": 0.13656054279749477,
"eval_mix_zh_cosine_precision@200": 0.014877348643006268,
"eval_mix_zh_cosine_precision@50": 0.05762004175365346,
"eval_mix_zh_cosine_recall@1": 0.2585731683069888,
"eval_mix_zh_cosine_recall@100": 0.9715031315240084,
"eval_mix_zh_cosine_recall@150": 0.9781576200417537,
"eval_mix_zh_cosine_recall@20": 0.9014352818371607,
"eval_mix_zh_cosine_recall@200": 0.9818110647181629,
"eval_mix_zh_cosine_recall@50": 0.950347947112039,
"eval_runtime": 11.3241,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.8135973837485255,
"eval_steps_per_second": 0.0,
"step": 200
}
],
"logging_steps": 100,
"max_steps": 605,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 4.5625697398559293e+18,
"train_batch_size": 128,
"trial_name": null,
"trial_params": null
}