diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..231325f65b3388ad6e7f516dc1a1e7c07e55a60c 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,27 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text 
+evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e5b3b6b47dc13112748bc8387500e81da895fe99 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", 
"prompt_name": "PALM_prompt", "bleu": 0.30792186288041745, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.022591197439731495}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07098986968617506, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020679786797452465}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3069347608020833, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. 
The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00517507368107689}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10294623137452774, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020587417894922925}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.031171214011889447, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009608900637588894}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14183320494534776, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. 
To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0033211715439776072}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04712663066068758, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012276103918669153}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06796024562406605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. 
The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019370776267962208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.29664082837766304, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005024240535996322}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09881593036325725, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001917130031576468}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0670791406212816, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. 
To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00196698409746432}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2878672957371347, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004800974945636242}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09698777350644844, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. 
The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019324455424936378}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4ebb759c6711580763c9e445563cca8be3a5321d --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5029735260771602, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. 
The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.037504230092449804}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.13619661582031448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0043020137724201464}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.316637398074897, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047970506632331504}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.15768658147508735, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. 
To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003494665966696393}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.06820976880895747, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029059822832858398}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15837063857057912, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. 
The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0034375560556260923}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.07782418733894164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0023362205542013246}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.12413525469005826, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0038754321440188466}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2992719822505979, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. 
To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004524889522002559}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.14491859595914175, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003065753619906709}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.12668637709059938, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. 
The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003967270717894955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3010027831236105, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004513515461941868}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.14722111353362036, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. 
The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0031421471913191945}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..105e04579e3ba74ddb2c93a57249b79cf0414838 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1677624908585186, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002227107904916062}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2596588931478101, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002997542713484213}, {"task_name": 
"GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1877757783616715, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002098472966964512}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03900987564301008, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009646264507463447}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06275053320845367, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016213745197323872}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04392454941063653, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001027826782042431}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1321786244987408, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| 
{{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015898806527527606}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2108343289151636, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024185861125649503}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1495463996881597, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001529629957138695}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.15492456336179825, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020566337458244716}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24059158197735586, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028186220199704517}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1735928623880009, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", 
"subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019465237397107696}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.443321935592914, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09064724887478164}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..86fccf93e76dcbc1e137b9ce6a6e4aadccbc5fc4 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2506949292837622, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035826466742239185}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", 
"rouge1_recall": 0.216927054352879, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028088091990487226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.19603976253059838, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002209711985991064}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.06671631551602682, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0021245172015467873}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.051740103428563375, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014534357317337603}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.047953521910444996, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", 
"rouge2_fmeasure_stderr": 0.0012655545908108951}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1934840203286638, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002982369736201223}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16375914032560498, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021690067639137493}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14805027301359455, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016833891759156644}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.23568777027923624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003415634236822358}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2032981534504797, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": 
"d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002632061036819137}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18360306023241374, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00205910275267234}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.897173783637095, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04723692099575378}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..312aebd8fb87aacb3e03698ea732bdcb0f7e47f1 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": 
"generate_text_restaurant", "bleu": 5.941956523442191, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09932749482493093}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.20220167360973929, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017775397370267494}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.40694948255704005, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030318532028052545}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.266035838888047, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00214687581319049}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.08918451858000426, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011232374812415247}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1824874010352202, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002231269996765666}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11793161527142047, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014395777814735315}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.171931143567588, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014094508987155406}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3506402050881267, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002593888393315589}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.22717154379396048, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017325449588314497}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.18007224082622914, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001637841819840828}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36377758074636973, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028984303974106587}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.23720221029041466, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002003449214467719}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..908054ddd9da4ae5a70f3ac36c13f737d8e85cba --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.380602370008575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", 
"dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.19219222099661637}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5762149768264377, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003318783916958475}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4407794090538949, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029897484855389944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4721348830907075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023404970653199955}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2814540689762945, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002795334538538015}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21174089039601776, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022062395085723743}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22711440839557615, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020751801779315127}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4229881150623638, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003072919322994061}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32033975746914833, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002489730198496103}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3439998053438798, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00212844149551342}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4731321806462157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032652927514093106}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36070812284253606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027712237046193665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3866905695770315, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023474299675248548}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..bae7ff3bbc8edb0d1be50ea0862d0ffe50e2cbcc --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.191488024972156, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.19907510301810782}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5888620057074112, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00325974855044316}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.46734675933757636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002910336590920325}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.49478002813152466, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022132976290390608}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.298835335925771, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028167958629137044}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2332339594931545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002268844314664733}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24713224212661672, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020909646942975984}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4380934657095154, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003041090518262408}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3447152118587733, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002445756611409155}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3659238384457185, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002069857446914006}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.491576051493737, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003239734182513254}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.38921339856167103, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027477384856747842}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.41241936907841864, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022987607835818604}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d63d06b1fd42047e78f704890a42fc207d274324 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.64881594516423, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14225876634497212}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5907860432410378, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031560435722029602}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47164290046583734, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028460616360397144}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5004124175592417, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022065167958013948}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.30074421250718314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027356725355736525}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23739401119844838, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022738788955147583}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.25184632683249925, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021066699664814875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.437299096878406, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002968957729484418}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3468480918537638, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024452067199333613}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3686141972958827, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021055632446747067}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4939511257717702, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003153232253904959}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39417799230568645, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027496846190725264}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4182292558816836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023341754403372627}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..523af87ac35457147f5a83748b2416707582a69d --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.098333020388077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12831977294846147}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5966648139686145, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032302255772308427}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47760538890316145, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00285398486806638}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5071734526172544, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002256209019372641}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3049813003705614, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028143522315018875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24128439152213985, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002326306182449381}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2561891586621636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002175088764672847}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4375644960495563, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029585544115121273}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3490377714500209, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024749540858779945}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.37081754277374707, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002131577935728707}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.49662519790850435, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003207650849575026}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3977409010762705, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027651459862259265}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4222811145975071, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002382321269391712}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b7a3c2afeb8917a23888df80e02100629bb602d1 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.062931767147242, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.19067140642933314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5946866907857069, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032041378906118583}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4773278231081852, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027831508718061987}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5077222285813221, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002220732488512632}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.30451374992065544, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002789941472506245}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2417166711851211, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022968048020895614}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2570060960713732, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021518885893666365}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.43676493018556145, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002927133353052165}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34988140572226323, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024419111341844576}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3721494155980024, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002117723784512971}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.49777714097705755, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031788848137924734}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39973890243703447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027139961037825227}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42510332300543213, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. 
||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023482381852689186}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3e13226886ed0841c727043d17dd077a6c3a8537 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14732873010394443, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018472239906953342}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.35199358110459894, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004413516152222082}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20505824244715506, "fixed_answer_choice_list": null, 
"dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024783005153629807}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0324785643615811, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010795578817257175}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08244261487005299, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002863077391938578}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04590441078806022, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015202206206850909}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.108970601383633, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001382629098764731}, {"task_name": "gem_xsum", "prompt_name": 
"article_DOC_summary", "rougeL_recall": 0.2622701817944651, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035205468161132866}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1519188383604905, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018845750655938495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1173139370778848, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001569538852204758}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2818166643830611, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038965162010598576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16348753229063173, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": 
"", "rougeLsum_fmeasure_stderr": 0.0021323303474861774}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.750432821724133, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11024260307164419}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d687cbaf4c23e169fbf3eac4797b0aa03f603a52 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.23169122870326006, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004045147587622825}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.26815002474583066, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": 
"a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004110152736623833}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22983801220388622, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0032940906774565366}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.052796359945369666, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023703879179179594}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06066441266683632, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0024082157247570543}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05179388258497403, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020972850091121355}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1746429223847538, 
"fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003336919221467921}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2011435130769754, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032461458681743278}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.17244857599829136, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00267315623596849}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1772831820859513, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003324161176359277}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20683242721981307, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034228474156704266}, 
{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1758880230368807, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0026930773402095492}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.4943571404092832, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12369471155469476}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a312de5557bbf3cfbddcad64e35dfb6abd483c55 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.25217889274484556, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: 
{{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004187176500529052}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2667996083056836, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003952166510919622}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.24350643855178628, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0034168567984665956}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.06179253514253428, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026427530004505444}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06403547304250448, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0024621761069962894}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05864225314595189, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": 
"", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002293228927176543}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.18918049038921544, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0034708834616706697}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20001592844363475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003205668683161223}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.18232363203561192, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0028221690513137707}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.19188184345223513, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034530710844608826}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 
0.20518196814507939, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0033724061824908134}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.18572746911328056, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002846842492367856}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.9857214106954544, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14101412936916624}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f4b14a0cbc3079b2d69e5d290397b741a239a571 --- /dev/null +++ 
b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2484813044251097, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0042984090370612816}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.25675482709920644, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00429153056298093}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.238220796075611, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003745482282361713}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.06066711842193548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025878516044052237}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06342202286918776, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": 
"a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002586925750413113}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.058505610925660055, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0023584061095609406}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1878574292139355, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003601580338442701}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19283239743534678, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034899752275218544}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.17904839989000923, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0030840608870087312}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.19005537260387176, 
"fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035974744150852533}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.1966886872714737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035964115374883606}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.18170572127239473, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003101828200101794}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.2870789581611426, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21202333940864973}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline 
at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..3142d737acd9767e9eeb4af76bd2488debf44a92 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.06527208935660792, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004136508171521384}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.05998571726736939, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003713797694626656}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.056660365933148535, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0033872772198712937}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01545632928618081, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: 
{{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0016742571770703835}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.014726543547135009, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014902502152271866}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.013504510872103278, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001329260201745657}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0505669228329614, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0033876169186837024}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04522270312870648, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029093653261490714}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.04292181483636768, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, 
"subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002659025122857177}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.051289550137691375, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034102478996916284}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04641007879693294, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002993715279238018}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.04378042063061544, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0026997367087303044}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.20657036807352894, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.057452674047792286}], "config": {"model": "hf-causal", "model_args": 
"pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.json b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c0fd0b089ad068e8e45a523d3365ff346e861932 --- /dev/null +++ b/evaluation/generation/agg.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0027295547123993985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009121185765318135}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0019729049386547235, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005615055607779773}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002178348093993909, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| 
{{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006423774239749017}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0005583570131732993, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003699378783076142}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00025688148329657765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00014579873768176573}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0003426428225561565, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00020535656561021637}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0022248632641988773, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007092471581067394}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0015861083611375401, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", 
"prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00043284232233835025}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0017770068245789574, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.000505751759280628}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0023748236425604474, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007550781242137756}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0017618177197440384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0004963241045032187}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0019231486237150143, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005504938348202478}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 
1.444458864274154e-40, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.5488576236449342e-34}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c6fdd006e0b620116a7f0fc9a908a9bcee17c8ad --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeede8a8eb388313f0ce068e198c5129c3722eef0c207cbe4a9aba6dcb6bf7b1 +size 4211918 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..42d23970ee08339019c30d1ba5f50adad252e68c --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd649f263e0eb797cde0735b9607cfd919db8c4c1e9c8bbe67ea1d45cf4067e0 +size 4766627 diff --git 
a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_2.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_3.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_4.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_5.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b3317ffbb5a6f3f7a72b9a59530e6b6c7d68a4b --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff65078b7aafc1e78235b2d1a0c1056e6575648c8fa068277c5eb620110bbcb5 +size 7662801 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 
0000000000000000000000000000000000000000..18c103b35082a750b125752e77921e9cae182eaa --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9fc033390efadb96f677cffa155a4e8eceb8483ee358a9b4e40651507708b53 +size 13013328 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_2.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_3.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_4.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_5.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9f36ed27a736ab07e0f3f2638550beb56cfa00bf --- /dev/null +++ 
b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f43abd5b7b62a2d30f00800086b7fbf4bc4bd348d470cb0036292ca9c1dcd9 +size 4442035 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6f0a9c23da20d7bd68179c3e977df17c786aacd5 --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ad044cd4ee988067c0fc632c906c640f10d69f465a679c2446a90393f8f7ed +size 5004165 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3b1860bfa2b09f8a0210d11e440df7a55e121f97 --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32692d733a0c6839c64367c1fc7abc12049c4bf3cdb3ba316ae7538903028a9 +size 6096820 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f8de374e828a2c1a53c7fa316735818edecb68dd --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:e8ec67c67379579999df2a0407490bd0a5cd90a0882959fa253596f64c1fedfc +size 7177851 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..48aa3b21890a2459bee0128128861963d34d041b --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577b2a15ed121110e6b03b0a3f70d3e1f5f71c907f676c4634525634c79d9ede +size 8257061 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..54cd0319eb1583bdb53c5ee6a1559ad10230c496 --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53551673ae0235240be1ececebf2b0c8c6923d2da3eade250e1e5c79351ef738 +size 9345047 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ab8aac8442734a562af78318646d2129b8cffd80 --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1462350d653e58054585e18f70b3e9533ac5d287bd34e6d54e2d501c6b6314 +size 2833595 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.jsonl 
b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c6d50f272a21f998082489448029274246229051 --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd120d63650da12ea034812ce0f09eea3ffd7ec227ee094b2d86afcc620ee960 +size 4947829 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4f320d71a31473e566e1f759bd8442fc0ddcee9d --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced14626cf706debd42acc11e81f4e0d01a9560fb221cf2d7fced9bfc35cbcbb +size 7201408 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..22a0d38c331b8e9284b69a9b621ca0765e902bae --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a11ed3fa28e18394fb53da16704f603fc1b017c4c75d0a452fccc2636bfd5d1 +size 9478985 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..819e8a1e8a1c7d977c1564fde528d423b0646899 --- /dev/null +++ 
b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5633247857fd203d0e8d00bb75b082e114f0e0a6402965a340384c9170bb1a73 +size 11632660 diff --git a/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.jsonl b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3098b30b9da42e9589e593b708d176c65717c901 --- /dev/null +++ b/evaluation/generation/examples.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03989bdc825c1fcc9871ac832f3e737efbc7f138f23c070f392448ecc64248bc +size 13897411 diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c33255025c0f35657ec72db17cff2b08b5f514a0 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.30792186288041745, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.022591197439731495 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07098986968617506, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0020679786797452465 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3069347608020833, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00517507368107689 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": 
"PALM_prompt", + "rouge1_fmeasure": 0.10294623137452774, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020587417894922925 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.031171214011889447, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009608900637588894 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14183320494534776, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0033211715439776072 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04712663066068758, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012276103918669153 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06796024562406605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0019370776267962208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.29664082837766304, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005024240535996322 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09881593036325725, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001917130031576468 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0670791406212816, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00196698409746432 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2878672957371347, + 
"dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004800974945636242 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09698777350644844, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019324455424936378 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9b326b0e6915eb2a86db65561c30e5dd882aeb03 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5029735260771602, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.037504230092449804 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.13619661582031448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0043020137724201464 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.316637398074897, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047970506632331504 + }, + { 
+ "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.15768658147508735, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003494665966696393 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.06820976880895747, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0029059822832858398 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15837063857057912, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0034375560556260923 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.07782418733894164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0023362205542013246 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.12413525469005826, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0038754321440188466 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2992719822505979, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004524889522002559 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.14491859595914175, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003065753619906709 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.12668637709059938, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003967270717894955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + 
"rougeLsum_recall": 0.3010027831236105, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004513515461941868 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.14722111353362036, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0031421471913191945 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9561c17922c60300163774f1c675c6676298ef47 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1677624908585186, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002227107904916062 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2596588931478101, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002997542713484213 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1877757783616715, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + 
"subset": null, + "rouge1_fmeasure_stderr": 0.002098472966964512 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03900987564301008, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009646264507463447 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06275053320845367, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016213745197323872 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04392454941063653, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001027826782042431 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1321786244987408, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015898806527527606 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2108343289151636, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0024185861125649503 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1495463996881597, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001529629957138695 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.15492456336179825, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020566337458244716 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24059158197735586, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + 
"rougeLsum_recall_stderr": 0.0028186220199704517 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1735928623880009, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019465237397107696 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.443321935592914, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09064724887478164 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e682628ba3ef3953aee118c5c217603bccb8f82d --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2506949292837622, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0035826466742239185 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.216927054352879, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028088091990487226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": 
"tldr_en", + "rouge1_fmeasure": 0.19603976253059838, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002209711985991064 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.06671631551602682, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0021245172015467873 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.051740103428563375, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014534357317337603 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.047953521910444996, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012655545908108951 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1934840203286638, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002982369736201223 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16375914032560498, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021690067639137493 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14805027301359455, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016833891759156644 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.23568777027923624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003415634236822358 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 
0.2032981534504797, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002632061036819137 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18360306023241374, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00205910275267234 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.897173783637095, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04723692099575378 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d3fd770a2e859f2472a120f87d37dfff14ccbd42 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.941956523442191, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09932749482493093 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.20220167360973929, + "dataset_path": "e2e_nlg_cleaned", + 
"dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0017775397370267494 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.40694948255704005, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030318532028052545 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.266035838888047, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00214687581319049 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.08918451858000426, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0011232374812415247 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1824874010352202, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002231269996765666 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11793161527142047, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014395777814735315 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.171931143567588, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0014094508987155406 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3506402050881267, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002593888393315589 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 
0.22717154379396048, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017325449588314497 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.18007224082622914, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.001637841819840828 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36377758074636973, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028984303974106587 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.23720221029041466, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002003449214467719 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fcd14ca1ee4b7a00105569474e83e8be2f0c475e --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + 
"bleu": 12.380602370008575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.19219222099661637 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5762149768264377, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003318783916958475 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4407794090538949, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029897484855389944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4721348830907075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023404970653199955 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2814540689762945, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002795334538538015 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21174089039601776, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022062395085723743 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22711440839557615, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020751801779315127 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4229881150623638, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003072919322994061 + }, + { + "task_name": "e2e_nlg_cleaned", + 
"prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32033975746914833, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002489730198496103 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3439998053438798, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.00212844149551342 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4731321806462157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032652927514093106 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36070812284253606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027712237046193665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3866905695770315, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023474299675248548 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 
0000000000000000000000000000000000000000..f71dfa32789c7baee650168da102d5a3ecc8e55a --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.191488024972156, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.19907510301810782 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5888620057074112, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00325974855044316 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.46734675933757636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002910336590920325 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.49478002813152466, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022132976290390608 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.298835335925771, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028167958629137044 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2332339594931545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002268844314664733 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24713224212661672, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 
0.0020909646942975984 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4380934657095154, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003041090518262408 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3447152118587733, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002445756611409155 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3659238384457185, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002069857446914006 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.491576051493737, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003239734182513254 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.38921339856167103, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027477384856747842 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.41241936907841864, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022987607835818604 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 
3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1b1be9f28ae703477c2400a0d81fb7d9f5dc4015 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.64881594516423, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14225876634497212 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5907860432410378, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031560435722029602 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47164290046583734, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028460616360397144 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5004124175592417, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022065167958013948 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.30074421250718314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027356725355736525 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23739401119844838, + "dataset_path": "e2e_nlg_cleaned", + 
"dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022738788955147583 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.25184632683249925, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021066699664814875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.437299096878406, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002968957729484418 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3468480918537638, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024452067199333613 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3686141972958827, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021055632446747067 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4939511257717702, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003153232253904959 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39417799230568645, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027496846190725264 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4182292558816836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023341754403372627 + } + ], + "config": { + "model": "hf-causal", + "model_args": 
"pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5d78f048107b9861c0328d465ce7bef9b4664d57 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.098333020388077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12831977294846147 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5966648139686145, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032302255772308427 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47760538890316145, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.00285398486806638 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5071734526172544, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002256209019372641 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + 
"rouge2_precision": 0.3049813003705614, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028143522315018875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24128439152213985, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002326306182449381 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2561891586621636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002175088764672847 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4375644960495563, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029585544115121273 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3490377714500209, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024749540858779945 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.37081754277374707, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002131577935728707 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.49662519790850435, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003207650849575026 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3977409010762705, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027651459862259265 + }, + { + 
"task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4222811145975071, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002382321269391712 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5c11d359e6810e92158147a1fbb2e5947a4fa973 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.062931767147242, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.19067140642933314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5946866907857069, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032041378906118583 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4773278231081852, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027831508718061987 + }, + { + "task_name": 
"e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5077222285813221, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002220732488512632 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.30451374992065544, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002789941472506245 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2417166711851211, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022968048020895614 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2570060960713732, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021518885893666365 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.43676493018556145, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002927133353052165 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34988140572226323, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024419111341844576 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3721494155980024, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002117723784512971 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.49777714097705755, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + 
"rougeLsum_precision_stderr": 0.0031788848137924734 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39973890243703447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027139961037825227 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42510332300543213, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023482381852689186 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..23c48872f2b0c2f86f4e77c7d20b0e11e5468001 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14732873010394443, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018472239906953342 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.35199358110459894, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004413516152222082 + }, + { + 
"task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20505824244715506, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024783005153629807 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0324785643615811, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010795578817257175 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08244261487005299, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002863077391938578 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04590441078806022, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015202206206850909 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.108970601383633, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001382629098764731 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2622701817944651, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035205468161132866 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1519188383604905, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018845750655938495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1173139370778848, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001569538852204758 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 
0.2818166643830611, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038965162010598576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16348753229063173, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021323303474861774 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.750432821724133, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11024260307164419 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..481e8e3570d1fa4909c17aab168aa43718c88981 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.23169122870326006, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004045147587622825 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.26815002474583066, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 
0.004110152736623833 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22983801220388622, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0032940906774565366 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.052796359945369666, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0023703879179179594 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06066441266683632, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0024082157247570543 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05179388258497403, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0020972850091121355 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1746429223847538, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003336919221467921 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2011435130769754, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032461458681743278 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.17244857599829136, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00267315623596849 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1772831820859513, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003324161176359277 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", 
+ "rougeLsum_recall": 0.20683242721981307, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034228474156704266 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1758880230368807, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0026930773402095492 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.4943571404092832, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.12369471155469476 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4357c19851c4bcc28335c68685cf3eb5adb07d9e --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.25217889274484556, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004187176500529052 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2667996083056836, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + 
"rouge1_recall_stderr": 0.003952166510919622 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.24350643855178628, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0034168567984665956 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.06179253514253428, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0026427530004505444 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06403547304250448, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0024621761069962894 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05864225314595189, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002293228927176543 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.18918049038921544, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0034708834616706697 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20001592844363475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003205668683161223 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.18232363203561192, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0028221690513137707 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.19188184345223513, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0034530710844608826 + }, + { + "task_name": "gem_xsum", + 
"prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20518196814507939, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0033724061824908134 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.18572746911328056, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002846842492367856 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.9857214106954544, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.14101412936916624 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3f440be323f466e76ee8a51c535ed733b0aaa3b3 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2484813044251097, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0042984090370612816 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.25675482709920644, + "dataset_path": "GEM/xsum", + "dataset_name": null, 
+ "subset": "", + "rouge1_recall_stderr": 0.00429153056298093 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.238220796075611, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003745482282361713 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.06066711842193548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0025878516044052237 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06342202286918776, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002586925750413113 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.058505610925660055, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0023584061095609406 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1878574292139355, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003601580338442701 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19283239743534678, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034899752275218544 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.17904839989000923, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0030840608870087312 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.19005537260387176, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0035974744150852533 + }, + { + "task_name": 
"gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.1966886872714737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035964115374883606 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.18170572127239473, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.003101828200101794 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.2870789581611426, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.21202333940864973 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6063992e075b54bc87aff3fe50023b7ed8aa8cd1 --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.06527208935660792, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004136508171521384 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.05998571726736939, + "dataset_path": "GEM/xsum", + 
"dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003713797694626656 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.056660365933148535, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0033872772198712937 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01545632928618081, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0016742571770703835 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.014726543547135009, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0014902502152271866 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.013504510872103278, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001329260201745657 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0505669228329614, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0033876169186837024 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04522270312870648, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029093653261490714 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.04292181483636768, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002659025122857177 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.051289550137691375, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0034102478996916284 + }, 
+ { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04641007879693294, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.002993715279238018 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.04378042063061544, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0026997367087303044 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.20657036807352894, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.057452674047792286 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.json b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..77243229133fa9a9f245b841e2f91c4804a59d0b --- /dev/null +++ b/evaluation/generation/slim.lm1-4b2-84b-oscarroots_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0027295547123993985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0009121185765318135 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0019729049386547235, + 
"dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005615055607779773 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002178348093993909, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0006423774239749017 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0005583570131732993, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0003699378783076142 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00025688148329657765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00014579873768176573 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0003426428225561565, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00020535656561021637 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0022248632641988773, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0007092471581067394 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0015861083611375401, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00043284232233835025 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0017770068245789574, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.000505751759280628 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0023748236425604474, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + 
"rougeLsum_precision_stderr": 0.0007550781242137756 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0017618177197440384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0004963241045032187 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0019231486237150143, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005504938348202478 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.444458864274154e-40, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.5488576236449342e-34 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscarroots/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_0.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_0.json new file mode 100644 index 0000000000000000000000000000000000000000..830a761289e55120095faf8564d9e7017595f933 --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_0.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.312, + "acc_stderr": 0.014658474370509008 + }, + "anli_r3": { + "acc": 0.31916666666666665, + "acc_stderr": 0.013462309712005129 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.24786324786324784 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + } + }, + "versions": 
{ + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_0_lm-eval_global_step80108_2023-02-25-11-18-33_0shots_backup.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_0_lm-eval_global_step80108_2023-02-25-11-18-33_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..830a761289e55120095faf8564d9e7017595f933 --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_0_lm-eval_global_step80108_2023-02-25-11-18-33_0shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.312, + "acc_stderr": 0.014658474370509008 + }, + "anli_r3": { + "acc": 0.31916666666666665, + "acc_stderr": 0.013462309712005129 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.24786324786324784 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_1.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b13ccb1aea6dddae708f5e84ea2e01ae547dcb10 --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_1.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821477 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.3494623655913978 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git 
a/evaluation/rankeval/lm1-4b2-84b-oscarroots_1_lm-eval_global_step80108_2023-02-25-11-18-33_1shots_backup.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_1_lm-eval_global_step80108_2023-02-25-11-18-33_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b13ccb1aea6dddae708f5e84ea2e01ae547dcb10 --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_1_lm-eval_global_step80108_2023-02-25-11-18-33_1shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821477 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.3494623655913978 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_2.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5a7588ca69dd82e0a89877c3478512949b858921 --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_2.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.347, + "acc_stderr": 0.015060472031706618 + }, + "anli_r2": { + "acc": 0.338, + "acc_stderr": 0.014965960710224484 + }, + "anli_r3": { + "acc": 0.3275, + "acc_stderr": 0.013553211167251944 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.31173780487804875 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_2_lm-eval_global_step80108_2023-02-25-11-18-33_2shots_backup.json 
b/evaluation/rankeval/lm1-4b2-84b-oscarroots_2_lm-eval_global_step80108_2023-02-25-11-18-33_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..5a7588ca69dd82e0a89877c3478512949b858921 --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_2_lm-eval_global_step80108_2023-02-25-11-18-33_2shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.347, + "acc_stderr": 0.015060472031706618 + }, + "anli_r2": { + "acc": 0.338, + "acc_stderr": 0.014965960710224484 + }, + "anli_r3": { + "acc": 0.3275, + "acc_stderr": 0.013553211167251944 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.31173780487804875 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_3.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b9afc717fed48de618ad5402c92bff08ff99981b --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_3.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620345 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767789 + }, + "cb": { + "acc": 0.5714285714285714, + "acc_stderr": 0.06672848092813058, + "f1": 0.4563331988705123 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_3_lm-eval_global_step80108_2023-02-25-11-18-33_3shots_backup.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_3_lm-eval_global_step80108_2023-02-25-11-18-33_3shots_backup.json new file 
mode 100644 index 0000000000000000000000000000000000000000..b9afc717fed48de618ad5402c92bff08ff99981b --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_3_lm-eval_global_step80108_2023-02-25-11-18-33_3shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620345 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767789 + }, + "cb": { + "acc": 0.5714285714285714, + "acc_stderr": 0.06672848092813058, + "f1": 0.4563331988705123 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_4.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_4.json new file mode 100644 index 0000000000000000000000000000000000000000..48019e64a84bd0b92d5ea63d50eaa0d3b9bb8d2c --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_4.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r2": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r3": { + "acc": 0.33166666666666667, + "acc_stderr": 0.01359683672948516 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.35767195767195764 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_4_lm-eval_global_step80108_2023-02-25-11-16-30_4shots_backup.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_4_lm-eval_global_step80108_2023-02-25-11-16-30_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..48019e64a84bd0b92d5ea63d50eaa0d3b9bb8d2c --- 
/dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_4_lm-eval_global_step80108_2023-02-25-11-16-30_4shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r2": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r3": { + "acc": 0.33166666666666667, + "acc_stderr": 0.01359683672948516 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.35767195767195764 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_5.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ff22674b89978adca931bb302dcfe916fd1d3c21 --- /dev/null +++ b/evaluation/rankeval/lm1-4b2-84b-oscarroots_5.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.361, + "acc_stderr": 0.015195720118175113 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541038 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932879 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.35469755469755465 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval/lm1-4b2-84b-oscarroots_5_lm-eval_global_step80108_2023-02-25-11-18-33_5shots_backup.json b/evaluation/rankeval/lm1-4b2-84b-oscarroots_5_lm-eval_global_step80108_2023-02-25-11-18-33_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..ff22674b89978adca931bb302dcfe916fd1d3c21 --- /dev/null +++ 
b/evaluation/rankeval/lm1-4b2-84b-oscarroots_5_lm-eval_global_step80108_2023-02-25-11-18-33_5shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.361, + "acc_stderr": 0.015195720118175113 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541038 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932879 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.35469755469755465 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39394988c11c42a4cb63f5c11e77066b815f64d3 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26bfc9926d91e8c400c21c21d9b57e44061339f46664b77260c962219959907 +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..082f19274661e51c8f4271d59f7e370442fc5a33 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1fd01cbd453cfb5b45027d16897a59e7ba434b93fa0cf82c5fd9b6f3d29f78f +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffcacbda16b8cf6c9f986db149197c3dae8095a2 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dddf9491ee6c21136ba290df83f83a5fb04eac472cb8a1174a6b3e80cc6b3e1 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d39d353cda77dfdf6b7b15dd71685c58247a448 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a616fef52b85daad34877a64373e549de3220818849dc364de4170961433e005 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe0ab27aec5866422427cba366daeb018d4b515 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b03fd6799c42a6400721675c3176a7b6a34608ca3ce64895f13b3a7fffc70e +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c05f725028ee47c297c8f873abf52b01d57f603d --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de65c3ff12ad0128fe06322f8943a30e093e5dbdbd2e57755da2566cc8fba414 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c2be6aa59f80d3092a1fb8ca2c91dcc5963167a --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01065363d19113b51b01bc2596e92c61de858b2bf24daaabac31c7d45388c061 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58eec409f6ea8430aa37380053e6353e0ee1b4a7 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9fb440c1b46ccec7b93616566539ca18c11f40931b4af1c81599d2a596e881b +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb98cc7f74daebfcc078ee0754ff8395731a7e48 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb185ef6cb3c6fb54b7ae3598142be92a10ca279446dca726ca51f8b0784e5d7 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6c1930ac1596c1740e0470d8f2f3735d7b6464 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6319f890c9d69329d891bd0b211bc9716cc460633fdd6aee33ba1da2c5062101 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab2b24095bb698b2fce787a431e326c0184fcb82 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e6289bebc165f0a4a4072cfb4dea6744683f0be9c15d8fb523adf6296b1c85 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a74bcd0988d741b0209c3ad5edf2e98167577bf5 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d505d3461c336067002578c3a90a75a9c1951fadfa27c09a1c169490f03ea6a6 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c5faeeedf7962ee86d59bf41a70b98f67d0efa --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01810c481cf58fe6c167ebe505205c92fc6cb1cd03d90f4b13ce8e11fa5773e9 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a935496b56e0022159ba04bde13896d476e610a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa731dc614d5687df0f289925d0a479da9c60f2115ca8ada6ceb5dd9ce1173cf +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87af5f0e679d877524d3d6bf21a15dac05794ea9 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbd1e567ec835ecdd27d04b2dbd3bc73f6cc62e8e68f50c4bd92486c2ff0c289 +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..744412f93ed8e7dadb833cc87f7a44ad62001a08 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00885d74e3bee9e5490f76aaa2c005f436065091e4d2c680aad5c1c067debe47 +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3822d89b835757981661174f910c7df5b299a1cb --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d77ef6c2f2ac6ce7e4d08691925950a4095040b50f25eec2bf11c9bb9fc888e +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..184d7a92eaca132458f4ffb98d7a77ff8f2342c0 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a455bcca6bea04a447caef0177a13ae8c6f07f858615de3d2b1edd683dcb35e +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..029fe2e86c106fbea248c2af827332705aa19c4a --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23b44e85e085741ad34daefe354d22a4475f0b8488e9479e1a502c523f613a90 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ee76fc93cdabbc74d50beddea096f43fd2b3329 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799bed90f36e87c2c759b4c953d6cc3c2702c97fa5d025728969fc09ac336328 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62efd6a97cff48f62118d636de2596d87a9c9847 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47e15a48f3f7801f791327e00cf4dc130fb207a09e4849794f9de4171a7b137 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bae7730c15f9f5f0d6bbdbdef337f64e13990a37 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4fd8e4a32c9ab392a384ec7a48b3c134a3890d356833f2b0b05dde572a0c3d +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7fb0e0f516f8504afc53dd17e90f3c27319f8d0 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d97842597d1a7b1ad82ddc8dc6375651afc062448524827149af618954fe0f +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f75b50c725b41001668a8fcb2acf8092fd128943 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef05939def56fda81ec367f52a7bfafdbd0c5b4247a5a4442638a4f7e8dc11e +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6d0a84510ad97e665c0e3381aa565823bdbd950 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a932e39ef79d8b63f3c6e72d736f8ffc76ee317839851c1236a2efa9e24e8d8f +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1af190f3ce13ea441d354ec10e9a298f9bf9f10c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8201d77beb83e782a9659b1df8439bea4bbccab079a44af2b3d9f12f62edf61f +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2f8b3c9c164f547712a28cf3882ba7923364617 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da9382fea4d6b13370df36c17582392e6bbbfe1268bd6e31eb8a6b43893f44f9 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc785300819ce78095faddc97bb7bb88e22b30cc --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a947372a1103a9dd78a4b5b3d9ade005caf7e92fe1a0504099d28f09f6d8f360 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba91de6b40719ebc4a069189a2e0350836d91ea --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c889935ff97724e70139ef78bfd94c0aceb000d89ed7000e6690dab88bcfc6fb +size 199058605 diff --git a/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f8153e05208710dece8f16f97e12fafabcbd24c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9daa3bde5e01edf386f48cc815a9b719875dc77c569f84d6bfdbc677cd18920b +size 199058605 diff --git a/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6483d257c2776e419f62e84c9c3cbd288b356d0 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c2e7908a27121b5d16e1a9f29ca61815eb31e07ece616b73d26840a239355e1 +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e6c895a9c09a85bc517a6cb26aee39f5fab7c9 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3e5831dafe3406ee267b503ae069b669fc90c317296b56e62f3678d36f0646e +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..166d98861c8b22d24157e8b155bef996f248403e --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:859e511fb0dc742ee37136544a93948a3265586d9915aadf4dc3e8338c3bdd28 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38ae6302e9e4ad910ea0480e3ec10aa3cfda320a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a4fee50117f1c5e6c9a1c5ea98a039bc9d063a84ea5322baa527deb36db7497 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10527745eb4b68b0d38a3c3a7275bb47bdb8dafc --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de4eb13122194fc288c1d69a9bb3e42707d5964f7d82ce6da13f845407c7744c +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e7299fe4c92f72284b8f5f1d97b9694c88eb7ec --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e104c042a09c10ca2032e23a8841154931b7f785677331f05ae865a598f0df +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29bdf98b6dfd08a6a8f2443b4f6ad6cfcf6ba53b --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49a7f2dc24f93d2b60dbccb5c512d84452f92ef82ea693cb77947cbb06582de3 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..691094b1c7a925de0164990e000ad636cc7dbbfa --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704de28e287a7eb68b868c9b84a855bdd0ba26c69dc52e62ab09da3d0502496f +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c9fe826697717112ede202ab0bd7e8cadb88955 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b14e7a7e3732fad5857c11a7b23ae64c1b87a5a10bea361ead2fb59f5dfadb +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed222c305fe4f15f4df16ae037d3791c3d3d7ba2 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92863eb211ff287474d04d058b017303ab8aee088318ae5664f18ab3ad2965e2 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1e415b91c9acf63c4b46528a975bd808d5d275c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e17cc47df8db2d2a29af2066c218d7b835416af7540636d7706001603e47de6 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db073f6bbe5e8a3b356424ba36790ab898492159 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:305ef8af60823f42a06a18b4a0d29977bca36eaa21669059788070b602d014a5 +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2b3964a882f09da267e38dc709871157556465 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855fce980673cb1677ff81ce4e030825ad33ec9a48af3c5bb6c55210756fc394 +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..523cf3432cc9a1d4d33c8aaa29cb7278d588fd7a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d01d6923a71097baaed6d348c5ffed9022ef38ff37d30f3585b0eadacd7b352 +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8854ed114ce825552faf6bb764cb153fe3e13e69 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f8560606e19e0779aee0c179c8f426b8b90862a44fa5a0d4488cde904553fed +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec1959cc7390a6c21ae0141901bdd2f103dc50f --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0967e10a6987fcf4b0fc1638caff0278fcadf5b6aa63cff1d6b315fcbc00e10b +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b9040a86d170deca45ea0868c22a9889d5e698 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d60adc5adcbe6819d70b58fa38aae0024308b29cd48fa7468006453c9acab5b +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0436530304f5c5d31162310ae489164c69494db9 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89cf6b6954427f9ee76aed7511e176d96d15ec0a79b900099104995b69c3816 +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71ca71dc7a0f1f17f9b957c3677afe6023494bb3 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad90fd795209ca7bc570f009c6b442782f31e7d859bf601a8b77be721b958cf +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61e46927709fb907a14d1e43c265a38c7376a410 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f687329391a4824d90b3fcbb4803879fe2d58a8347fe0dd5a4f9445c027f9b +size 199058797 diff --git a/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea96609bbbc6303bb345a6991f9538e08e502c48 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cf056f4d9a2e17c7117647674aade184f994d96ac802cca9a3a4f69d0c5a2f +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b50f8fd6596057dbbc87584b8d7ff01fc4963b69 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb5aa0bc52a6f30188e490b278fadac07ce76655ffd08a024f43d1ffa6892629 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdd1b28dcca77a3b6eaf8042fa6047b6e2cd2cca --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7db835b91dd02821869a9b31b15d7e66d4c02dfd493612d317b643fcad502e8 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b1e8eb6e161bbebe89ef443b68a23c4099660fc --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0a784c344c99abb1498d84b0c042716e8139ff95a339e851da1b55d708f687 +size 199058733 diff --git a/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..956dca2e5370b4ec2c664ef6b53ae817c6834efa --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4923171ae700c13c98ab72399a45ea94563e525ee3ae85ab0fcef56f980aa585 +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb71b8d8cc84ff3492faece180c09c5451d91605 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:becd1d6ddf7a484c6ecfc43f8db45f2d1b2f64ec390dba24f80a74130f40c1ae +size 199058669 diff --git a/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5266a5dad15dbf10638cf445853a7796f8d41068 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d08277358c76538ecac9826eb3409c1fb9f977d89ec116441657fe1cee62490 +size 199058925 diff --git a/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bdbb2eb645a76609a56fee2afc8325985c71d01 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9075199da24c094fbacab20f54cd80960740857ad65fd7ed9703694cb9cd1422 +size 199058925 diff --git a/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12f8575661b151931410d7277bcd35bac920c7a0 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce86a73bf5d4c139e8d7a249a6c4aa518857603a36c3e7f674da2ebf008e7b5c +size 199058605 diff --git a/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c8386629e15b9318ddd58cb57feac20a8de281 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f132a6c9a2537fea46ef0e6c2dc2fe6a8043fe29bafccabc24c3accc4e6d69e +size 199058605 diff --git a/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3e52353bf090d8a1ce332aa28aa144fc51e9214 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83339ea736031935f65d1577f0eb8ea658b16b0bee3a27411601ccbe47f31f6c +size 199058605 diff --git a/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59f6480e2f76dbee5d02732e71b785d97d21a755 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f539e496904e9340a69428e0da9611ef5f5f7c56a00ddca087263844a985fb5 +size 199058605 diff --git a/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..886193920724c73e577efc1dc01e114674cf9b9f --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a379ce2a88fcba46e635880a31b1fe42c1beebc3f8da7b985c97986d28c7ade2 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8eaf230c8ca19dfa68c39fc35b4a813e73d6df0 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d810af6ea095e04b55411c695e3a6573dfbad205e24887b4f2e204e161793a2 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c43da79c14fe996d036af2b514ce0b09e5737c3a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3a8ae8f361cc1e152d3f078f613e1f294773eab93362fb566dcc1cbc46b728 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ddb7aec9f88d5606fd0117c114f75ce580fa1d --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:615ded61e3d19dc0d17ab6a085480dddbe0cffa931333dd57e6816f04b99e090 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b5700f6351000cac0e72ecc4699bbd06f83abdf --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c8959a5a9070ef5d47523d16fa4378366824dad3712c4c98fe359ad7ae4985 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..947f29d02bda4e508aff7cf652805d0b2498567a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a1008f57221a97a80b6129dd66bd02849a0bf3501dabbae1c71f22e7a9070c +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ba57219907de60a13f6ac61c8b06fedc13d1e43 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d133c3e0d43d173f5bba637dd14e9a7c5a6e0c477278ea2521b5bf444f3bac8d +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e52aae202beb7ed5eb9638bd9d72c6aeba762e0d --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55deca1c80a597b032e7a2ba9525717194b468775bf0ae9bea854cebe5b40a88 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8b49b63a3389c39356f38652e30e58e958aee9e --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f740f7d22f7e7925a0366254402a8d9d86e943e8202847b6b018ace6e973544d +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..692299059a902c7c6f6321b9abc110aeba50cb9c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf8fc3b2c102433da15de8ac81a4981dd6de1082cb4466086cf3ac29e2888b04 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98f7ea40fab664ccbab11bb0eee43f527fc97e9c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffdcdb0d9825be92527f8949eea57c618f1f9fb371251f0b70aa66a05b7a8630 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb73239ced3d59945769e111a1cfcba9bffb61b2 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12c567594244d3f33034658e69d105288f1bf34e654a44505e0ac96176d18c4 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1e6dd55059be58056cf7299ea279efca14696a9 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ad37aa3bc4c54f41e3a4467b05e2c87f27348b57d1e6f0e1accb0a87ec35b5 +size 199058978 diff --git a/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb76983ea2bcd88234b0abcd812387b4cb204336 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e1ca54aff40693ed08501e22ce996429cc118ac4e1a32d545dfcc957c0b282 +size 199058978 diff --git a/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49c9d312d1458aa790344c23727316556df76c99 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ae623854ca756ae9cf1fbb4a369cafc693655069eb385cc93bf91cc99838011 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f61ba34ef238cbc9a887e7af2c2e011b458c782 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2b740a32692b69637790cec20d6100d0f65f51710c5bbe5cc1e73702972e89 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..514498d6aa7db0bc4970f9d49b969fb3bc40baf0 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5031ae145eb46c044f4e0b988cff6a9b403d69679a242bcc32ecc549a44fa004 +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43b7865b6f87268ccd20c6863922c194a621586a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:489fbb193e820a43ccbab3d2064e7a2951c78b8adc9eb4501bdef194473eadfd +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf56e2fd465359a2bfe1fa832391ce36e1cea20 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17814680a68f95fafbdf9e9004efac3796a9a7e4e532003b1daec951132a5021 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c443d5ba6f69ffe3760808eaeed6bedc44faa65 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f731d784b200737b59b5059e1924d35f08ac49f1cf43636f191d56e811b97cdc +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13af4491e56c16b94e09fb5e69df3393f7fd7bc5 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29651669eabc33d3aa2a54c7c15c42104d3efeda670e792f5b57efdbe90f6be0 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a9a77ecd8829b4826e0e6605ed360b67331828d --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319c8b635407460cebe836c6fff1fc66a2fd53c589abb1be646ea6a3cd104c17 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f6f7553aa7b588e0d27b221d18bcaaaccb10830 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167787c9932759eeb0513350682d854b43459fa70a6112ca68342f7203a02530 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e55bd9e770a9607a8c3164ab59732bc01f182a8 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39d29e38f0f3f2c0e154f793059cf99c3fc3ce1e073eae4dcf66d816d57ce56 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..360855f5a20463f002c0d8659238255870d2f1c0 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ac6731dd21b8e4c377f50c0d5d6d55e673aa578e361423e675467a3e854965 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf90d564ee413678203c4c59bf833d6245a450f7 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54da83020ce7265ca16706139152aea112968640e4a2b403c994d631deb89444 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b06006384c695dd3682caded8b6f086e34cf09ad --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ffbfb0d9dc005ec34e5ee30223086e2b07fc5b8c58dd6509b73b922dfbc81dc +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b214c0ef1b14b7cd3ae21e060e7e581f73c3d710 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a3d36b82eb0543aba82ae245556bba3e48ec868532e7453a5630b561dc56a41 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbcc4b47a452381ad005597b79d40352581129c4 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a67fcf0ded1944aabbcfb9e2b833c8c669e34c8de02ad9dc9d696cd3d67fc2a3 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e43174d0c705d8122247940e9b4f9317e36dd158 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a7fc84d13e4bd3e29cc4f7f19b89b649e31e85452830891979556bdd150077 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b36d725a9f41bf81d1d4e6a5d50ac691a47ffa --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42284e652ab1e374982a29f761c4236ad88e0b1292e38d0bc0ffca490369aa7 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c310d4355f34687a51dba5f6588f55713a27b571 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a39e0a3d116090af60a2862e1e029f267bc955066403f867cd8b60a3b2fd0ca +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc704b26930ad21cba683cea346fc53800de31a --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efab838bdce4b22b898660de8eef3190055d9a0768740091775062e61c65ca23 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a825f6e0bf6c8faa6a002773a29dc60acee6c252 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a62e9edabcf20e4113721943d91a4ba8f18549f9842d660c96ebcebe2b798e +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afbc8a502ed2d73be1578e37dcfc13e23f4363f7 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e8d8c84e46d31ea956989bbe18a5c3837c93d2e3617f25287be755c886ea683 +size 199058594 diff --git a/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc70f8d43321deec60461ad1c64f769c760171ef --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61cfb4f0814a21759ff33a4518c647fc1a19ae7c7dc94c348a80e4ba9a970ac +size 199058594 diff --git a/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13272ba6e80febd8ba87369d13c374dc297e2c26 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f7eda79ef2aa439c2ed9dd9ef32ed4c38dc8ff877987305e53d208539b72dcf +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6de19d7526f063c2d7dc66304540ddb94843091 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:494767c586f707ee9d3e13436d854a0694e9ccb3055c3cef6ee885551aaff14d +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43de16145b3c3db463111e576de807aa66f738ed --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9c1f3e8973dfd2c0026fcfbf59cae36b0db2145699641163a9f6948856be70e +size 199058711 diff --git a/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1257228685ac3480b24feaec9442ff355485cdad --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa341c0b364f9497a16c2cdf618dcbd5d966d37753639de07d3915b484ee52d3 +size 199058711 diff --git a/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c4bcf4cacaf24f2fa5bb7c9b0012ecc40225f2d --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32329ebabe945bbd5cd1e3a35617c3e23154dd2d6eb42200edbe30a330cd1fa +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7af2ec6b8cd9500821ea53928fcb4b4529e07d20 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db91a3178dd8eb3ec2e36b831320e5207c3ec4d66860e4f0f55eea68265a127 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0894b52614dd8f7b61fec40d3504b58f645ec2ee --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e142b94eed6818b5cc0f5fff358077e0cf05c95e5bda9906e7276af0bfd9599 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cec418b3b4d48dd09487d54a2279e348bf0f5a3c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14544e356abe20953422805bdddf748a8994a8700fa64dc4fa268c889baa2d2a +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b93bb910d9a63fcf91778c8eab0a9ac2412b2660 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7dc3981aaa5ccbffae1b95e37584399d177deb1132b374460a9496b59ed47f2 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad8f99ac6d49239cf992f34482f9680efbe35ed1 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a96f22fcdc9c4b4003a7ae0494d44eaa3f7bbae4b81902922cba44947bdb5d +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df02fe55fabec62a0065f273f623a4280145ba04 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd9c15fa9a4fc064fd5b7564256f0755fc71f792f055ddd3d28090a2e06808d +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3f6c28dce47eed7efdc725c5f7718967a0cd37e --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f438170f0c72cd5d2547623ef157506879de31f3ef07bfec894a6928029497f3 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ff7223290d4b9a0fbc42e122f8265edaa21f458 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c16e1a83f62d5bf7b3f6322eddd1a5da60a6ef10060b4fd0f3a913068cd5e498 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd86c9385ffddcc987fceb835e6ab3a6c174e9a9 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a77b85952333b758de82574c8c3fd8dca7fe6f681361327571c312617e07e8c +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2acc15c6cab1af02594d8ef25e6e1b8a66706f0 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408f176e4f4792b6e4c5a14c8b294e772464e07759e99b56ded083dae75650cc +size 199058594 diff --git a/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9e8f4c0424bf81bc8f50d74deb32a98d1b4ba25 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d3aa894652ff8dc55fd93863a460bfb52d6ec7f07c7e3a8c2e3b1bb1e3ac5af +size 199058594 diff --git a/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b24fd7fb302753649461fd37ca3175de2571d8f --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:524d3023bd585e95a2887076a31962884125235f43cfba76d0b9ecda620c2b51 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..482a054624c9077d0da24500adffca277e5f8311 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1fa1521aab6b5362d58e640eff5b061afebdfbb305000bd225bd6beb7f649af +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ca446c35dde9e7acfca1b1805ea2823944f858a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20fc75e51d4182ae9d44b3c13ea224cf6edd8bf6c4d45647c54cb4d21da5af2 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e0d0bc1bf04fcc616cdea02b5586b3d7d401219 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6167acc6fee7f195a31292627698ceaf280e4704429c6674174f7cdd6065e49a +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..447eea2c2b2eb3b7dd503d63b2cfd684ebca5526 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86f414812d285d2e2d8f9e1a21bab26669eeb73bcdeb76397c8459cc8de57f95 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c80032e6c29afd550b6f6932600177da96e47329 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ca5aa104b5e17de79a1bc06fc011b351cca578171c5352a0dbac1ad9f8ecf9 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0e0099b4422ed11f91d9e220d21136d86a9965 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f321c801f905c8e577c832c1913eec1d542239c36af7478b0162dcab688de893 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fa97fd9c66b367d423b21f19b58b30a29e67d97 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c67ba10dde3971ebe484318592303c58b4999944c96091cc514f4477e705d53 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba343d2df25046d0f1d5fa087f4e4285458b4522 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b929eb2198356a8ea9b5854e2daaff23c4fe490241cbcc80b6a27b05f04cd5d +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..157ab38ec5d6bae7fb39b0b7fa62ebbbccdd9bfd --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b772b734e422ba1886991c60043a45965b3e73b061f63dc790c5b25c145ede15 +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..816bb5b795fa0e3694e553dda9a39f3d3b1e8468 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f50dba4dca728b71583176a8858c9393fbbb92e776a257bd9233b1d421dcfa +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43b38b2798471fa973ceec89810dc20cd57a33e1 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2985feaa24b0215d52282c3f7ca102b8c016269f935321896fdd5459912cfd7 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e067fa318da0d96bac35d4b2506193545f0333d1 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:023a96b96d721a10b014c19c6623b5f0f81b2bad5bda218d5224f37f024e414b +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eda3465f8cf573002fee2933f9402ef3db48860 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57fae7b6a2ea6a57b1135c5ca45f5d8458b5907f7631051120e375076d732c7e +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97a8235e18a561630b20bb711b440070833503fe --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265da56c8d7f856bb028b0ff27996fb3f078c3b4c4306efe37489836cb312655 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aea07d788f25b47053a2f91d0f497d32126690a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9778cffeec8d45215a44b716dea68d0341484628b609222f152fbab05d2f3a7f +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73837205f832f0e3844b00eee87f75d08fdd17d5 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b552e9bea8ee52ada219544dd1032d6669b2b11b89413f52517774a1ec849b +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0160982d89c4f5889245cf638139d91bddf60056 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665e8bd27be8d7374e493a200e36b9e48a9d7124be0c2c5d96909b21a925fbfb +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a00b825f97dec5d4614cb64c9350389eb55da2 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f55d528f29ecaa5a06520d00f4a68da1938b48418fd7ec6db493d4cfdc5b951 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62f470551174a9da63a3d34c859684572d26a54c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56a39c2f2b963a7d89af947c7f237050398917f43af75beef961142be60c8b1f +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f715e6b6a481442d64f4f4606f4cb15af583c4b --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058c9546752f038827f55b3ce69bf78f231b96b36989992b73de057424a85e0a +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a62af29d66b8514dba01bae529fd27d0fa856835 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c82283af071c895648d2c3de9824622e46a1cd637aa956659170d2c579f3e8 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..386e59914c88ce69a1a8075236f878c9fb589267 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7babac3df2375d29c2e772694339fbc5cfd72baf97e6480e70e6267fa906e3cc +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28bead9a2c81ea7800b4ae342b9be0446de0f5a3 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a1dd2cf9089c048552ea859492a49fe5ea8f24dcd513b26f5c2de7cd633b2b5 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b8c2c5e321f18f1cf6ca59c1c50a9fbbe7c6265 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78623661b61585657e0513debea1195b03cb7abc7eeda2b103db4d857467bc5 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ea27839bf482bcc1e3f5825973555e66596112 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5059df86a1c29213b4fd44fb40c417ce60d7668a7a99cefe58d646fae673ead +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3262a2e94e68e273673bc60764f00ccd675a32 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a87052aae05b4c58d1344564388c534e62a7bd29843b39c5ff8518a4e50ef3 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..545e859abcd9a8c94ccf91b36096f9e2dffacf11 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49030cd896428eac05454f13aefd2776c2973b19037e6dc90bb1639cab074141 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51dde3f436df1cdcf877b2587a35459d29ade3d0 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e13c50932c0544f89501c16fe99cdc560182e48a0537ceefbd423416d1945e9 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be87ff20c882efe42ac17f45158ebffdca193954 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08be9e3bb161f49e83b6276f67fb2666dc2237605a9973128291c0a900203822 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15e00bb00120e32f791fd262941f3b638cef3bd2 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea3c575fcd2b0e725a3374d8e8057a1241e0ef439ee9cc29d99607df64eff7c +size 199058775 diff --git a/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17362df9d3d7ac71851dad79bd1a0cc465be823c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad46ce7ff9241c4b207a22f6c1c5425d096cb6e88ad0e87602e00c90fd206c1 +size 199058775 diff --git a/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd3a1024668472e083a3da7b5917f6ed6fb8ba95 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f899f54b12e840c21a74fc1f1edebb7a8d6aba6ecb0f15f5e53bec3868a15dc +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc162303a166e02134df4c72ea867f3b13759e7c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b135da6cbac2a34c66c11970c01c2e9e79cc08d789a985718ccb14ee9cd825f6 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86497f0b675a6eb5be1a38639460bc296dd38a9f --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e1e259a5fa907c71af166867352557fda85736b914acf0ea8afd6ed1574f16 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24c82906dd316e0064a37f8d6bf1f0699b75682f --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6029ad1012213c72cc34cbb26269d6ea2b9ad6c2cfc898c23be9221fe1cbf9d0 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fa81ff3dfc5cfd9e3f9566b90cb228255be25b7 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a31c21b341554e57dcac42cfb80788744839e49971777ac1e0fb24370979598 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d11e50a3ff6ea68978e1dbaaaef94a2ccbcdd0b --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b6acfa131b0fdc856bcdf41f919ea6c54aaa175d926c2e6b96ab3dd45a79f05 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a6acd985542e356334ff30a6f8ace973bcbc60f --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b2463fd19d35a85d9b0ce4a265d940bf37e93c5ed38f97e4ce40090a1089cb4 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81e806289cca6695cc522b848839b6f0690d4586 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce84ace8f67717b6d6dab5ca5736cd41c5f5a274168974a9a4dc3ceeddf3c3d0 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..161fd1bc12da67b6992ff64f9722e167df0274d0 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c459be8ebdb74130d6857b955f02dd3cc5a3df4252b91b399bd11d826f7af068 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73713ef43344d55396f8c50479b801644e7f9238 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d5c837735e357762a3f01f19b57a20203407e1ff05640c9f367b0cc43cee23f +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..294276ebf850bb0ab310e2c9bfb32f2b3e1892bb --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f623e2dc7fef8060fcac43f82cac131327fec8d5bbc10fedcee20f352566e0 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f10d4ca47e07de9d5038c5a38bb7ba0479c52d58 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73608e4b97a9e98a2c97c24d75a4219322edcf0b35f36a95c062db9ade952592 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d111f407013fb2e11d0ce17ed118563fe8901e8 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b4e54438836975b810327890c655fd11e80f674c9ba9b06080c414305b497d5 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00aa2ebc8a15d9e611444475acdf717e9e35541d --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed22f5047dd4412be61d1a3ab4f0c8601203f0171b1a8cc16b4208d2f3941f88 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d91fb0e6d7c90727a58f0bc0d26207bec4709a7 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994a9ecb46f50fbf12f6d5ca17bcfd628aa389d5691da2b694ada5bde3562686 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d61eed18ec09468350ad64ab704a5e2c3d6b829c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e9676eac08fe6b28e09bd20d3ee4314332cd2925b7847b468e6289fb76a67b +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..551dbc5a817f6e7167fdd2c1a45bf807e55a08d2 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c9775c0431086681570670ed8557b58e2714b38e1cbdc0a2456e805433335a +size 199058914 diff --git a/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac971aee9c72713812c257f351db2cdf12fb1745 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:011be631a5d3b6e8209335912655709c08392e1939900963fb939010fecc1e15 +size 199058914 diff --git a/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ef5ca7be99bac6096161306c154a787006c6331 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15de419aca58434efc2196768c3a1fba772313199d750ad4a69323f38715ba51 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c02db9f7a0e8113387c028a72f03873ee02d785c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea9139b941d8cf69a8d086685afc5f89a54123c94c9b9e3d845fc70fa09b2a3 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1275ba3c78239730e6feb1752c86df9dcd7808 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bf0e04647de05404259320048aa3c4063ae33e57c6ec136d02dffee28a4836c +size 199058711 diff --git a/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ba38b01bfdb44ba45726e29fbf64b12e8663c7b --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4255b7bde69bd8844f99a3b663e182b3fde047eee2c67289aac5914f386e2163 +size 199058711 diff --git a/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6d224e8ef783ba17849afa80a3a9cfec960cab7 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738b83c8ec90e52d7e6a36e782bb0b070938589177e8a6258869b21f49b34b20 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8995f8bae94349cf2a1e59cb40ac76ec37c1e81 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b234c2852f8b9f941949663ab67e2c2fa73125c4ce69ad49704b5deac08473b5 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e59f3c890afbe35f36e36fea8930c02c633e0655 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76897dd5f5cf6f4c8f6aab2b9b87852fa77ae14eae691b06f43b346ddbda696c +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d356072a8e386038fe9d92e1d7d9439dc4b5ec80 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acdf0bf222845b94931aedfb19edaca95612c3eb8e8226268efd1e9e67aadfd3 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..480c7241941e99a0883cbb17934a79845bae0ab7 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56ae8dd42544b561f0caa84c9c8927c276002bbf70d3187b33461a569d7a7af +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f00dd1cf28934be9d9285bae9d7c71afdc43aec4 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb42c31e3b96a753eba0d7dfae6c0cb0337d581d932276c0d4174889d85da31 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca526508d7858947cf8fbf3d98c5b270694cd704 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3fcfcbeb7e2c4cb54deb166a2959540d3072e40ed189f0c291300d520927e01 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d67a122c59c664bf88f210cb8e3f4f3f79bff7f8 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c893b76285b384a54b14a195124210f952c6aa07eef79517467a97cb2026240c +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01cf1eee1d2f2090a5b2ea1c16d5d6cc6e292963 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b9fd6ea8db3dcc3b84bcc6bdf478569d59cdb73c2c30ba4af731c3f8ccd0078 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68f1a0e7ed1f96ea15f1bc6615765a13b3ff01da --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf3bf1dd2cd977f967cf5035a9f254749bb6e3aab63cf22e1f8a8d97efae404 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..748938130c2012f558d9ae143556898a16d87187 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f3cad4624f9c5c1d654096a1c46ddf1e7ab49219875ef459a010b7fac6eaa16 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..974044875845b2511b9944ea97dcf2653b2525d5 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9693e9a99cb82fae346290195e1e79ad573d303dc449e71ca5981acba0f873a3 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d44cc0faa84bd8547435b89d16dbc800264d71a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e464e96b119adfac68d84541715fe651d01448cfeb0cce22fd8026a8221a942 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..733831005235146615156fe6bdc8b690d7b1580c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb42313d81fdceb45e50a6f5292b352906dae564d459ac3cf569e10f8188c2b +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5c93501751d059dfb2637417d9baec24234c1ab --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:786d6a7e8e67dca11c9f03072e4cdda74417cc30e48e7e0fb19445c3d40b0b78 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fb352ac46b5592e622dfa590138ffeb856a462e --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f76861ed81ac2701e236911b9d7b79501060678528595c433cba8d5584175c8 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4e7cc72534b933ad1e6fd0b4f17e7f3de2160cf --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd072428bff0ddbc04c5eef87ba9ea91d93a26eab3d4cdd974299dba59af722e +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d42d5af90c1cb0bcf8224c1c2f5afcf671c0087 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92797d11a3a1e37b9325230222c659885fb30a5f31b5df9febb35523bf3bb28f +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e27d29430d03b95fb31a5b9f4e7f07ee7599f47 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7627aecf8cb3bc955b26bc631ddeacc8748c663369ef66c0685a50544e9b4f7c +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a16988fca1bc2497eee0ebde8df2a7521c0c6265 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23eaeddb30679f9d90d4fc73ddea352c79d51a0f226529cfa8b2cf7a56ca4cd7 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6535d978219b5159a490e1d3b39cbb81f748e208 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee062a4680c4cf1439e9017d4e7c8084c4f6f36030fd475f4de729f223e72f6b +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fa33d8fe8297c60dd4550d725f880a00def83fa --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337717d7447e15db00671b9bcc0fdd7bc27f6f456bfabfc7ab4802b8222df9d4 +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..960ec094ca9ba7e2ece31ef44408ff3c7cda0478 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab89464a8cd125203130804ec8c9e8d5368f259da7543a50f7efb4656bcf14f6 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a748dbc2c41ba9239ebca47101dd608990e399 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b93a5d1b281cbcc7d64cc174a864f1734686aac4a999686f38cad3e6f4efbe +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99e43041a04832520ff685728000cf8066baa0fd --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214024796be78dd14efff89d4892a5b918481b69ed228b75cb861a50833af3df +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40229d652d3412a22a26f72c01ec4d0b690e7e65 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e4e86777a02d7e166921d78dbae8d5773c5e9ece71585f9c608806d62f8560 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df5bdf20d98d6cc8197c2db66f09de3547680744 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d665c6b950cd563f428fdcac3e2eb10a93fb69223e4cb6f31745ad8ea363ab59 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1b8b6f27b056178dc3819b09a8909b1e7f5f263 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09195be9001267c8ea36221fddc7a2226b55b9e66ba6cc7560bc4b2afa0ae928 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0ed350f5b144e14a3c61479f084ddd19a591a8f --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fc082615444e017df2a3300893c31be7ca921ee43361ff993d9442907fce2ec +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02771661e5f191df90b9bf02ccca1b92ac908156 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8ea8a318f8f2c7368238352d5a464fcbf89d87cbfbc5d945e0de15e4ea6be0 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40017bf70ca9d475da27273d32b821ed47b5fcc5 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51e7da38e4c4f2280347e56b0b92c42d7b0a32b6d6065ad42e4d83745d0e904 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..482733f5210e739f861d2e5e5d0a1f8fe8217456 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4f9207b9972e9b6c7a98ef578911848bec965f6e6e620e591c88463f2f90f24 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d76052d789123895baf2ac3ab9fd66622619102 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28bdfe6406d880cdfb3677f28356e042a7f70066795a3c0d4437e32a3eac2726 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a254a99f4ceb6244e44e95fd30489a18d7d299bd --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8324b3b2c9ff6e9e53bb32e290a2c2f0c1feddcbd07d61fe817d4bf673fbcb +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec5977eba0efb7984813974f1fe87158c87bc0e --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a440f9410186b6a6bf4ffa4193eaea25e0baea8216ab4d1a5e0963e0eea875b +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3a313593be06a0b2f17149314f0309c3190023f --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb85631e4d18b515faad0dd0309f57a161bab2500382dcbdddd41e66dabc8afd +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4381b89cb976376054284c81641eca5e0d5c1f --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f481120dbd042817cec74af1794b7bc1cd3d5cc79b5a440d233d9586320565ee +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ecfaa05deecd41e3abec3e38ec9c5b0a95daf64 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cae8928edd781d2a29f396c8eb600b7a5b7fca59f6aab058a025b354405aadb +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f13325f2aa24f4391bf520b7b34f6b9dff38052 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2251dcbff9d36905528f7358a57e5edefaf48938eeecb98ee3f9d869e7bc6f +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..350a6c89c7a683edde31c169a4177ded8c64bf50 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a64514f7b5a1e329c082a0798fb5257e46534dc5c76be54cf073aa6c335e29d +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fb1b7aec09144150e77750da28ff76099500158 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f3a25bba0aa64a65d9d824235c433db81e2aceca457d80d70d2f2957df5b126 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f9b520c9e1aa154fcc2d5c0bdf6d9be99e5796d --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c37f9122b52487bdf730d7208570bbdc4dae210b90540ab4bfb721a80ae924b +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf17496b4bd466b9d54d4c5238a6d91948cb705 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f045392afd1127808b2c1307b8f06f01dd7dc6f250ded1420f4d87d92c43fb +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c86ed505633b9357749e309cf72b1b0ad11e21e --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2bdd6a581a51b34ef26e1c1d1951fccce8c53c2e9f97ce8a33ae59db172e483 +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef94de21a9189154e93727d0186b6699f2e5be3b --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81378beb60e2aca04a5a64bdcf1715e03283beff40faac13330f31561ca92f7f +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d5bcba2977b8e4232abac1d00e03d274aa918e8 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d58891128d56a8b40245a92bf01d3d88bfd651033ff6a77e6933b92c8fea3f +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21e5b710af419a2e38563348358f42f283135f51 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:504d320b48136e969fb5e8dcfc714c32ad30fd3e3349ab864548e00e26561dd6 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cfd3f5082446a26de3df98af7b2b4296cb327e4 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7025de5ea0dc022ab50b97b3ff4506f004e3b7d7158fed4d82a5b20bdc235210 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72c0d2c06d1198f07ae98d575a7555848ce750b2 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a38759f1d4a07c9741f8b6a0fc7abdde0d69b2c313f709f4977c5b4e0f58a29 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62aaae7e63e65c9ddaa95981bf2e8ac3514a13e7 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d377e8f50c4ff132e3df46f043a9c6a05d9eb37a592459dcd57e515e8f9310 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5511f5ad149a59416cfcfbcbe133a0a0fef55e2f --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d46c4601afc99ae514051cbb66540658392ce92efb68499524c52618a4ee8f +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09d5c799ab6304509bddf4a851dcd36d09dfa271 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56c53e233b579e74b966d4228fe77c96ea7563d11c9ee085fb5f9dfa40ae3f5 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72d8a23ac54f8be89aa036ec717f358f3085c195 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b677b98ee6f7d7b8b769d2212576dc526524935283e3bc6444a1882a66a59b7 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..807aca308d137a29a7245f9ed4cde3ab35c317d2 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77e07b52e6bf3697bc8f40a636226ad418bb2f4061621d76d0cc4d8ae34630c8 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5866a471ba9a0137ad7e60abce2f4a1ceca7adf --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee05461ad95ac7e4bc353abb30abe0fdda7962f1f0f885c00efafd95fedf6de3 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5709b623560bc21ff32be8b5372449539d246308 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d7be75480caf9a3b6b5f48840bf773d1c95cf35ef07c93bc33178345485a6a +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..633ddf9e01e52d00e84d8279b92ac9397003d147 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ad67b864ce6362d758fa038691952908ad6fdcc7d2a197eb9bb443526d2e53d +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8292b891139d40b1cbbbc2362db165359836527a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5604a7510436a7dd66294333100afaffaf35bfaa8b7f1b0cec24e4f529f9fae +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1342403cf8ad082886b991e96641cc738f5b9b2 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0df7f22ccf650fafba9c2e137ff13d509e7bc201556ae0996188a942913d385 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66bb9177164dac93a69abf0290b86f4e898b8528 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ef803f2c6e37d48c4ac79d727d1af02aec642678bb3fdd97424b56bec3e8456 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..652fb4454b2dac6bf8a5f9d11cab4b942a863a5e --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a5a0b1c472ee1b011313a74b5e31973ebdeeedfbab8f65ef314191a6d5ea733 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6daa274b3cabd6f4c84754a8c1c2fdd2fc1fc35 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:868f8a4d177996faf4b2656746b990d6351aa340e8794946dc2afce69f57c571 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fca9faea5b07ead22303d19acc2ddda0acf6d176 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c62a111fba221fbd90dbed4e1ada2a6af0d08d4a34acc30a4453bcaf97a85cf +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd8ed8066e8463fd9ca4a10cd33f3ab5ea88efee --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e350f8281e5c55c75960182151766cb6c57a3452483789c509b111c8c0daac89 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..305808b2afbf40e46ab02edd3662c87fc1fba46e --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0369fdeaca67e74aad49ac94f265f07b26c97a84ac2466e7b25da3b91c85f012 +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2e0257f28fc15b0245a960a4932a46a4951eda9 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eadf096567adcc2134ef8d9416ecb3c41bea8155ae510345a707dce1305c4af +size 199058647 diff --git a/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8be45f4d687bed2b43778fff7867a8a6a6c288e --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f14d82064f5e64bde9b378e8f0a97ad683db28ad0f4c27b8efc36253cf80501 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f5ed20a7c6be8973d996a75182cd5751adc8643 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568402d6d7eb390639640a4bb896879f0121426c018ea4ffffaf32415ba4eef0 +size 199058850 diff --git a/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f424fd23f26090044fb14899dcd317e9fe47c8f8 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b090f0e50f475b7481ef4fa959227334a1a81921a61bd88c1ca740155a30ae +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fdae1da9d4a38acc91d54c10a7f864bc785285d --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3961b339b60fc3ca8c704e95797537e1d78f9cd34a89c16f85f75074d31c923c +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e07e91b7723ca8278b1281281620cda60fd97c2 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d628dea2cffe63ecc015a3a1406e80d6123627059932593301ec620e2b70f1 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a1fb3f717c5e80aa25c362412b36bedb895586 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:280ea73fd6dbca78724aa2034dbcf8289ead160ba701f77103d2fcc0fd71b581 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f29c9c5278f70f08efb3734c36a0f27ea4d2ab3a --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730490c9214d7c6175750b84e5dc1589c7c3e6ac6c29507c5eb86363e20f75b6 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57e8a1f32ef15e622f2d89e28cd95cced130b68b --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855306a115386af22655ac2d748f7bffbe0a9be373096955a31a9dd2ae7d688e +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11cd6fe9569573174cc4bcd66750c4aa5cbf4bb1 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d3931b85eaa00342b0e47dfea5fe3e516656fc8fb5b68af3e9e273131202506 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2426d856e0b49a325191600f5cb0adf6dc31c733 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc45ebabd03b7657a046f7c8f77db8476375888f00452430393276c4515ef2d8 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71dd4d618105997a9a74f31d9dce0a539dd912c3 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f439213bda60fb3709775a7ddb641193e882b1494432b98bc3bd5ecefc0b86 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98e360caefc7a6986aa7312a25f899c7e671af3c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4716fc7d49d88c0eef3112305602d4d29dd7ee5f695d0bca4a4bcd85e26711 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7dabb6566ac31759cf7e09be77f739859113871 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a6afd4a3a47c4b438e2df5a0685aebe90d66ec41368b665435289c7b34313d +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4a0f97aa2381c2fb2e315abd3f6b2c787127c7c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd35367f92a57fcb9bea1a11bbacc1853b28261ee2f7f8aa01da94bdb823f0b6 +size 199058722 diff --git a/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e944564d247134abc9ecc12a8f2a06ab2b61684 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2205e1e576a419aac93f2f8c4d8f4c098859a113ca1412ca03d3f3e36b534b07 +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52bf170dee2f00bd368eafd120ce199b773cffdd --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76e1dce1b9f38285d196dda55a6c849f9fdc178669d22efe0e046f2f0fe79ac +size 199058786 diff --git a/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cf50866a4bdef959e2504a969ba442fb187af6e --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f167ed72dfdaf61598de9eeebc204f93f2c49bd9fb1ce6a3bd81ab1dfb6cf638 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79365ee4c507cbf7ce2e4e7aea63bce60e16133c --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb91c18dd79bb3e5aa2ae7918076d65c1af89e7f3c268c7bf5f9fb38b59b4d3 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db06c6fcfd6a3a646599967b99e86a60661abe1 --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3853a2c58dc76dd240c1179f7bff84f7b21c2ac1918c3e6b6f661f72c33cb779 +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbc2fcc39c18de8f93072f026466f77e19bc389e --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e931e23dcb1d01fa3a183763f6cf1178f3cd5fcabcf537f78941392036077e +size 199058658 diff --git a/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cd66f17ead49290956b203fcb97f666b7cae697 --- /dev/null +++ 
b/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa904ab83309e85c79e69aa38bcc0967400936cd3393f245a6ea52dc7bb96dc9 +size 199058839 diff --git a/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e0b2aea93b43d7f356c2510bdcb88038bb9022b --- /dev/null +++ b/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b8cfba3db7a840ea52508cbe26e56909b618dfdd504aed4d88dc961c84504c +size 199058839 diff --git a/global_step80108/layer_01-model_00-model_states.pt b/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c80b9ebd00d7ec3e8b7daa0e0b8a55c7d4f26f40 --- /dev/null +++ b/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fade3cad578dc7fb3921f0cdc8c98a444f9bf4157cc1df1f683558114f2dacba +size 167511299 diff --git a/global_step80108/layer_01-model_01-model_states.pt b/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a1835d34767a8c84b15e5ff38c6ef6dc7088500 --- /dev/null +++ b/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d47d60552056e0ea32f23678d28741fc2723bf5e088f160c6e1a3c334d69d37 +size 167511299 diff --git a/global_step80108/layer_03-model_00-model_states.pt b/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f49913a9ef932361dcaf4fc676d126933ad9fabd --- /dev/null +++ b/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:bbf704dfb23714f8b93db8489b3dcf090dd598e739105b8c2d496235f7c211e0 +size 113308931 diff --git a/global_step80108/layer_03-model_01-model_states.pt b/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae0e6c276368875caedb9565743c2c05f00e232a --- /dev/null +++ b/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b0e1bd12b63ffe1c8d48682742747b26b2e7036d2f954ad5058694fc481ea2e +size 113308931 diff --git a/global_step80108/layer_04-model_00-model_states.pt b/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b52b683dfd1ee9015cb8405268b97043388a077 --- /dev/null +++ b/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d7c863f02f31df6a9c5310b51fd7470cdcba016ce4fdad0ab278284135e3ac +size 113308931 diff --git a/global_step80108/layer_04-model_01-model_states.pt b/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90088a039771af5028367299df6f9075727338cc --- /dev/null +++ b/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2651f621c5fa44dffe7c133e3cf0c0489004bad7463c74391eebcb316a01d16 +size 113308931 diff --git a/global_step80108/layer_05-model_00-model_states.pt b/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4448a5b17507c2a3543d7c411dcc63cf196f5f96 --- /dev/null +++ b/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9412d8fa996c7eda09ab2792a6a3cd77a32c3a10e8b96cb74bfcf4ef7d67cd +size 113308931 diff --git a/global_step80108/layer_05-model_01-model_states.pt 
b/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5235fd487c2663160f50682561098b311b3e7b47 --- /dev/null +++ b/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59165b6896e2f6c57317011824a15317a47f0472a0155c1606ea3f24f6200ec9 +size 113308931 diff --git a/global_step80108/layer_06-model_00-model_states.pt b/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c12262dd90f8194b01669b2e116f02aac5b73836 --- /dev/null +++ b/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01e20ff64fa3696c159620de624c858adc0ce7225430754d5ee07bdd0eed736b +size 113308931 diff --git a/global_step80108/layer_06-model_01-model_states.pt b/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbe0e8a707cf8a4301b76df68d480571c7fcca15 --- /dev/null +++ b/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28fad109e1784993074e59e38f41864ee44a71f9743f5fe10b7482efb49a4e27 +size 113308931 diff --git a/global_step80108/layer_07-model_00-model_states.pt b/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..373e9c8b6898a3f73ab10ec12ac501f0daeb4d3c --- /dev/null +++ b/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cec13c651985e20f1533d0c50f93010de165a033ddde6372fae9272cf186ea1 +size 113308931 diff --git a/global_step80108/layer_07-model_01-model_states.pt b/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8287c283818fdda517d244c6678402146253a3 --- /dev/null +++ 
b/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177df7920629fde6a34a67efc6b08361ecaf29f6f16c257f7322ccff3b2bbaea +size 113308931 diff --git a/global_step80108/layer_08-model_00-model_states.pt b/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2981c56be62ad9585f808554d4759175005a3466 --- /dev/null +++ b/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1ca10eba24023b254f4fb40d0f65e8196afcd0182f8ab19aae5bfb95392125 +size 113308931 diff --git a/global_step80108/layer_08-model_01-model_states.pt b/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53ac049cc24ca2ce9f69f039b589b48fec95aed7 --- /dev/null +++ b/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec3965a46c4c5e657b844e0f237e7569d71cb52e750edb5f01ef473d9919182a +size 113308931 diff --git a/global_step80108/layer_09-model_00-model_states.pt b/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..833d519dec84ea4676ab507aec2c2a7fedf326ce --- /dev/null +++ b/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be6e879a1099696e6cde870143099dcbdb051887fbbe156f7f472334ddca087 +size 113308931 diff --git a/global_step80108/layer_09-model_01-model_states.pt b/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88bcfa705bf3925ee48c2a593311194d192ff75a --- /dev/null +++ b/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:471f1e77a8bb6910d5fb1173233c808fccb99b1296cb8a6ea6ea3a7f27fd384f +size 
113308931 diff --git a/global_step80108/layer_10-model_00-model_states.pt b/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c417f950a6ff34ef1c2b73d6cf2d926c3abe4da4 --- /dev/null +++ b/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff5d4a495b3a0fe966e7d2b5ce6e304b8ed3b78b26eb47ecabe8ecb4bfffe7ec +size 113308931 diff --git a/global_step80108/layer_10-model_01-model_states.pt b/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5cefe1ba71a47f54018b471b5895eb3fda55cfd --- /dev/null +++ b/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d3e807f0fabaad00435fd4d2dbff4f3225282231c0aef747036e1300e864ad +size 113308931 diff --git a/global_step80108/layer_11-model_00-model_states.pt b/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..796ab724a28cff3990f409e4d97f723c6f1cb32a --- /dev/null +++ b/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b71782511b9640b88afe940c22536b858f99ebc5228289c68e6fdafa1a55fe +size 113308931 diff --git a/global_step80108/layer_11-model_01-model_states.pt b/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3552b424f13cc53cf24aa115dab5c96e5851280a --- /dev/null +++ b/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:427f7a514d635fac57cc9832ecd0e3ea951dfa6edcf1d916fd791dfca862a0b4 +size 113308931 diff --git a/global_step80108/layer_12-model_00-model_states.pt b/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..30b11774fdeb74e0dd44249046ce153d6eaac882 --- /dev/null +++ b/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd94bc9a2cfd56485632afecf20406bbe9d0e0cc13de60e3f46f01af5dcc461 +size 113308931 diff --git a/global_step80108/layer_12-model_01-model_states.pt b/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b53cc6b06dfac56b824a3d427e065a6a93b16a10 --- /dev/null +++ b/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d27d54ad0d7a129e1da8598cadf053214b9faed9db3fae6b1a54b0d9202a6a8 +size 113308931 diff --git a/global_step80108/layer_13-model_00-model_states.pt b/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cb6b1c3531ec9384014a24340b169d8d33df167 --- /dev/null +++ b/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ac49c6c6646bd0243890726ee2c6c8c57804ce3b1c5f1902a30d48e72bb739 +size 113308931 diff --git a/global_step80108/layer_13-model_01-model_states.pt b/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec5167aff768536eda8d7af76b61a5529b93e5e9 --- /dev/null +++ b/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24369878c4da5db5e346341b01c339f71cfcc4d5c0b4ef99266647ec703245da +size 113308931 diff --git a/global_step80108/layer_14-model_00-model_states.pt b/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a538fd27d2893784ae7b5a597273fb198f6dc06 --- /dev/null +++ b/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:4adb868af5fefc0aeea2be7cb9d7c90a3c33f655d208b988b26cd08941c2398f +size 113308931 diff --git a/global_step80108/layer_14-model_01-model_states.pt b/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41f6560cb9f0d66f762a55dc645c7ec62c08f573 --- /dev/null +++ b/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b124b34efbdec3a8cb8518b6f95df0a13159c41602e6a209b71e7b657785b5d0 +size 113308931 diff --git a/global_step80108/layer_15-model_00-model_states.pt b/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b911a9b2afd71ab455270bc39915fa0abc302731 --- /dev/null +++ b/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cebe42cef9aae088f3e3bd3ec566d35809fa69c793e6adf4b49445a2d0ae37b +size 113308931 diff --git a/global_step80108/layer_15-model_01-model_states.pt b/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9a234b43dddf2f9d24e29e351381a42a87e4633 --- /dev/null +++ b/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720a9c21390ae9832a7153198fc211ab0c9d8e9aebbe39c62238b23b871148d2 +size 113308931 diff --git a/global_step80108/layer_16-model_00-model_states.pt b/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..149330a338c897434d6d447b6cf933bfb9feb547 --- /dev/null +++ b/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654f8a6946cc68299c77099efa549b2f1eba764004f176b4443f35d0937f0d09 +size 113308931 diff --git a/global_step80108/layer_16-model_01-model_states.pt 
b/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d50f3810aa109062be6fa89ebfc3550be523159 --- /dev/null +++ b/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95dd799335224efc1a7cb9c42bcaee9e0731458c661e46f3a95f2711fa4ce1d0 +size 113308931 diff --git a/global_step80108/layer_17-model_00-model_states.pt b/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e4abee7f8f10ff69480832b7626e6b1480b8602 --- /dev/null +++ b/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13035df0c3bedeec75e214092fa3cd4bc43afd813b01d179a8d748d1874155dd +size 113308931 diff --git a/global_step80108/layer_17-model_01-model_states.pt b/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ff3c04504228525b44ce2eda8dafabd87255359 --- /dev/null +++ b/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:223a4c57de0751d8d31c66a17583e8f977894095484833a24e5572e3db188be8 +size 113308931 diff --git a/global_step80108/layer_18-model_00-model_states.pt b/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47a80d7a764f49e62ef92671299bf84d0ccc638f --- /dev/null +++ b/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7c730ec1aea8411cd2e3de0c2b4b6dd250a322e52050d3a983169f15a13024 +size 113308931 diff --git a/global_step80108/layer_18-model_01-model_states.pt b/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..445b7bea95d7057aa167c189c385751b39606396 --- /dev/null +++ 
b/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1ad8a75cf90b45cb4229b9a255ff5247d366bf5dcc54497126a943d26c1eb3 +size 113308931 diff --git a/global_step80108/layer_19-model_00-model_states.pt b/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9f291f62b3357565edef96dc9fa8032aa518440 --- /dev/null +++ b/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91d7914767c0b07eda557864afb9050d644bccdea8873bcf888873726cbc377b +size 113308931 diff --git a/global_step80108/layer_19-model_01-model_states.pt b/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21f2bafa92270375ee73d7859c5e6616f1de69e3 --- /dev/null +++ b/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc9fa678ff347f1b15e03b22beb5c5c1096cd530dd267a60f26db653515319be +size 113308931 diff --git a/global_step80108/layer_20-model_00-model_states.pt b/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d86b6a9a52434a87185a3c3b8921f2502010ecb --- /dev/null +++ b/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a4f2e9f26a0f88b624a02de6667c485f9355e67e3e5d126f86304aad394bc8 +size 113308931 diff --git a/global_step80108/layer_20-model_01-model_states.pt b/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f6451d0ca4903adc627688516bcf1565b07be1 --- /dev/null +++ b/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080b58caadd7cb13cd3c1479e53fb1296655f4853668fe34c5b5d1dbd99dc025 +size 
113308931 diff --git a/global_step80108/layer_21-model_00-model_states.pt b/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa6ee8779f4cc326699fcd44b9beab3df4ea83e1 --- /dev/null +++ b/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c14aa37d1819e2250fd9a536497ff7c33b73ccb4a2a6176fba42f36cdef2d2c +size 113308931 diff --git a/global_step80108/layer_21-model_01-model_states.pt b/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff5d3140cb9a0f6abcb4a401bc528c2150c929b6 --- /dev/null +++ b/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3204183a685d3ffd33de410f1dd72f85facc3e2179b59dc2ded47128321ff8 +size 113308931 diff --git a/global_step80108/layer_22-model_00-model_states.pt b/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6709958d94e83206eb9e7ac4902810af19e44c6c --- /dev/null +++ b/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a15e2003f6f818675713bd5f8153414244aaebfb96932ee1967fbfd5cd9ed3 +size 113308931 diff --git a/global_step80108/layer_22-model_01-model_states.pt b/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e7279ea96ef3baa8073c9b5bee050b72b38dcc5 --- /dev/null +++ b/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dfcf385a0ca775a4cb3967794a5a2f10c66716e8a3969076a6c8a8028febacc +size 113308931 diff --git a/global_step80108/layer_23-model_00-model_states.pt b/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..6093364a0268dd441388bff99779e36eba126cd8 --- /dev/null +++ b/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59cad3e28f31ab7aee4c3570bba38e8ce1fc27c6c18ae36c7b26b79f4104cbc3 +size 113308931 diff --git a/global_step80108/layer_23-model_01-model_states.pt b/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fc1f0c6b297b831edcab5c654563f0e28d4a44f --- /dev/null +++ b/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10c3c892fdb385e33bfd44e051801e3faf749f83e24b2fcac9867aad3dcbc2b +size 113308931 diff --git a/global_step80108/layer_24-model_00-model_states.pt b/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..934d354684bb463af9b4fa4b03129fa99c1738b3 --- /dev/null +++ b/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0c85313200f5f04b75d636e09d86e94910d87dfccf90d345859c2b4bd3b815 +size 113308931 diff --git a/global_step80108/layer_24-model_01-model_states.pt b/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf2948ccdba0ac6ed004eab6665d4091f3b1425 --- /dev/null +++ b/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704c9078708502bbf3df7b4199268768e88ddc321bd0b2564698967d81d73e29 +size 113308931 diff --git a/global_step80108/layer_25-model_00-model_states.pt b/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3f3e3fcfce746672e7c42b2141fb3e620325e64 --- /dev/null +++ b/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:a6373047c3497fd3257a6d0f9d73ecf29cfb15e9e8a1c4989281f07ddb8141f8 +size 113308931 diff --git a/global_step80108/layer_25-model_01-model_states.pt b/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a07e783d5ccbc0371dd6fb77d92de2bc8c049c4 --- /dev/null +++ b/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ae1a622f08935efc9c1e32e40a6a997a5590c8e9e330924e322a57d149cce95 +size 113308931 diff --git a/global_step80108/layer_26-model_00-model_states.pt b/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1372c70a457a23979b97e5506c9948adcf560b34 --- /dev/null +++ b/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d9e8abd42355a4742cb487330428c11882776261878dccd5a791043b11ac17 +size 113308931 diff --git a/global_step80108/layer_26-model_01-model_states.pt b/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c4a4c77071e3b81041a2ec3d50b877c11ad89fd --- /dev/null +++ b/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9263ff20b0d16fcf7b4126f87f65011a0fcc99a924614ec52674f33d644bbc69 +size 113308931 diff --git a/global_step80108/layer_27-model_00-model_states.pt b/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df6c55cff2794031da2b8f669eee7f3d1a596854 --- /dev/null +++ b/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f831b8ffd6201adc342beb5f37c0448babfeeaabf706724b1c853c6ffeaa1fd0 +size 113308931 diff --git a/global_step80108/layer_27-model_01-model_states.pt 
b/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d868e6abb3b17d91c94768dd966d7d1b3421cee0 --- /dev/null +++ b/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c06a7e4dc1e781defe6248569d5b2a737114112462b5473a790e807bbbbec5a8 +size 113308931 diff --git a/global_step80108/layer_28-model_00-model_states.pt b/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e28be3230e5477ebdf0cb445052c2b31a85f4bec --- /dev/null +++ b/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2ff730f4ffe77777d43cf937eea4604c6d61f9d806b13be5c86c14e6328da1 +size 113308931 diff --git a/global_step80108/layer_28-model_01-model_states.pt b/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6784f73578a35fd7bbeacc9abf63ecc594e04c3f --- /dev/null +++ b/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad588b6b0e7fdda122f85a0c93ffc23056d741d5cdd8ddd92d101cafebb1102 +size 113308931 diff --git a/global_step80108/layer_29-model_00-model_states.pt b/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6838f33c71bd97aa59b62ea8725e6803da11794 --- /dev/null +++ b/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd0060d952f51f1c8b6055cb555dffc35b6e767a574321876411fe84971ac13 +size 113308931 diff --git a/global_step80108/layer_29-model_01-model_states.pt b/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05a7d0c61a032c8d0d28c7499e14516407d52607 --- /dev/null +++ 
b/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364dee0374b3ebbe6b3d4841adce6e9c8d998111e85eaa8fc2ac7e8ec941c1a2 +size 113308931 diff --git a/global_step80108/layer_30-model_00-model_states.pt b/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbb1c90d1bfe324b5aa609d44d50f258edbcf7ee --- /dev/null +++ b/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db5cbb27fecc75877b03f95c765520cda259428a78f8a48f6de3ffe8579bfaa1 +size 113308931 diff --git a/global_step80108/layer_30-model_01-model_states.pt b/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3187d28e7b2bc92ec9dd8edcf9c6328e2122620b --- /dev/null +++ b/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1272f9f2b14edda2f42e1a28ba75a8445fb31a3e4c00a08d2a6fae2876501538 +size 113308931 diff --git a/global_step80108/layer_31-model_00-model_states.pt b/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e21cc1db04639531f81b194e9c9c15cf616e16ce --- /dev/null +++ b/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd54e3e88bc5028341d6f1fdef557e725754d40e496df9c55eba1af05eb93d7 +size 113308931 diff --git a/global_step80108/layer_31-model_01-model_states.pt b/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20dd317b0f3481c87164cc3e24916e3da589f926 --- /dev/null +++ b/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c54e6e3dcf59cb8c7c14d483488a0424f3b909961b662c0ef04d91b18f8505e +size 
113308931 diff --git a/global_step80108/layer_32-model_00-model_states.pt b/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc85d475de367ed3d5f2cb168edc1e46455cd9fa --- /dev/null +++ b/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3682c3a5e3ba118686615003740c2a9ac1d5a2e5a3e18851b3079e0f014086d +size 113308931 diff --git a/global_step80108/layer_32-model_01-model_states.pt b/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9d7078348fdf3330d34d0930c944b96025e2a34 --- /dev/null +++ b/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f61b0e1154733b88120d5a047dd69f28f5b529a325bea0b39e4569951e3995a +size 113308931 diff --git a/global_step80108/layer_33-model_00-model_states.pt b/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0677f6a566913350e2575220b9047a833bd3fbd --- /dev/null +++ b/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c111a2381e0e722e44243e9baa1b423d5accbd7412c6348752b98b65ce50388 +size 113308931 diff --git a/global_step80108/layer_33-model_01-model_states.pt b/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e303cff557dde33283cab2ff425baa7e0a4223f1 --- /dev/null +++ b/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa503744e4eab2014bd4efb7338fb719b9af97cb758de453739b763fda8fc58 +size 113308931 diff --git a/global_step80108/layer_34-model_00-model_states.pt b/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..8fcce9608e1b762f12251acdc508443672bdba51 --- /dev/null +++ b/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888ec64b9d2ffd38e058f98c0813f751c0ffacda469c0b334f05ebe21f11aa0d +size 113308931 diff --git a/global_step80108/layer_34-model_01-model_states.pt b/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0edba489c6ae02b36dbb8ce4b7eebb686c9710e2 --- /dev/null +++ b/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803411a6d5aff672e6374ab64fe34534e9397e1531ad2c141832a2a55a6de9f9 +size 113308931 diff --git a/global_step80108/layer_35-model_00-model_states.pt b/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc217f02b368e701ccf0e1257c87e786f9c407c7 --- /dev/null +++ b/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6029e8b66e12ac755a5044bc7fa2f74d7f4084794f70023b777665d83ce817c6 +size 113308931 diff --git a/global_step80108/layer_35-model_01-model_states.pt b/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ec9f47d4c8143cf19ac51b42cd8c53e473923db --- /dev/null +++ b/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19685d11ef1f6ab4f4865f655190471dfa532337a32bcc0c83f3e81146a2ba4a +size 113308931 diff --git a/global_step80108/layer_36-model_00-model_states.pt b/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3075cbca55ba87dc528d13fdac45de6afa393eff --- /dev/null +++ b/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:664651814970a96a55024e15f4fef0a489d61cccb4468916bcbfae8df38ada42 +size 113308931 diff --git a/global_step80108/layer_36-model_01-model_states.pt b/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb80942c580a46fec2d9788d5ef38adb01321982 --- /dev/null +++ b/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74d7400254bcd534071f24f960dface432ca6ad954ff50824c3dc2288dc55a30 +size 113308931 diff --git a/global_step80108/layer_37-model_00-model_states.pt b/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6d7aae2328d212b0853dc23438018e4ab592463 --- /dev/null +++ b/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97292cda0e99bedbd7e05267a138ff61507aec49633d47e914629032785a287e +size 113308931 diff --git a/global_step80108/layer_37-model_01-model_states.pt b/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..510e4431506fe1e62842c2f3eb012f27d59f5aea --- /dev/null +++ b/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8a1bd9600dae26fe304d0bdb785b96ebf6b9759f76e6a46baaaed78b26244b0 +size 113308931 diff --git a/global_step80108/layer_38-model_00-model_states.pt b/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e96f63b03b0664bbd4f84d804ad7d3498ed5ea2 --- /dev/null +++ b/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3b3a4c4c9224b42b680b63936535b892713de0cccd8f5a22936851ff40caa1b +size 113308931 diff --git a/global_step80108/layer_38-model_01-model_states.pt 
b/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39c74f1a3ef013b3a885c043667754525a7e9e0d --- /dev/null +++ b/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200d09ded7cfffd0821734f612f46cc74c966dd58309e13b960d0435cce76d6c +size 113308931 diff --git a/global_step80108/layer_40-model_00-model_states.pt b/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e37b01085746fb7e45b195a2768669f1b4192a5 --- /dev/null +++ b/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f95c65426d24c9dce4b24bc2cd6e8ecce48cba9ec66ed11d60267678f29e36c +size 13507 diff --git a/global_step80108/layer_40-model_01-model_states.pt b/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2665f4b568fa29a7a6ffdd942b4a310817e4d53 --- /dev/null +++ b/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:424d9f749341c97a99ff33ff195e9a90a9c683e3c60c7ea0ded6573ba9095725 +size 13507 diff --git a/global_step80108/mp_rank_00_model_states.pt b/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef15ddd746abcc20bf4c4c6bf3705961e46df6d8 --- /dev/null +++ b/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fc1cec0a464e3ba3c225623910ffedcc47d48c0a6c612999781bd44c469eeec +size 51699 diff --git a/global_step80108/mp_rank_01_model_states.pt b/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..340d407a992dfb4698f0550e4f6097fabc4b49b6 --- /dev/null +++ b/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:c467e202a0888490de224294b4bff494f1dc9ef225216cd43f080d61572ab528 +size 51699 diff --git a/sbatch_4b284b84boscarroots.sh b/sbatch_4b284b84boscarroots.sh new file mode 100644 index 0000000000000000000000000000000000000000..9f1cbc6ee3766eabbe2e828d9247091a748cf9b1 --- /dev/null +++ b/sbatch_4b284b84boscarroots.sh @@ -0,0 +1,163 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=40 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=4b284b84boscarroots + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=checkpoints_$VARIANT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" + +TRAIN_DATA_PATH=trainoscarroots.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/oscar_megatron/gpt2tok_oscar_text_document" +VALID_DATA_PATH=valc4oscar.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=2 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) 
+GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_4516M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=10000 + +# Tokens: 84_000_000_000 +# -> Samples: 41_015_625.0 +TRAIN_SAMPLES=41_015_625 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.95 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 410_156 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 1000 \ + --eval-iters 100 \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat <<EOF > $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, +
"wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1676998777.nid007155.119433.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1676998777.nid007155.119433.0 new file mode 100644 index 0000000000000000000000000000000000000000..341129c15f98c884bb738d383d2ec46da354c5ea --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1676998777.nid007155.119433.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddff7e539101d3f6261203377c567886c4f760c52bbbd957c5cec70067764f75 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1676999340.nid005745.63112.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1676999340.nid005745.63112.0 new file mode 100644 index 0000000000000000000000000000000000000000..c40f78ef3b0ebd9b79feeb5b59fdb7dbafb4e19d --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1676999340.nid005745.63112.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:288452913c04a3136210e1ad2a3143ef88933111fa4f968e2149c5a1dc7d07a9 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1676999874.nid007155.128286.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1676999874.nid007155.128286.0 new file mode 100644 index 
0000000000000000000000000000000000000000..c4a41677ef646a6a63c92e34ca7fe750a8a13eaf --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1676999874.nid007155.128286.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e5e63f7045848b453abac6b37bc3a662aef16e866ea839be4667b2ab96c31d6 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677000305.nid006969.41855.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677000305.nid006969.41855.0 new file mode 100644 index 0000000000000000000000000000000000000000..fb1d1c278222c5123b538d3db2e5669cc102680a --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677000305.nid006969.41855.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f00d6d18d383ef3c667de70a18343a519faa043974d2458c3abbc9201a5ddac +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677000834.nid006761.8011.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677000834.nid006761.8011.0 new file mode 100644 index 0000000000000000000000000000000000000000..22223abd97a2c7cb87b25c60deb63d7a4a08b924 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677000834.nid006761.8011.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca030a3bb5bdfb9e76fcbe42ba9f9216faddecf01c22905cbe4d290d18c80254 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677001319.nid005631.7331.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677001319.nid005631.7331.0 new file mode 100644 index 0000000000000000000000000000000000000000..62236b910e21b5365f3142b70948dfdc33b9fab6 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677001319.nid005631.7331.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137011849a4a4bd05e49a1dbbb6fe17efbee8830560fd5663fe718df119d6bc2 +size 40 diff --git 
a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677001852.nid005939.4981.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677001852.nid005939.4981.0 new file mode 100644 index 0000000000000000000000000000000000000000..bb3e552bfdb33c6ab72ebad5bc1b60bc0b752858 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677001852.nid005939.4981.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32d62874cc78a28154d1328b065fd85f5ef8015f548bb06a780f8be615794ba +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677002394.nid006761.25387.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677002394.nid006761.25387.0 new file mode 100644 index 0000000000000000000000000000000000000000..4093a9b5cb7354beca450af2586f952f057cf699 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677002394.nid006761.25387.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf54ff345f8998bf4aee4e74032cd3e97c95e9d5addb4237be7ea9ccfdecc7b9 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677022263.nid005197.96401.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677022263.nid005197.96401.0 new file mode 100644 index 0000000000000000000000000000000000000000..8b14d487c09f27fcd8a77963b714a3f13cbf9539 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677022263.nid005197.96401.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56478b5de481f9f9ba4afcc855d3127b8f95389fa8a60980093469325e66a011 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677022676.nid006444.116684.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677022676.nid006444.116684.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d42d1363b2a7e076fe924ab1cb003d6cb2e28cb --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677022676.nid006444.116684.0 @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:24765adc4ca7dfb0c618e7ca48749fa1ed1d62016e243d7b598bf953c540a94d +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023079.nid006885.99312.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023079.nid006885.99312.0 new file mode 100644 index 0000000000000000000000000000000000000000..e182b33d0ecf199eb35fb1b42fb8af6f467baae3 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023079.nid006885.99312.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ea2d33eded76f62c2d8ef3b66889059dcc55fb8aebf0489d6c587fe5e92690 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023491.nid007155.125746.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023491.nid007155.125746.0 new file mode 100644 index 0000000000000000000000000000000000000000..415166a082ad6a0fded48e77076f1442e92a88f0 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023491.nid007155.125746.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29f98843c9f25ee79de085d95ecf7bf6c59089c05ccf6b92c126a1a27be984d +size 19750 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023931.nid005197.126630.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023931.nid005197.126630.0 new file mode 100644 index 0000000000000000000000000000000000000000..af921fa9ef4f18e2eb1815c708290c621ec5d94b --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677023931.nid005197.126630.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5af1e7269d07738d051b6ae029d62c238f65f4a36bc41817663f729a7190b9d7 +size 19750 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677024363.nid006885.119687.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677024363.nid006885.119687.0 new file mode 100644 index 
0000000000000000000000000000000000000000..e3096a70f6e5b477d61c97a91a7d9a0d1bd601a3 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677024363.nid006885.119687.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3486cc141158ba621b86943b7a72c0846af17810b4dd37e43419a27730df8c4 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677024786.nid007155.9609.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677024786.nid007155.9609.0 new file mode 100644 index 0000000000000000000000000000000000000000..4665fbbbc0fc8dafaf571efcd15160c861b83bd7 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677024786.nid007155.9609.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95751f34a668d7166329c418ce41fea273a0fdc572d1dae7dd0871cfca034b5e +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677025204.nid005287.53125.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677025204.nid005287.53125.0 new file mode 100644 index 0000000000000000000000000000000000000000..d84dfa95b2149e74a1030872ecea5f82f23b31ca --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677025204.nid005287.53125.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631bd79ad9350d0fa30035352520305c306b3359e5e46b02f531d63011108ebc +size 68027574 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677133867.nid006069.7921.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677133867.nid006069.7921.0 new file mode 100644 index 0000000000000000000000000000000000000000..42463ac6866cea197bb2f371806595845d86f776 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677133867.nid006069.7921.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d336102b1a108992453c9ac156dd68820d08d91c532f690cc5c70d512ccddf +size 40 diff --git 
a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677134383.nid006069.16302.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677134383.nid006069.16302.0 new file mode 100644 index 0000000000000000000000000000000000000000..07fff9a3a2200e685f9ce58236b1d75362feee66 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677134383.nid006069.16302.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f853dd2b58ab051bc8bc4b53ec348cd7f0c66ff14d8272cb2d9ce713f5c21831 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677134821.nid005588.113912.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677134821.nid005588.113912.0 new file mode 100644 index 0000000000000000000000000000000000000000..7bc8ba2cd1a56055a6aee179ed6b4d9d69425ea0 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677134821.nid005588.113912.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9587c08fed8115a7ad53f0503d744cea429387d12a344881c004d697d860a0d7 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677135265.nid005588.122395.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677135265.nid005588.122395.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e6a9836e1875d1afcbc8ecb8d5843bacbe3523d --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677135265.nid005588.122395.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8457e2f216b513facd805986a7be26b6848c29fd0f9d1db76d58d3e22b71c0b8 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677135701.nid007109.129173.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677135701.nid007109.129173.0 new file mode 100644 index 0000000000000000000000000000000000000000..73a7f9b85a3d65cf7a7f53d6220d1fd73cc09e32 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677135701.nid007109.129173.0 @@ -0,0 
+1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e4304c11ac51b7d7dc235b08c72676783d911db0f5282ed79829d56d8388bc +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677136158.nid005240.38842.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677136158.nid005240.38842.0 new file mode 100644 index 0000000000000000000000000000000000000000..ae88044bbe760a4f9f2fab6e6e77c86c30ac5476 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677136158.nid005240.38842.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35af8ef066eb85574cd137d402c7cf4fd9f31833ce3ba61876e9ca075ba64b5a +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677136698.nid005240.44110.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677136698.nid005240.44110.0 new file mode 100644 index 0000000000000000000000000000000000000000..cbab7c9047a33d4d5030941feba773b19530cd68 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677136698.nid005240.44110.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a85ca5fe96388e0e9af7f0fbfa475b004bb8b0fb64a86cfbad11f28b58491a7 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677137191.nid005282.112474.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677137191.nid005282.112474.0 new file mode 100644 index 0000000000000000000000000000000000000000..9cc27f0159e07a24520889ea0578cac883d19482 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677137191.nid005282.112474.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6527ccf6b07c924781803573f0c12a799c4c1028c3c5c8e033de1ea7df4c4e57 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677137717.nid006831.72023.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677137717.nid006831.72023.0 new file mode 100644 index 
0000000000000000000000000000000000000000..751b99e56ee935656841daa68a4ce222dee3bfaa --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677137717.nid006831.72023.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:827b7dc5b46b6287d8043fb293a2a0d56d9df64a6fca4681ae9e7c177372ec77 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677138268.nid005240.62116.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677138268.nid005240.62116.0 new file mode 100644 index 0000000000000000000000000000000000000000..06e3c6ba605b6520f4970aa70f65bdb8480f633e --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677138268.nid005240.62116.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330c8142fb7dc2caf56407a4e7dda887cc3bcab5b7cc304d04cefee90d1b2ab6 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677138754.nid006831.81737.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677138754.nid006831.81737.0 new file mode 100644 index 0000000000000000000000000000000000000000..d0d2f3108b18f04fbe92a75c3e9309154b69ab3b --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677138754.nid006831.81737.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142a098ee301965fd815c955e77296f589e69f146ebc170f4bd785d4d338eedd +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677139194.nid007109.41325.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677139194.nid007109.41325.0 new file mode 100644 index 0000000000000000000000000000000000000000..3664e7810d07277e3622a975204a20a5ce6bd497 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677139194.nid007109.41325.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c42cfb10d3524d8266e21df150427b4fba508ab4ed3ec7cafbb97a2c1dcc67 +size 40 diff --git 
a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677139635.nid005240.79873.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677139635.nid005240.79873.0 new file mode 100644 index 0000000000000000000000000000000000000000..aa75e83feefcd5a667fc15a73eb6a970fd037ba7 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677139635.nid005240.79873.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced207a5438e989b6aeadf016dfd6c08a5ee410ca820c325b5836915c5c65784 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677140080.nid005240.85270.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677140080.nid005240.85270.0 new file mode 100644 index 0000000000000000000000000000000000000000..b1b8b885b344ef5939d508e840362dde925c41ad --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677140080.nid005240.85270.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41b893b0e45f05b0ac1d02ac275a7f19e8cd34f43a9b7b6cd87540f4b0695b83 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677140497.nid006831.104825.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677140497.nid006831.104825.0 new file mode 100644 index 0000000000000000000000000000000000000000..4f1fe44fa36f1a615c908790b8771d0a7634d190 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677140497.nid006831.104825.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1ed85ed22c397c601f4d68ef9175a8faea68974f630f3c11941d0d47b02860 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677141059.nid005240.94554.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677141059.nid005240.94554.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d7851308ad47129b22c0a8fd2135ab306757d08 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677141059.nid005240.94554.0 @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:80961ad56ae51a0b869a28a5693f8a6cd53c017bfceb44bf65ae914dc5702cb8 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677141638.nid007109.68180.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677141638.nid007109.68180.0 new file mode 100644 index 0000000000000000000000000000000000000000..517662bcc2e3164d72f00ae27939f56b94d1ee82 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677141638.nid007109.68180.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:157c78759717dcc64fcd08cecbaa91658d4169e9f16894408713ed4e84cb2b90 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677142065.nid007155.71285.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677142065.nid007155.71285.0 new file mode 100644 index 0000000000000000000000000000000000000000..c9faabaaebed98e27b94eadc1feeb22771e441cd --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677142065.nid007155.71285.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e229515d4ebeb02086fe37d78bd1b3434478963513ba3c5bfda70a9ff42660 +size 90109146 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677286334.nid006729.3947.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677286334.nid006729.3947.0 new file mode 100644 index 0000000000000000000000000000000000000000..2462087f56fbe1a867d7a3df67eae3644d6483a0 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677286334.nid006729.3947.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27b52c2d7e37c04f87e93b36120ec603cdff3ef26f17cc6e90eea9f1fff3755 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677286850.nid007155.79071.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677286850.nid007155.79071.0 new file mode 100644 index 
0000000000000000000000000000000000000000..2f92f7f9fbd67e2a393e51481844d136f590533a --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677286850.nid007155.79071.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:094646d52716e9c4301957beba3cbe5a2b843c594fbcc5df7cae8a3873817555 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677287382.nid006601.70059.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677287382.nid006601.70059.0 new file mode 100644 index 0000000000000000000000000000000000000000..e06e3e902e6bfa6f9eed3661cee0b9f1e14f8607 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677287382.nid006601.70059.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e03e9ed6c552cc15266f321a830fb3d6536fe1789f508297509b3f4da1892cc +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677287913.nid007049.114407.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677287913.nid007049.114407.0 new file mode 100644 index 0000000000000000000000000000000000000000..2211edc6be8d430e8b210acba3dae1d351c7545a --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677287913.nid007049.114407.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2264d9be74aab531b0ba273e2f6fcf957bf3dcea9ac73b8e344240099bae7db +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677288434.nid006601.79940.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677288434.nid006601.79940.0 new file mode 100644 index 0000000000000000000000000000000000000000..609b7fe1bc9f6a7f1fc79fcec1919b1868fd7392 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677288434.nid006601.79940.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167712459fafdec9368c8af3708dd1cf9a45d09cfdbd8aad7d9133c487d633ae +size 16424 diff --git 
a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677288621.nid007049.123677.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677288621.nid007049.123677.0 new file mode 100644 index 0000000000000000000000000000000000000000..876559de648222b629e6e2d682e2db72722cae3a --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677288621.nid007049.123677.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939346b5981452a374c72ff8ace9423ee003972f6d00e546c12e1e4e5dfbd154 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677289158.nid006601.88618.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677289158.nid006601.88618.0 new file mode 100644 index 0000000000000000000000000000000000000000..50636e16240e9cc635d0a296df2ccd8cd24e1131 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677289158.nid006601.88618.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e34c0f8579cb5d6609a760c13d8bef21594412c7540456501b80a3ec1e0f5719 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677289687.nid007049.2903.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677289687.nid007049.2903.0 new file mode 100644 index 0000000000000000000000000000000000000000..cc1228803e6b5bf4ec2d9555a6f79acd526e4c60 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677289687.nid007049.2903.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b37575577dc7a8b94f70e394a29ff41882b7be1af5ba22d2ce1c185ed7b323e +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677290211.nid006340.55181.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677290211.nid006340.55181.0 new file mode 100644 index 0000000000000000000000000000000000000000..78f75f15b87e476f01fd8efe844702e227e921b9 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677290211.nid006340.55181.0 @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:8e667165759172ffddc5e3f31b36d7d3c91feb60d5928c2dde95e8f6b06270fb +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677290741.nid007049.16072.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677290741.nid007049.16072.0 new file mode 100644 index 0000000000000000000000000000000000000000..1948166a35b044fc38821647b01870774d43815a --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677290741.nid007049.16072.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca4f48f43bd4dbde9a918d2395731344769c4355385d10851c0fdaf258d2bdb +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677291271.nid006450.4270.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677291271.nid006450.4270.0 new file mode 100644 index 0000000000000000000000000000000000000000..6e95b2cf47910f9909c4f4251e61a8799ed62ee5 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677291271.nid006450.4270.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c89def7fb3418025435556ce40d6d509ef47f60741fb61a9ba3d166fc0a29b61 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677291797.nid006450.13145.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677291797.nid006450.13145.0 new file mode 100644 index 0000000000000000000000000000000000000000..ddb9407a56df26aecb163a25b3ddaec3169126e0 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677291797.nid006450.13145.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860274f0c9908245efe7366a9f683940a7343bb467514ac7085ff6ef4619a827 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677292347.nid006450.18935.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677292347.nid006450.18935.0 new file mode 100644 index 
0000000000000000000000000000000000000000..431a4c51e2eb39ceba6dbc2ea9cf2c8f0c10bc7d --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677292347.nid006450.18935.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55726586dc59d20c39e4ee1d7a38ed6a3ad0c313acb67888b3407fe0ed90fda +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677292869.nid006651.118609.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677292869.nid006651.118609.0 new file mode 100644 index 0000000000000000000000000000000000000000..726912640875428e020b418b5e402da8d80252fd --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677292869.nid006651.118609.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15706c32141e61e1ebc17bb92bb8b9cb9cf8f6776c096a7cd6f4898131773198 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677293398.nid006450.28065.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677293398.nid006450.28065.0 new file mode 100644 index 0000000000000000000000000000000000000000..02c4f71ff1222a89b67f4420adc8bdae7a449e1b --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677293398.nid006450.28065.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24c65e207b9d58b89546537aabe188567d5caa0fde86326180797141b0a271d +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677293933.nid006651.127898.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677293933.nid006651.127898.0 new file mode 100644 index 0000000000000000000000000000000000000000..3f7127f304d4173ae0c0eb5fef99c13f8bbd0ae9 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677293933.nid006651.127898.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50cc479307d3484f4bf61e9c8615ef355e43241ff9743f66c45e2c2f76f869fd +size 40 diff --git 
a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677294447.nid006450.40832.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677294447.nid006450.40832.0 new file mode 100644 index 0000000000000000000000000000000000000000..3a990c294e352dfaf317b85403415cf3d4089768 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677294447.nid006450.40832.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4209b11e30313c142f33cc03e5e3f6d4d1c8bdfa05b3c1082cfc62ae7ba17080 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677294984.nid006450.46450.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677294984.nid006450.46450.0 new file mode 100644 index 0000000000000000000000000000000000000000..8a5c75267eb09ca4fad514bed5a4bffbaf19c7b9 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677294984.nid006450.46450.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651237868199b2988b032ca47d5cd5d23327549f6f7e5f590470206710e5db42 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677295510.nid006450.54594.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677295510.nid006450.54594.0 new file mode 100644 index 0000000000000000000000000000000000000000..6cf486d582de978ff3849a018267a998b571d8fd --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677295510.nid006450.54594.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e34813202325f455d7de4f53a0c996a4b57ef12097cc7f7157a666f0131a00fd +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677296042.nid006651.12594.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677296042.nid006651.12594.0 new file mode 100644 index 0000000000000000000000000000000000000000..c544c5acd4d44053f9b65cdddbb3b878b5988425 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677296042.nid006651.12594.0 @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:83f0afcb0bb854677ad779df4456d379b5eacd45bb63e2fae155c01a845605b0 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677296563.nid006450.64171.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677296563.nid006450.64171.0 new file mode 100644 index 0000000000000000000000000000000000000000..a144306c5c3bb0f4fa25834f4587df7d02d1730b --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677296563.nid006450.64171.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771a518a883b3506aa5da487ed13c8ffc5052737d08243e21738119e32a301a0 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677297089.nid006651.25170.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677297089.nid006651.25170.0 new file mode 100644 index 0000000000000000000000000000000000000000..4dc502fe7d56710a4e1ab66aa167a68f8fe67d37 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677297089.nid006651.25170.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85180b63a055c4caf8b784363b4652d03d119197f9cf7fe82797714d53c2833a +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677297608.nid006937.47532.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677297608.nid006937.47532.0 new file mode 100644 index 0000000000000000000000000000000000000000..30a97da3855877d2f624dd50cb244d0d0e0aea21 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677297608.nid006937.47532.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9d81dc9bbd19f8c5ed8d408ef47883239448a73efda682085d9c827b8e4243 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677298184.nid006651.34506.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677298184.nid006651.34506.0 new file mode 100644 index 
0000000000000000000000000000000000000000..733efa843c8451931f818d4772dc96ddc8b69c84 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677298184.nid006651.34506.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977ae186e52b193ddacf2b5a14233952986769c46069ee0d05c9d5490573f9ba +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677298634.nid007057.13237.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677298634.nid007057.13237.0 new file mode 100644 index 0000000000000000000000000000000000000000..327f333bd61c14bcb6093163990a71c62193d3c4 --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677298634.nid007057.13237.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b5e2464e0e5e595d3e954e8f41126ce030c907c391e5ae2fe04c22970d2ff1 +size 40 diff --git a/tensorboard_4b284b84boscarroots/events.out.tfevents.1677299025.nid006651.44168.0 b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677299025.nid006651.44168.0 new file mode 100644 index 0000000000000000000000000000000000000000..74d396d6ade0383a8f7c67644acb983c7f5c11ad --- /dev/null +++ b/tensorboard_4b284b84boscarroots/events.out.tfevents.1677299025.nid006651.44168.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b38551ab47b6ba51b19b21a4720d9420f25d13172192b0b4953bb8ca65e39558 +size 40 diff --git a/transformers/config.json b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, 
"summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/transformers/pytorch_model.bin b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..b16ea1e85186db07da6f5fcbcc03f1e4a40d2e44 --- /dev/null +++ b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:ebdc05da3ec6b987b2e41a92230522a21747386f3ede3e9b5172b37615bfdc2d +size 8781203669