diff --git a/.gitattributes b/.gitattributes index 659f68560a4b5d408053031e1530176175b30a8b..586131c607a9b0dbaed9bec8e6af172e64dfcbab 100644 --- a/.gitattributes +++ b/.gitattributes @@ -60,3 +60,79 @@ evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..8bdd61ab17f1579de712c07de0c6c1082f4dc0b5 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.29123796712848116, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.024099559164327343}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05684299841582745, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016887384375207904}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.26382466542797384, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00448652393967693}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0846007331490898, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017611698640008044}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.024552079352862823, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009251381031279301}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11720876113413588, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030359279375561524}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03751857157597345, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00108659069296553}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05458027450709555, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001588691365439898}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2540701232644345, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004311533260849107}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08142615853409181, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001670491088449438}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0541293635979088, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016039721945264953}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24960718136284848, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0042227139206395545}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08051138355871504, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016680677195043975}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6d7696a2f22d9802db35f6d6ee4a290308da8884 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.32421224846581287, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.022894553413488398}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06133395467775901, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015235836365749833}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.29325251255888984, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004836167389643869}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09410633326390479, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001817299240652282}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.027879936369681734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010974239499863508}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13641679853598052, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032756808482751125}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0422554607577646, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011207429888077064}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05824013808849948, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014483059111597553}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2785195263881824, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004526853798643564}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08936406691785198, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001707660234429849}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.058404727742803225, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014611973721867918}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2786788137098633, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004519860762866795}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08953461085050565, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017195795746719645}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7a6c7f461e60fe1fda03fab6efcd86cfb4dd67ca --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.34830681706460126, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.01684214623603046}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06326435773545039, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013542606641520488}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3156608861325991, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047388400050451}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0986364025189687, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017250228996667696}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028634240678455197, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008657767199386355}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14832007806184763, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003300168476456189}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.044559368109694755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010908531224967327}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06001818231619863, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012484272002343752}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.299123246297464, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044103995135310195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09365962833176038, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001614688994804722}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06019532321096589, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012630463084520604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.30043891693048896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004444660524612687}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09390588584336734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016304255047587266}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4d77906a19042de3e3b7efcc81c848cbc1a72ec5 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.36470600269670195, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.018280048766308375}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06330533770140873, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011600203995117304}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3259947504941901, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004809345100214171}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10011450605217301, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016506911228713907}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028285266360899328, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006938944946883647}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15459267483010083, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00340681133628092}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04497027193243351, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010238315815248355}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05972837538221139, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010878264157076817}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3073051758906017, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004478239792374778}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09444059545614306, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015438279184580702}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06020601780769939, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001104187247297194}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3095076259209654, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004504005664338164}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09513479449596876, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015626056932077051}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..aba724bde3743763f2283f60b4adf8ab0945e41c --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.34279547123639, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02166437435240052}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06367441592900581, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001194655773448425}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3273817810829883, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004763653283179556}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10065904593799764, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016754751356902707}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028523558899898493, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007310056361867258}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15423603065118352, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032851282926083694}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04523413495038415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010527829629444607}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05993520541418932, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011028564197777878}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30883518804645416, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004444159365713122}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09483171445464417, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015525134351789466}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06057732250287014, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011347979681458663}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.31052564238961033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004439053679763851}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09570320653415937, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015864428965022782}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..50bc867685988668b164c9df5441bb35555c41ef --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.43068686455258365, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.024558626439848394}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06591108347919172, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012472199657513222}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3403235719405941, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004965628611695927}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10410497627752861, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017128654339676542}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03003354094036042, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007445009962094013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1663946980145394, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003627902758005641}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0477723289558304, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010828661653623512}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.061647771870220795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011365079087437059}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.31937107624477157, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004623821764283096}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09752610184478055, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015891934785872816}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06251543627392657, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011656752479938524}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.32334680308556674, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004688368905057958}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09881610204913661, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016204593561223266}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..21da10ec899a8755df66e8e89923583fae2be55c --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14094551178968198, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017988042403353308}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2383379873289029, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024508365201313925}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16466297522045426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017464500568992482}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.025826231379801598, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006644756372248472}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04562095099618684, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001260309972555968}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03044265380148028, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007549449327851908}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1141936744607556, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001311074823465258}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20047392294507563, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020851227283842106}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13521621786999796, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013074426897338972}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1281224911907099, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016180585138979911}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2177477559969978, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002237821831406095}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1498377131098679, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015625059702703778}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.150037493962955, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03792522803644501}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..293b9a228e1b83310561d81fd1c2818bcb66c8da --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14622799391003813, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020068025807149733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24101862122339654, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026276208678892242}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1683204053948335, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001892698106994734}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.029667497362948447, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008466619702056509}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.048440765255034476, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012946101473055032}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03354144102579964, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000822566284455867}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1138608269905594, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014746185711284013}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1931547974295735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021274307166620926}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13222515812033397, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013920016810944796}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13544349261022215, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018568387839824677}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22406954780205265, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002449960379940128}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15608955729869492, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017500765734040384}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5968121086484615, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.054851748142751296}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9294e7a973c8340cf31fa08da2f31d4af0a5f37e --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15460966487470837, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002233041531383059}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23977523386714922, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025640624695031644}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17044100733247006, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018672130638160281}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03324641794167163, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010616588597732964}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.051106504151232426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013379696967192748}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03537634555402942, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008649089367972104}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1222092984923369, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017390941193497359}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19463277997734565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021294441696277336}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13554325862504094, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014028716662179363}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14302654547194457, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002060935061365854}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2233107296658696, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024112074184366853}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15795207740196257, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017219827845479745}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.7092164171091249, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08765489082275082}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..57aa03a2dd7c546c378a0cf588f272eabaee304b --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1406901039188124, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025666252762842315}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.19970447237610153, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028390196402756584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.14408176000895695, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020016420554769035}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02922353525732899, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011010583273786127}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04191034328930793, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012547885060256734}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.029377172063398457, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008005810773268516}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11281690861703962, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021122923732267928}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1629060920599739, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023571083502973668}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1153303057335899, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015400634901938468}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13076056418582657, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024324238744350382}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.1857999771905377, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026706910367050693}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.13347692311901044, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001853011425694174}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5463404291438052, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08984875953099804}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e2a49a2618d9faf15ae2bc6808f1945172c24e9d --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.047637385711642166, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019406862995964113}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.06935875426191872, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002476239873059244}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.047912419187255355, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016885974181252042}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.010533587881846619, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006829459294496357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.01575083046773536, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0009533335963566146}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.010490684660423407, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005736260642904359}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.038907290376934564, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015632211619916261}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.058100266035812934, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020878258346479737}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.039331394950418846, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001357076427861084}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04422693909381412, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018055836955325499}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06455710260564228, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023114528926315003}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.0444398924940209, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015649101599922706}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.3661448228518088, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.033027262924505495}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..27555b6bbd1c8f3bfe9eecb436775d558cab767b --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.008290393984892647, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009001034412792107}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.011802367196652718, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011618281791076293}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008313843592026254, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008265470763649947}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0020266217301853685, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003393709813488467}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0029487651946005756, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004412972611158346}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002040994959246997, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00030407491270912355}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006721799139189244, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007186545260376111}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.0098857093481712, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009864294742971877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006771006570745668, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006635749098480861}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007648580835406893, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008266968946583269}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.011070549839007678, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010938104264188817}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007705400987609899, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007633405146045267}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 6.367443124232542e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.2685163547005723e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7f47cbfed22e5276c0874250597edbab5f374920 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 3.967183056283888, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0614451409180861}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.17322199542522593, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001766739101818456}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.3497612117638542, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002145765234933453}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.22316500100906603, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001595359423456744}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.06666478811553239, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001052128094651409}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.13513990600107753, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016103984793018583}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.08520789194179026, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010270065001763392}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.15393062571271574, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014926257950038774}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3136929917594451, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0018044289406178228}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.1988974965351846, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001304080390696196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.14930193885489784, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016069977963074835}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.30276071858573167, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002055681489475386}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.19244613018340564, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001468684623588083}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..220303863dbd6cb998bb21865298aabcb12886c8 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 7.24858195158816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12182015441698014}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.40889005404754675, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003409449253825524}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.38260655862871273, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026522545736220606}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3648604782443927, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002228919554367123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.17304656619126002, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024265933354054277}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.15533741505167725, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017940218081133016}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1492665013164553, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016682679997427913}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.30433231462665566, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028037834853861434}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2870278031145814, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022278844415098828}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.27089646277222484, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017762835796866921}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3368390621347027, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031362360403701063}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3129980401000163, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002411291755571875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2988385773578741, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002083312510474344}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2c8bf3952584f4b61a79bee9f6ef0b7c44c87567 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.8132898005392, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13889694589808027}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.472247337392176, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003509675155475942}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4109851055076836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00266754752683629}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.40949266454624667, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002227174072645473}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2221300194890402, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026008629952829765}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18747167156183062, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001966631075668386}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18759073054766637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018155332514371313}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.34810606304380215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029168836617550075}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3037441519487516, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022352968777445397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.30101808824060367, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001845167102197219}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3930359663685668, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032821280577162463}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.34128557450637836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025177617791370846}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.33997209628594915, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021704693429880294}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..678ce1c3807473c87293840467a44e79f23ce729 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.606901971322037, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1876717173587565}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4792720578842871, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003435623212611771}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4299540279680867, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002709552589644585}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.423107786753922, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022021533625304172}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.22961096510876788, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025354521714354276}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2028531159711805, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020459562906288337}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19914466926004393, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00183134409853892}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3508612926375425, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028773466225418217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.31576853558586987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023159029356283776}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3089647180477385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018748237534710302}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4010458372923884, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032049720170719783}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36015366099876867, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002587495579628278}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35385970959123086, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021714504772349687}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e818ac0674040004a2abbb1939ff8feb95888373 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.637879863244894, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16226309008051826}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4652304352934913, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003337521287505696}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43528505234512976, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026695917030513756}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.42194593310296813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022114287389486177}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.22302025310290544, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002458367724539737}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20597912934683074, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002051470584078235}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19912988966042086, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018245099743948883}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.34089523951143247, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002747821577994244}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3209553243957463, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023209551472440425}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3089991444775559, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018682388377063268}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3927848741866132, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003065974270261921}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3689097427358982, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002571023680832107}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35671544335154326, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002156063389652602}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..50870f66e9728ee98cad74d2d184e62a761a7f36 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.26475738478149, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10488019812696231}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4479742544722184, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003108871411245775}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4423554172558611, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025756769738496397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.41955022171167694, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002065255587289289}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2123975185096454, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0022240580364677317}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20778597326112527, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00197971650755932}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19644636492905912, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001708355406787911}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3257902997295537, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025340439153237536}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3232398560031394, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022135147638730015}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.30489490110399153, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017356656037540608}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.38025656291521354, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002865492941990049}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3766640128082206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002485268728296478}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35648196691681816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020231414730809993}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_0.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..bf8be0a2d167cb786b976ae5ed72e94a4126f9bc --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14955286652112415, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020266295880405774}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.35543546517620694, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00442547747797648}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20694913889331623, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026118174574717734}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0376041381568334, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001193655014731505}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0933869055501563, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003010569547553423}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05271536971805359, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016602940533088598}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11702196333102838, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001508489395430335}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.281518689350463, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035793211165099544}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16253221143739943, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019871124537594923}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1163142271090814, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016972579238893975}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2797387075449087, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0039649519854766495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16153438576143062, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002249256594915832}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.1575498448959216, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08919411230958109}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_1.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d05bd0806de0066ac21de142bd52935085090c76 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11987004390929652, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017838594123509761}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2966409602445348, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004159126214657732}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1687358123113738, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024129362829470083}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026631555586252555, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010212047218259958}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06832787071429165, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026781644808146748}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03787201010606323, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014498387144822385}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09946412096799201, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014047697344840638}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.248112655710228, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034716802936847493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14027382835276725, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001921605105364016}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09372299032008248, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014604124390732933}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23430014881481423, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036250515591870363}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13228905712132874, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020123169172413372}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5635386724766893, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11199220007541402}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_2.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..09705ad7e766b150673596542c4c7bc36bbbc00a --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12261802535697702, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001802015575276267}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3042881483021127, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004239856666150261}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17272164395046263, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024442934880362266}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02801123042219147, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010421626554945002}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07221142765808251, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027494039338407683}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03985376122882166, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014771066414781765}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10218618041428032, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014181507052656937}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2550776992609646, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00349622255520093}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14412504060617204, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019378546005162558}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09563780121752037, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001506049442354842}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23952794956934653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036934108853552503}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1350224868091867, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020648079219729885}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5884835216922304, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0694220243258812}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_3.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c0c53d31c2c121e1cb07d1923fee7c8b200f4588 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12058771231639086, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002066164336399918}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.283378982179243, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004430498021847181}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1651398268476812, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025732765693385513}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026878830813233837, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010536649719391797}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06558476547253786, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002641200590918728}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03726421510075795, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014326890233943264}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09972103113703992, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001673601901658887}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23548429603769053, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00364743143336554}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13662385100336102, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020655105556114887}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09474676528107442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001734800385670887}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22375657894123885, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003765688599090495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1296880556548729, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002127865421306681}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.548658255159644, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09243037162628143}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_4.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c0e03cc4b74542a586c7f8d22e5997240d3f2db8 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.03871656302800435, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023171515461883206}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07297233644463587, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00419731966694904}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04630458791276842, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025747339870623113}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.007010252770233402, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000677642525994807}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.015453001281963676, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014999985743029969}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.009197972474873806, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000868833115217779}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03131649789252053, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019045755355521208}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05884937656119138, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003409137251073175}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03723052598616332, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020759578853067283}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.030881510184046758, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019314337019311182}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05735625281670475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003380740089049823}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03645148435287092, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002076771980839672}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6621697454846989, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10164971536579874}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_5.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e685dba09bcb49fd202b7f90d56b329722a49808 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0036570101092707552, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009755024739951457}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.003158552109934381, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.000860982778191664}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0033252826117525294, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008934297630156492}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0006632141135470769, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00022782933435935797}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0006369853770402868, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00023576116891012097}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0006422730362464498, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00022885115664468214}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002516549335872895, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006650456872731031}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0022033496898103025, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0006061893464627548}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0023002231158666315, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006174742913966595}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0030601262050967064, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008066078492200342}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.002680985690153414, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0007365936380419417}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0028016428299652346, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007514162209604014}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.2741760295045995e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 6.398898398772146e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c5328a733cce8f93716850675efe74b7af940036 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94069ac5b212e04a8923d7a3db47e7beb4cac7182bc06dd4fdc9572e15476ec +size 4280211 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c0f4b9b23701ced1f5584bab539470607cc880b0 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50baa2556fb2c4d3ec29a2e45b929d0ee104a2851b10ea2db27f9e1b4a09b68 +size 5148584 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4e81941e7efc27d3c69228d51640823a676c3a74 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1bbba5eab1d908f22a74856ec90ce81130ede748fbc9dcbcb9ee81ba14648ce +size 6041996 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..64d73144b20f3568c93903f6d28f4d757b490f3b --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0bfab54b53483034b3b1d8877e2514dc42b6cb6b951957d89166009233bfac9 +size 6955346 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2ac16cc44900e12a7251c01c2889aad5fef82283 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e08071c4b940fdeb0b0e564e7dec456de00f009bff013b640cb3a3a59312ab +size 7840531 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5e8486678e369ebb5e15f6cf2d8cdfe396fa7c5e --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6695d5e4aafdb5c7bd7b4e966595a662b52896121fe7445dc284027f020383d9 +size 8750138 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2b5ccd8b7bb5eacf91cdb6ebf4ad817881043a55 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c430c752ce8d8f74c6be810442904652ca58bdff3e928e01171d8c80e75ca6 +size 7696087 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9b88bccfc4b40b0e002c42e7750243eb25255f83 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a8368681ec1236a0f5d41f38c7e531c662622e69a48049561c14a99a509651 +size 13257518 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..13c4dabc62737d0cd5b7382892056c2a6d66bdcd --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e730793e3278b657304e2c9837b02d49b5466b33c285cabe8e109127c991aa0 +size 18835825 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..edb2b7100a5537d39c52a96414c7a1b480504ebb --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf31ad3e9c5310fc2e64fbf11eb4078aa6285416b2ca7e580c7c4a52edf2499a +size 24269502 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..025be81fccac0fa363cab10e91c1998a668af454 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973805d5b2088a24e94a66006542624f9f51fe74c60f1d49af442092eec082c3 +size 29454246 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e0b3107adfdaa7acc0b2a04cded20ab246a7671e --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af229986a5d66b43d10478f3c2fe46b3b2ad1300581a77ea8d0aea27822f3aaa +size 34798043 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..034b563a3569f0524125091732aae78c86526ee0 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b259ae93db9ee2261be3b36b7e3ed8d932263a9b1cff120f90c971a4f210d1a1 +size 4435431 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..52ee0e8025846455aaac42932373b3ac6ac54ed4 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:572c68c6db95b184b33c0adf690dcd118779510758fe341ed93413efcd658e6f +size 5143973 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..837566520f1da87edcb717eb14c29a3e151764bc --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15fa2489a7f40a6ff3ab3cd46528acc5277ebc5b586366ff2cc1c8efeb905a6 +size 6182952 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..aaa7cbc57a6133b925b9d226d387df08d3415965 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad96e78764bd23785e1c23b893ff4cd9582923ad46f2028930bb326bec4e29b +size 7273550 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3588e577ab1bd210e6faf89d922dfce71a7d1692 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a85f5000dce10be20741785972cd85da0a760e3d59779c9ced2cab597c2201 +size 8369161 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..202c867004a426687ec0711c7b51f87b0317fb82 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96042c83247a91edd3316f566ce802f3c19d000bbef97741ed637e7e2bd2c99f +size 9474807 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1fe3fd7418fab5601e785631682caa5950ae7022 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016fb65ec224cb66a67fd28f3aaac68d06a86654ce79036f9e83ebdb8951e2d2 +size 2831644 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..37048acad77fbc5f43e532c130eecae51059d8df --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdca82d356d7c6d77f7366f3dd6f413d7836bf84eee4db6b9ed42c6ac135e589 +size 5099526 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6894fd8cde8b8c1c9edb3c159ea9cdc83dedf5db --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b329152f427d868fdf7ee93f93213b788b515811ac0cf475f784c3a331bc5faf +size 7371227 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d475f3a871fd842c942515eec9c532b65ff851a0 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a8b48c29856c08d8d79c7e1e6f4d5e02a90d216934286ef0d3106f15698a4e7 +size 9638201 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7864f27ab154d7cf51dc3e845c03eef571e30571 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:723f14dbec0512df2730b35c1fc9fd56b05a58b557efb11f12da79d36a316dee +size 11670205 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..075a3024bececb6806ce2c9cb0f3e2420d97961e --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2182b8656a555afea53aab37a35d2540d1fdae8ee7581d406a5dfa0334e5a1a0 +size 13897485 diff --git a/perplexity25/evaluation/generation/merged.csv b/perplexity25/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..4d5b8fc25743961e4623c9af8f9e809d40844dba --- /dev/null +++ b/perplexity25/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.08520789194179026 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.08520789194179026 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.1492665013164553 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.1492665013164553 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.18759073054766637 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.18759073054766637 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.19914466926004393 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.19914466926004393 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.19912988966042086 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.19912988966042086 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.19644636492905912 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.19644636492905912 +e2e_nlg_cleaned,5,average,multiple,0.16946434127590598 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.05271536971805359 +gem_xsum,0,median,rouge2_fmeasure,0.05271536971805359 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.03787201010606323 +gem_xsum,1,median,rouge2_fmeasure,0.03787201010606323 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03985376122882166 +gem_xsum,2,median,rouge2_fmeasure,0.03985376122882166 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03726421510075795 +gem_xsum,3,median,rouge2_fmeasure,0.03726421510075795 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.009197972474873806 +gem_xsum,4,median,rouge2_fmeasure,0.009197972474873806 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0006422730362464498 +gem_xsum,5,median,rouge2_fmeasure,0.0006422730362464498 +gem_xsum,5,average,multiple,0.02959093361080278 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.03751857157597345 +web_nlg_en,0,median,rouge2_fmeasure,0.03751857157597345 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.0422554607577646 +web_nlg_en,1,median,rouge2_fmeasure,0.0422554607577646 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.044559368109694755 +web_nlg_en,2,median,rouge2_fmeasure,0.044559368109694755 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.04497027193243351 +web_nlg_en,3,median,rouge2_fmeasure,0.04497027193243351 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.04523413495038415 +web_nlg_en,4,median,rouge2_fmeasure,0.04523413495038415 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.0477723289558304 +web_nlg_en,5,median,rouge2_fmeasure,0.0477723289558304 +web_nlg_en,5,average,multiple,0.043718356047013476 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.03044265380148028 +wiki_lingua_en,0,median,rouge2_fmeasure,0.03044265380148028 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.03354144102579964 +wiki_lingua_en,1,median,rouge2_fmeasure,0.03354144102579964 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.03537634555402942 +wiki_lingua_en,2,median,rouge2_fmeasure,0.03537634555402942 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.029377172063398457 +wiki_lingua_en,3,median,rouge2_fmeasure,0.029377172063398457 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.010490684660423407 +wiki_lingua_en,4,median,rouge2_fmeasure,0.010490684660423407 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.002040994959246997 +wiki_lingua_en,5,median,rouge2_fmeasure,0.002040994959246997 +wiki_lingua_en,5,average,multiple,0.0235448820107297 diff --git a/perplexity25/evaluation/generation/merged.json b/perplexity25/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..e058540cabaef6c60d483017dba0e82ffb4d3b44 --- /dev/null +++ b/perplexity25/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.29123796712848116, "bleu_stderr": 0.024099559164327343, "rouge1_fmeasure": 0.0846007331490898, "rouge1_fmeasure_stderr": 0.0017611698640008044, "rouge1_precision": 0.05684299841582745, "rouge1_precision_stderr": 0.0016887384375207904, "rouge1_recall": 0.26382466542797384, "rouge1_recall_stderr": 0.00448652393967693, "rouge2_fmeasure": 0.03751857157597345, "rouge2_fmeasure_stderr": 0.00108659069296553, "rouge2_precision": 0.024552079352862823, "rouge2_precision_stderr": 0.0009251381031279301, "rouge2_recall": 0.11720876113413588, "rouge2_recall_stderr": 0.0030359279375561524, "rougeL_fmeasure": 0.08142615853409181, "rougeL_fmeasure_stderr": 0.001670491088449438, "rougeL_precision": 0.05458027450709555, "rougeL_precision_stderr": 0.001588691365439898, "rougeL_recall": 0.2540701232644345, "rougeL_recall_stderr": 0.004311533260849107, "rougeLsum_fmeasure": 0.08051138355871504, "rougeLsum_fmeasure_stderr": 0.0016680677195043975, "rougeLsum_precision": 0.0541293635979088, "rougeLsum_precision_stderr": 0.0016039721945264953, "rougeLsum_recall": 0.24960718136284848, "rougeLsum_recall_stderr": 0.0042227139206395545}}, "1": {"PALM_prompt": {"bleu": 0.32421224846581287, "bleu_stderr": 0.022894553413488398, "rouge1_fmeasure": 0.09410633326390479, "rouge1_fmeasure_stderr": 0.001817299240652282, "rouge1_precision": 0.06133395467775901, "rouge1_precision_stderr": 0.0015235836365749833, "rouge1_recall": 0.29325251255888984, "rouge1_recall_stderr": 0.004836167389643869, "rouge2_fmeasure": 0.0422554607577646, "rouge2_fmeasure_stderr": 0.0011207429888077064, "rouge2_precision": 0.027879936369681734, "rouge2_precision_stderr": 0.0010974239499863508, "rouge2_recall": 0.13641679853598052, "rouge2_recall_stderr": 0.0032756808482751125, "rougeL_fmeasure": 0.08936406691785198, "rougeL_fmeasure_stderr": 0.001707660234429849, "rougeL_precision": 0.05824013808849948, "rougeL_precision_stderr": 0.0014483059111597553, "rougeL_recall": 0.2785195263881824, "rougeL_recall_stderr": 0.004526853798643564, "rougeLsum_fmeasure": 0.08953461085050565, "rougeLsum_fmeasure_stderr": 0.0017195795746719645, "rougeLsum_precision": 0.058404727742803225, "rougeLsum_precision_stderr": 0.0014611973721867918, "rougeLsum_recall": 0.2786788137098633, "rougeLsum_recall_stderr": 0.004519860762866795}}, "2": {"PALM_prompt": {"bleu": 0.34830681706460126, "bleu_stderr": 0.01684214623603046, "rouge1_fmeasure": 0.0986364025189687, "rouge1_fmeasure_stderr": 0.0017250228996667696, "rouge1_precision": 0.06326435773545039, "rouge1_precision_stderr": 0.0013542606641520488, "rouge1_recall": 0.3156608861325991, "rouge1_recall_stderr": 0.0047388400050451, "rouge2_fmeasure": 0.044559368109694755, "rouge2_fmeasure_stderr": 0.0010908531224967327, "rouge2_precision": 0.028634240678455197, "rouge2_precision_stderr": 0.0008657767199386355, "rouge2_recall": 0.14832007806184763, "rouge2_recall_stderr": 0.003300168476456189, "rougeL_fmeasure": 0.09365962833176038, "rougeL_fmeasure_stderr": 0.001614688994804722, "rougeL_precision": 0.06001818231619863, "rougeL_precision_stderr": 0.0012484272002343752, "rougeL_recall": 0.299123246297464, "rougeL_recall_stderr": 0.0044103995135310195, "rougeLsum_fmeasure": 0.09390588584336734, "rougeLsum_fmeasure_stderr": 0.0016304255047587266, "rougeLsum_precision": 0.06019532321096589, "rougeLsum_precision_stderr": 0.0012630463084520604, "rougeLsum_recall": 0.30043891693048896, "rougeLsum_recall_stderr": 0.004444660524612687}}, "3": {"PALM_prompt": {"bleu": 0.36470600269670195, "bleu_stderr": 0.018280048766308375, "rouge1_fmeasure": 0.10011450605217301, "rouge1_fmeasure_stderr": 0.0016506911228713907, "rouge1_precision": 0.06330533770140873, "rouge1_precision_stderr": 0.0011600203995117304, "rouge1_recall": 0.3259947504941901, "rouge1_recall_stderr": 0.004809345100214171, "rouge2_fmeasure": 0.04497027193243351, "rouge2_fmeasure_stderr": 0.0010238315815248355, "rouge2_precision": 0.028285266360899328, "rouge2_precision_stderr": 0.0006938944946883647, "rouge2_recall": 0.15459267483010083, "rouge2_recall_stderr": 0.00340681133628092, "rougeL_fmeasure": 0.09444059545614306, "rougeL_fmeasure_stderr": 0.0015438279184580702, "rougeL_precision": 0.05972837538221139, "rougeL_precision_stderr": 0.0010878264157076817, "rougeL_recall": 0.3073051758906017, "rougeL_recall_stderr": 0.004478239792374778, "rougeLsum_fmeasure": 0.09513479449596876, "rougeLsum_fmeasure_stderr": 0.0015626056932077051, "rougeLsum_precision": 0.06020601780769939, "rougeLsum_precision_stderr": 0.001104187247297194, "rougeLsum_recall": 0.3095076259209654, "rougeLsum_recall_stderr": 0.004504005664338164}}, "4": {"PALM_prompt": {"bleu": 0.34279547123639, "bleu_stderr": 0.02166437435240052, "rouge1_fmeasure": 0.10065904593799764, "rouge1_fmeasure_stderr": 0.0016754751356902707, "rouge1_precision": 0.06367441592900581, "rouge1_precision_stderr": 0.001194655773448425, "rouge1_recall": 0.3273817810829883, "rouge1_recall_stderr": 0.004763653283179556, "rouge2_fmeasure": 0.04523413495038415, "rouge2_fmeasure_stderr": 0.0010527829629444607, "rouge2_precision": 0.028523558899898493, "rouge2_precision_stderr": 0.0007310056361867258, "rouge2_recall": 0.15423603065118352, "rouge2_recall_stderr": 0.0032851282926083694, "rougeL_fmeasure": 0.09483171445464417, "rougeL_fmeasure_stderr": 0.0015525134351789466, "rougeL_precision": 0.05993520541418932, "rougeL_precision_stderr": 0.0011028564197777878, "rougeL_recall": 0.30883518804645416, "rougeL_recall_stderr": 0.004444159365713122, "rougeLsum_fmeasure": 0.09570320653415937, "rougeLsum_fmeasure_stderr": 0.0015864428965022782, "rougeLsum_precision": 0.06057732250287014, "rougeLsum_precision_stderr": 0.0011347979681458663, "rougeLsum_recall": 0.31052564238961033, "rougeLsum_recall_stderr": 0.004439053679763851}}, "5": {"PALM_prompt": {"bleu": 0.43068686455258365, "bleu_stderr": 0.024558626439848394, "rouge1_fmeasure": 0.10410497627752861, "rouge1_fmeasure_stderr": 0.0017128654339676542, "rouge1_precision": 0.06591108347919172, "rouge1_precision_stderr": 0.0012472199657513222, "rouge1_recall": 0.3403235719405941, "rouge1_recall_stderr": 0.004965628611695927, "rouge2_fmeasure": 0.0477723289558304, "rouge2_fmeasure_stderr": 0.0010828661653623512, "rouge2_precision": 0.03003354094036042, "rouge2_precision_stderr": 0.0007445009962094013, "rouge2_recall": 0.1663946980145394, "rouge2_recall_stderr": 0.003627902758005641, "rougeL_fmeasure": 0.09752610184478055, "rougeL_fmeasure_stderr": 0.0015891934785872816, "rougeL_precision": 0.061647771870220795, "rougeL_precision_stderr": 0.0011365079087437059, "rougeL_recall": 0.31937107624477157, "rougeL_recall_stderr": 0.004623821764283096, "rougeLsum_fmeasure": 0.09881610204913661, "rougeLsum_fmeasure_stderr": 0.0016204593561223266, "rougeLsum_precision": 0.06251543627392657, "rougeLsum_precision_stderr": 0.0011656752479938524, "rougeLsum_recall": 0.32334680308556674, "rougeLsum_recall_stderr": 0.004688368905057958}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.150037493962955, "bleu_stderr": 0.03792522803644501, "rouge1_fmeasure": 0.16466297522045426, "rouge1_fmeasure_stderr": 0.0017464500568992482, "rouge1_precision": 0.14094551178968198, "rouge1_precision_stderr": 0.0017988042403353308, "rouge1_recall": 0.2383379873289029, "rouge1_recall_stderr": 0.0024508365201313925, "rouge2_fmeasure": 0.03044265380148028, "rouge2_fmeasure_stderr": 0.0007549449327851908, "rouge2_precision": 0.025826231379801598, "rouge2_precision_stderr": 0.0006644756372248472, "rouge2_recall": 0.04562095099618684, "rouge2_recall_stderr": 0.001260309972555968, "rougeL_fmeasure": 0.13521621786999796, "rougeL_fmeasure_stderr": 0.0013074426897338972, "rougeL_precision": 0.1141936744607556, "rougeL_precision_stderr": 0.001311074823465258, "rougeL_recall": 0.20047392294507563, "rougeL_recall_stderr": 0.0020851227283842106, "rougeLsum_fmeasure": 0.1498377131098679, "rougeLsum_fmeasure_stderr": 0.0015625059702703778, "rougeLsum_precision": 0.1281224911907099, "rougeLsum_precision_stderr": 0.0016180585138979911, "rougeLsum_recall": 0.2177477559969978, "rougeLsum_recall_stderr": 0.002237821831406095}}, "1": {"tldr_en": {"bleu": 1.5968121086484615, "bleu_stderr": 0.054851748142751296, "rouge1_fmeasure": 0.1683204053948335, "rouge1_fmeasure_stderr": 0.001892698106994734, "rouge1_precision": 0.14622799391003813, "rouge1_precision_stderr": 0.0020068025807149733, "rouge1_recall": 0.24101862122339654, "rouge1_recall_stderr": 0.0026276208678892242, "rouge2_fmeasure": 0.03354144102579964, "rouge2_fmeasure_stderr": 0.000822566284455867, "rouge2_precision": 0.029667497362948447, "rouge2_precision_stderr": 0.0008466619702056509, "rouge2_recall": 0.048440765255034476, "rouge2_recall_stderr": 0.0012946101473055032, "rougeL_fmeasure": 0.13222515812033397, "rougeL_fmeasure_stderr": 0.0013920016810944796, "rougeL_precision": 0.1138608269905594, "rougeL_precision_stderr": 0.0014746185711284013, "rougeL_recall": 0.1931547974295735, "rougeL_recall_stderr": 0.0021274307166620926, "rougeLsum_fmeasure": 0.15608955729869492, "rougeLsum_fmeasure_stderr": 0.0017500765734040384, "rougeLsum_precision": 0.13544349261022215, "rougeLsum_precision_stderr": 0.0018568387839824677, "rougeLsum_recall": 0.22406954780205265, "rougeLsum_recall_stderr": 0.002449960379940128}}, "2": {"tldr_en": {"bleu": 1.7092164171091249, "bleu_stderr": 0.08765489082275082, "rouge1_fmeasure": 0.17044100733247006, "rouge1_fmeasure_stderr": 0.0018672130638160281, "rouge1_precision": 0.15460966487470837, "rouge1_precision_stderr": 0.002233041531383059, "rouge1_recall": 0.23977523386714922, "rouge1_recall_stderr": 0.0025640624695031644, "rouge2_fmeasure": 0.03537634555402942, "rouge2_fmeasure_stderr": 0.0008649089367972104, "rouge2_precision": 0.03324641794167163, "rouge2_precision_stderr": 0.0010616588597732964, "rouge2_recall": 0.051106504151232426, "rouge2_recall_stderr": 0.0013379696967192748, "rougeL_fmeasure": 0.13554325862504094, "rougeL_fmeasure_stderr": 0.0014028716662179363, "rougeL_precision": 0.1222092984923369, "rougeL_precision_stderr": 0.0017390941193497359, "rougeL_recall": 0.19463277997734565, "rougeL_recall_stderr": 0.0021294441696277336, "rougeLsum_fmeasure": 0.15795207740196257, "rougeLsum_fmeasure_stderr": 0.0017219827845479745, "rougeLsum_precision": 0.14302654547194457, "rougeLsum_precision_stderr": 0.002060935061365854, "rougeLsum_recall": 0.2233107296658696, "rougeLsum_recall_stderr": 0.0024112074184366853}}, "3": {"tldr_en": {"bleu": 1.5463404291438052, "bleu_stderr": 0.08984875953099804, "rouge1_fmeasure": 0.14408176000895695, "rouge1_fmeasure_stderr": 0.0020016420554769035, "rouge1_precision": 0.1406901039188124, "rouge1_precision_stderr": 0.0025666252762842315, "rouge1_recall": 0.19970447237610153, "rouge1_recall_stderr": 0.0028390196402756584, "rouge2_fmeasure": 0.029377172063398457, "rouge2_fmeasure_stderr": 0.0008005810773268516, "rouge2_precision": 0.02922353525732899, "rouge2_precision_stderr": 0.0011010583273786127, "rouge2_recall": 0.04191034328930793, "rouge2_recall_stderr": 0.0012547885060256734, "rougeL_fmeasure": 0.1153303057335899, "rougeL_fmeasure_stderr": 0.0015400634901938468, "rougeL_precision": 0.11281690861703962, "rougeL_precision_stderr": 0.0021122923732267928, "rougeL_recall": 0.1629060920599739, "rougeL_recall_stderr": 0.0023571083502973668, "rougeLsum_fmeasure": 0.13347692311901044, "rougeLsum_fmeasure_stderr": 0.001853011425694174, "rougeLsum_precision": 0.13076056418582657, "rougeLsum_precision_stderr": 0.0024324238744350382, "rougeLsum_recall": 0.1857999771905377, "rougeLsum_recall_stderr": 0.0026706910367050693}}, "4": {"tldr_en": {"bleu": 0.3661448228518088, "bleu_stderr": 0.033027262924505495, "rouge1_fmeasure": 0.047912419187255355, "rouge1_fmeasure_stderr": 0.0016885974181252042, "rouge1_precision": 0.047637385711642166, "rouge1_precision_stderr": 0.0019406862995964113, "rouge1_recall": 0.06935875426191872, "rouge1_recall_stderr": 0.002476239873059244, "rouge2_fmeasure": 0.010490684660423407, "rouge2_fmeasure_stderr": 0.0005736260642904359, "rouge2_precision": 0.010533587881846619, "rouge2_precision_stderr": 0.0006829459294496357, "rouge2_recall": 0.01575083046773536, "rouge2_recall_stderr": 0.0009533335963566146, "rougeL_fmeasure": 0.039331394950418846, "rougeL_fmeasure_stderr": 0.001357076427861084, "rougeL_precision": 0.038907290376934564, "rougeL_precision_stderr": 0.0015632211619916261, "rougeL_recall": 0.058100266035812934, "rougeL_recall_stderr": 0.0020878258346479737, "rougeLsum_fmeasure": 0.0444398924940209, "rougeLsum_fmeasure_stderr": 0.0015649101599922706, "rougeLsum_precision": 0.04422693909381412, "rougeLsum_precision_stderr": 0.0018055836955325499, "rougeLsum_recall": 0.06455710260564228, "rougeLsum_recall_stderr": 0.0023114528926315003}}, "5": {"tldr_en": {"bleu": 6.367443124232542e-07, "bleu_stderr": 1.2685163547005723e-06, "rouge1_fmeasure": 0.008313843592026254, "rouge1_fmeasure_stderr": 0.0008265470763649947, "rouge1_precision": 0.008290393984892647, "rouge1_precision_stderr": 0.0009001034412792107, "rouge1_recall": 0.011802367196652718, "rouge1_recall_stderr": 0.0011618281791076293, "rouge2_fmeasure": 0.002040994959246997, "rouge2_fmeasure_stderr": 0.00030407491270912355, "rouge2_precision": 0.0020266217301853685, "rouge2_precision_stderr": 0.0003393709813488467, "rouge2_recall": 0.0029487651946005756, "rouge2_recall_stderr": 0.0004412972611158346, "rougeL_fmeasure": 0.006771006570745668, "rougeL_fmeasure_stderr": 0.0006635749098480861, "rougeL_precision": 0.006721799139189244, "rougeL_precision_stderr": 0.0007186545260376111, "rougeL_recall": 0.0098857093481712, "rougeL_recall_stderr": 0.0009864294742971877, "rougeLsum_fmeasure": 0.007705400987609899, "rougeLsum_fmeasure_stderr": 0.0007633405146045267, "rougeLsum_precision": 0.007648580835406893, "rougeLsum_precision_stderr": 0.0008266968946583269, "rougeLsum_recall": 0.011070549839007678, "rougeLsum_recall_stderr": 0.0010938104264188817}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 3.967183056283888, "bleu_stderr": 0.0614451409180861, "rouge1_fmeasure": 0.22316500100906603, "rouge1_fmeasure_stderr": 0.001595359423456744, "rouge1_precision": 0.17322199542522593, "rouge1_precision_stderr": 0.001766739101818456, "rouge1_recall": 0.3497612117638542, "rouge1_recall_stderr": 0.002145765234933453, "rouge2_fmeasure": 0.08520789194179026, "rouge2_fmeasure_stderr": 0.0010270065001763392, "rouge2_precision": 0.06666478811553239, "rouge2_precision_stderr": 0.001052128094651409, "rouge2_recall": 0.13513990600107753, "rouge2_recall_stderr": 0.0016103984793018583, "rougeL_fmeasure": 0.1988974965351846, "rougeL_fmeasure_stderr": 0.001304080390696196, "rougeL_precision": 0.15393062571271574, "rougeL_precision_stderr": 0.0014926257950038774, "rougeL_recall": 0.3136929917594451, "rougeL_recall_stderr": 0.0018044289406178228, "rougeLsum_fmeasure": 0.19244613018340564, "rougeLsum_fmeasure_stderr": 0.001468684623588083, "rougeLsum_precision": 0.14930193885489784, "rougeLsum_precision_stderr": 0.0016069977963074835, "rougeLsum_recall": 0.30276071858573167, "rougeLsum_recall_stderr": 0.002055681489475386}}, "1": {"generate_text_restaurant": {"bleu": 7.24858195158816, "bleu_stderr": 0.12182015441698014, "rouge1_fmeasure": 0.3648604782443927, "rouge1_fmeasure_stderr": 0.002228919554367123, "rouge1_precision": 0.40889005404754675, "rouge1_precision_stderr": 0.003409449253825524, "rouge1_recall": 0.38260655862871273, "rouge1_recall_stderr": 0.0026522545736220606, "rouge2_fmeasure": 0.1492665013164553, "rouge2_fmeasure_stderr": 0.0016682679997427913, "rouge2_precision": 0.17304656619126002, "rouge2_precision_stderr": 0.0024265933354054277, "rouge2_recall": 0.15533741505167725, "rouge2_recall_stderr": 0.0017940218081133016, "rougeL_fmeasure": 0.27089646277222484, "rougeL_fmeasure_stderr": 0.0017762835796866921, "rougeL_precision": 0.30433231462665566, "rougeL_precision_stderr": 0.0028037834853861434, "rougeL_recall": 0.2870278031145814, "rougeL_recall_stderr": 0.0022278844415098828, "rougeLsum_fmeasure": 0.2988385773578741, "rougeLsum_fmeasure_stderr": 0.002083312510474344, "rougeLsum_precision": 0.3368390621347027, "rougeLsum_precision_stderr": 0.0031362360403701063, "rougeLsum_recall": 0.3129980401000163, "rougeLsum_recall_stderr": 0.002411291755571875}}, "2": {"generate_text_restaurant": {"bleu": 9.8132898005392, "bleu_stderr": 0.13889694589808027, "rouge1_fmeasure": 0.40949266454624667, "rouge1_fmeasure_stderr": 0.002227174072645473, "rouge1_precision": 0.472247337392176, "rouge1_precision_stderr": 0.003509675155475942, "rouge1_recall": 0.4109851055076836, "rouge1_recall_stderr": 0.00266754752683629, "rouge2_fmeasure": 0.18759073054766637, "rouge2_fmeasure_stderr": 0.0018155332514371313, "rouge2_precision": 0.2221300194890402, "rouge2_precision_stderr": 0.0026008629952829765, "rouge2_recall": 0.18747167156183062, "rouge2_recall_stderr": 0.001966631075668386, "rougeL_fmeasure": 0.30101808824060367, "rougeL_fmeasure_stderr": 0.001845167102197219, "rougeL_precision": 0.34810606304380215, "rougeL_precision_stderr": 0.0029168836617550075, "rougeL_recall": 0.3037441519487516, "rougeL_recall_stderr": 0.0022352968777445397, "rougeLsum_fmeasure": 0.33997209628594915, "rougeLsum_fmeasure_stderr": 0.0021704693429880294, "rougeLsum_precision": 0.3930359663685668, "rougeLsum_precision_stderr": 0.0032821280577162463, "rougeLsum_recall": 0.34128557450637836, "rougeLsum_recall_stderr": 0.0025177617791370846}}, "3": {"generate_text_restaurant": {"bleu": 10.606901971322037, "bleu_stderr": 0.1876717173587565, "rouge1_fmeasure": 0.423107786753922, "rouge1_fmeasure_stderr": 0.0022021533625304172, "rouge1_precision": 0.4792720578842871, "rouge1_precision_stderr": 0.003435623212611771, "rouge1_recall": 0.4299540279680867, "rouge1_recall_stderr": 0.002709552589644585, "rouge2_fmeasure": 0.19914466926004393, "rouge2_fmeasure_stderr": 0.00183134409853892, "rouge2_precision": 0.22961096510876788, "rouge2_precision_stderr": 0.0025354521714354276, "rouge2_recall": 0.2028531159711805, "rouge2_recall_stderr": 0.0020459562906288337, "rougeL_fmeasure": 0.3089647180477385, "rougeL_fmeasure_stderr": 0.0018748237534710302, "rougeL_precision": 0.3508612926375425, "rougeL_precision_stderr": 0.0028773466225418217, "rougeL_recall": 0.31576853558586987, "rougeL_recall_stderr": 0.0023159029356283776, "rougeLsum_fmeasure": 0.35385970959123086, "rougeLsum_fmeasure_stderr": 0.0021714504772349687, "rougeLsum_precision": 0.4010458372923884, "rougeLsum_precision_stderr": 0.0032049720170719783, "rougeLsum_recall": 0.36015366099876867, "rougeLsum_recall_stderr": 0.002587495579628278}}, "4": {"generate_text_restaurant": {"bleu": 10.637879863244894, "bleu_stderr": 0.16226309008051826, "rouge1_fmeasure": 0.42194593310296813, "rouge1_fmeasure_stderr": 0.0022114287389486177, "rouge1_precision": 0.4652304352934913, "rouge1_precision_stderr": 0.003337521287505696, "rouge1_recall": 0.43528505234512976, "rouge1_recall_stderr": 0.0026695917030513756, "rouge2_fmeasure": 0.19912988966042086, "rouge2_fmeasure_stderr": 0.0018245099743948883, "rouge2_precision": 0.22302025310290544, "rouge2_precision_stderr": 0.002458367724539737, "rouge2_recall": 0.20597912934683074, "rouge2_recall_stderr": 0.002051470584078235, "rougeL_fmeasure": 0.3089991444775559, "rougeL_fmeasure_stderr": 0.0018682388377063268, "rougeL_precision": 0.34089523951143247, "rougeL_precision_stderr": 0.002747821577994244, "rougeL_recall": 0.3209553243957463, "rougeL_recall_stderr": 0.0023209551472440425, "rougeLsum_fmeasure": 0.35671544335154326, "rougeLsum_fmeasure_stderr": 0.002156063389652602, "rougeLsum_precision": 0.3927848741866132, "rougeLsum_precision_stderr": 0.003065974270261921, "rougeLsum_recall": 0.3689097427358982, "rougeLsum_recall_stderr": 0.002571023680832107}}, "5": {"generate_text_restaurant": {"bleu": 10.26475738478149, "bleu_stderr": 0.10488019812696231, "rouge1_fmeasure": 0.41955022171167694, "rouge1_fmeasure_stderr": 0.002065255587289289, "rouge1_precision": 0.4479742544722184, "rouge1_precision_stderr": 0.003108871411245775, "rouge1_recall": 0.4423554172558611, "rouge1_recall_stderr": 0.0025756769738496397, "rouge2_fmeasure": 0.19644636492905912, "rouge2_fmeasure_stderr": 0.001708355406787911, "rouge2_precision": 0.2123975185096454, "rouge2_precision_stderr": 0.0022240580364677317, "rouge2_recall": 0.20778597326112527, "rouge2_recall_stderr": 0.00197971650755932, "rougeL_fmeasure": 0.30489490110399153, "rougeL_fmeasure_stderr": 0.0017356656037540608, "rougeL_precision": 0.3257902997295537, "rougeL_precision_stderr": 0.0025340439153237536, "rougeL_recall": 0.3232398560031394, "rougeL_recall_stderr": 0.0022135147638730015, "rougeLsum_fmeasure": 0.35648196691681816, "rougeLsum_fmeasure_stderr": 0.0020231414730809993, "rougeLsum_precision": 0.38025656291521354, "rougeLsum_precision_stderr": 0.002865492941990049, "rougeLsum_recall": 0.3766640128082206, "rougeLsum_recall_stderr": 0.002485268728296478}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.1575498448959216, "bleu_stderr": 0.08919411230958109, "rouge1_fmeasure": 0.20694913889331623, "rouge1_fmeasure_stderr": 0.0026118174574717734, "rouge1_precision": 0.14955286652112415, "rouge1_precision_stderr": 0.0020266295880405774, "rouge1_recall": 0.35543546517620694, "rouge1_recall_stderr": 0.00442547747797648, "rouge2_fmeasure": 0.05271536971805359, "rouge2_fmeasure_stderr": 0.0016602940533088598, "rouge2_precision": 0.0376041381568334, "rouge2_precision_stderr": 0.001193655014731505, "rouge2_recall": 0.0933869055501563, "rouge2_recall_stderr": 0.003010569547553423, "rougeL_fmeasure": 0.16253221143739943, "rougeL_fmeasure_stderr": 0.0019871124537594923, "rougeL_precision": 0.11702196333102838, "rougeL_precision_stderr": 0.001508489395430335, "rougeL_recall": 0.281518689350463, "rougeL_recall_stderr": 0.0035793211165099544, "rougeLsum_fmeasure": 0.16153438576143062, "rougeLsum_fmeasure_stderr": 0.002249256594915832, "rougeLsum_precision": 0.1163142271090814, "rougeLsum_precision_stderr": 0.0016972579238893975, "rougeLsum_recall": 0.2797387075449087, "rougeLsum_recall_stderr": 0.0039649519854766495}}, "1": {"article_DOC_summary": {"bleu": 1.5635386724766893, "bleu_stderr": 0.11199220007541402, "rouge1_fmeasure": 0.1687358123113738, "rouge1_fmeasure_stderr": 0.0024129362829470083, "rouge1_precision": 0.11987004390929652, "rouge1_precision_stderr": 0.0017838594123509761, "rouge1_recall": 0.2966409602445348, "rouge1_recall_stderr": 0.004159126214657732, "rouge2_fmeasure": 0.03787201010606323, "rouge2_fmeasure_stderr": 0.0014498387144822385, "rouge2_precision": 0.026631555586252555, "rouge2_precision_stderr": 0.0010212047218259958, "rouge2_recall": 0.06832787071429165, "rouge2_recall_stderr": 0.0026781644808146748, "rougeL_fmeasure": 0.14027382835276725, "rougeL_fmeasure_stderr": 0.001921605105364016, "rougeL_precision": 0.09946412096799201, "rougeL_precision_stderr": 0.0014047697344840638, "rougeL_recall": 0.248112655710228, "rougeL_recall_stderr": 0.0034716802936847493, "rougeLsum_fmeasure": 0.13228905712132874, "rougeLsum_fmeasure_stderr": 0.0020123169172413372, "rougeLsum_precision": 0.09372299032008248, "rougeLsum_precision_stderr": 0.0014604124390732933, "rougeLsum_recall": 0.23430014881481423, "rougeLsum_recall_stderr": 0.0036250515591870363}}, "2": {"article_DOC_summary": {"bleu": 1.5884835216922304, "bleu_stderr": 0.0694220243258812, "rouge1_fmeasure": 0.17272164395046263, "rouge1_fmeasure_stderr": 0.0024442934880362266, "rouge1_precision": 0.12261802535697702, "rouge1_precision_stderr": 0.001802015575276267, "rouge1_recall": 0.3042881483021127, "rouge1_recall_stderr": 0.004239856666150261, "rouge2_fmeasure": 0.03985376122882166, "rouge2_fmeasure_stderr": 0.0014771066414781765, "rouge2_precision": 0.02801123042219147, "rouge2_precision_stderr": 0.0010421626554945002, "rouge2_recall": 0.07221142765808251, "rouge2_recall_stderr": 0.0027494039338407683, "rougeL_fmeasure": 0.14412504060617204, "rougeL_fmeasure_stderr": 0.0019378546005162558, "rougeL_precision": 0.10218618041428032, "rougeL_precision_stderr": 0.0014181507052656937, "rougeL_recall": 0.2550776992609646, "rougeL_recall_stderr": 0.00349622255520093, "rougeLsum_fmeasure": 0.1350224868091867, "rougeLsum_fmeasure_stderr": 0.0020648079219729885, "rougeLsum_precision": 0.09563780121752037, "rougeLsum_precision_stderr": 0.001506049442354842, "rougeLsum_recall": 0.23952794956934653, "rougeLsum_recall_stderr": 0.0036934108853552503}}, "3": {"article_DOC_summary": {"bleu": 1.548658255159644, "bleu_stderr": 0.09243037162628143, "rouge1_fmeasure": 0.1651398268476812, "rouge1_fmeasure_stderr": 0.0025732765693385513, "rouge1_precision": 0.12058771231639086, "rouge1_precision_stderr": 0.002066164336399918, "rouge1_recall": 0.283378982179243, "rouge1_recall_stderr": 0.004430498021847181, "rouge2_fmeasure": 0.03726421510075795, "rouge2_fmeasure_stderr": 0.0014326890233943264, "rouge2_precision": 0.026878830813233837, "rouge2_precision_stderr": 0.0010536649719391797, "rouge2_recall": 0.06558476547253786, "rouge2_recall_stderr": 0.002641200590918728, "rougeL_fmeasure": 0.13662385100336102, "rougeL_fmeasure_stderr": 0.0020655105556114887, "rougeL_precision": 0.09972103113703992, "rougeL_precision_stderr": 0.001673601901658887, "rougeL_recall": 0.23548429603769053, "rougeL_recall_stderr": 0.00364743143336554, "rougeLsum_fmeasure": 0.1296880556548729, "rougeLsum_fmeasure_stderr": 0.002127865421306681, "rougeLsum_precision": 0.09474676528107442, "rougeLsum_precision_stderr": 0.001734800385670887, "rougeLsum_recall": 0.22375657894123885, "rougeLsum_recall_stderr": 0.003765688599090495}}, "4": {"article_DOC_summary": {"bleu": 0.6621697454846989, "bleu_stderr": 0.10164971536579874, "rouge1_fmeasure": 0.04630458791276842, "rouge1_fmeasure_stderr": 0.0025747339870623113, "rouge1_precision": 0.03871656302800435, "rouge1_precision_stderr": 0.0023171515461883206, "rouge1_recall": 0.07297233644463587, "rouge1_recall_stderr": 0.00419731966694904, "rouge2_fmeasure": 0.009197972474873806, "rouge2_fmeasure_stderr": 0.000868833115217779, "rouge2_precision": 0.007010252770233402, "rouge2_precision_stderr": 0.000677642525994807, "rouge2_recall": 0.015453001281963676, "rouge2_recall_stderr": 0.0014999985743029969, "rougeL_fmeasure": 0.03723052598616332, "rougeL_fmeasure_stderr": 0.0020759578853067283, "rougeL_precision": 0.03131649789252053, "rougeL_precision_stderr": 0.0019045755355521208, "rougeL_recall": 0.05884937656119138, "rougeL_recall_stderr": 0.003409137251073175, "rougeLsum_fmeasure": 0.03645148435287092, "rougeLsum_fmeasure_stderr": 0.002076771980839672, "rougeLsum_precision": 0.030881510184046758, "rougeLsum_precision_stderr": 0.0019314337019311182, "rougeLsum_recall": 0.05735625281670475, "rougeLsum_recall_stderr": 0.003380740089049823}}, "5": {"article_DOC_summary": {"bleu": 1.2741760295045995e-38, "bleu_stderr": 6.398898398772146e-33, "rouge1_fmeasure": 0.0033252826117525294, "rouge1_fmeasure_stderr": 0.0008934297630156492, "rouge1_precision": 0.0036570101092707552, "rouge1_precision_stderr": 0.0009755024739951457, "rouge1_recall": 0.003158552109934381, "rouge1_recall_stderr": 0.000860982778191664, "rouge2_fmeasure": 0.0006422730362464498, "rouge2_fmeasure_stderr": 0.00022885115664468214, "rouge2_precision": 0.0006632141135470769, "rouge2_precision_stderr": 0.00022782933435935797, "rouge2_recall": 0.0006369853770402868, "rouge2_recall_stderr": 0.00023576116891012097, "rougeL_fmeasure": 0.0023002231158666315, "rougeL_fmeasure_stderr": 0.0006174742913966595, "rougeL_precision": 0.002516549335872895, "rougeL_precision_stderr": 0.0006650456872731031, "rougeL_recall": 0.0022033496898103025, "rougeL_recall_stderr": 0.0006061893464627548, "rougeLsum_fmeasure": 0.0028016428299652346, "rougeLsum_fmeasure_stderr": 0.0007514162209604014, "rougeLsum_precision": 0.0030601262050967064, "rougeLsum_precision_stderr": 0.0008066078492200342, "rougeLsum_recall": 0.002680985690153414, "rougeLsum_recall_stderr": 0.0007365936380419417}}}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..64f7599aecf7e33e00b242ec0367cd8394391513 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.29123796712848116, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.024099559164327343 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05684299841582745, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0016887384375207904 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.26382466542797384, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00448652393967693 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0846007331490898, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017611698640008044 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.024552079352862823, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009251381031279301 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11720876113413588, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030359279375561524 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03751857157597345, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00108659069296553 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05458027450709555, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001588691365439898 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2540701232644345, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004311533260849107 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08142615853409181, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001670491088449438 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0541293635979088, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016039721945264953 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24960718136284848, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0042227139206395545 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08051138355871504, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016680677195043975 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..83c9ec913554435b65b10e9960bd0b83ad292130 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.32421224846581287, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.022894553413488398 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06133395467775901, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015235836365749833 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.29325251255888984, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004836167389643869 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09410633326390479, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001817299240652282 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.027879936369681734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010974239499863508 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13641679853598052, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032756808482751125 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0422554607577646, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011207429888077064 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05824013808849948, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014483059111597553 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2785195263881824, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004526853798643564 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08936406691785198, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001707660234429849 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.058404727742803225, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014611973721867918 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2786788137098633, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004519860762866795 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08953461085050565, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017195795746719645 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1e5a90e1a122ed6861a06eef65a527f4102afbb9 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.34830681706460126, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.01684214623603046 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06326435773545039, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013542606641520488 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3156608861325991, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047388400050451 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0986364025189687, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017250228996667696 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028634240678455197, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008657767199386355 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14832007806184763, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003300168476456189 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.044559368109694755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010908531224967327 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06001818231619863, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012484272002343752 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.299123246297464, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044103995135310195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09365962833176038, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001614688994804722 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06019532321096589, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012630463084520604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.30043891693048896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004444660524612687 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09390588584336734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016304255047587266 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4d520f3c64c5bfd7cc1304b09fd77176b5cbd604 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.36470600269670195, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.018280048766308375 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06330533770140873, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011600203995117304 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3259947504941901, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004809345100214171 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10011450605217301, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016506911228713907 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028285266360899328, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006938944946883647 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15459267483010083, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00340681133628092 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04497027193243351, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010238315815248355 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05972837538221139, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010878264157076817 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3073051758906017, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004478239792374778 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09444059545614306, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015438279184580702 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06020601780769939, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001104187247297194 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3095076259209654, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004504005664338164 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09513479449596876, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015626056932077051 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..718e74a67e73eede110a87e564df048020c716a4 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.34279547123639, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02166437435240052 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06367441592900581, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001194655773448425 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3273817810829883, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004763653283179556 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10065904593799764, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016754751356902707 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028523558899898493, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007310056361867258 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15423603065118352, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032851282926083694 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04523413495038415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010527829629444607 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05993520541418932, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011028564197777878 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30883518804645416, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004444159365713122 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09483171445464417, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015525134351789466 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06057732250287014, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011347979681458663 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.31052564238961033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004439053679763851 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09570320653415937, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015864428965022782 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6e073b56b224c11973d92fec546f8d61cfcdab23 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.43068686455258365, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.024558626439848394 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06591108347919172, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012472199657513222 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3403235719405941, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004965628611695927 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10410497627752861, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017128654339676542 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03003354094036042, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007445009962094013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1663946980145394, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003627902758005641 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0477723289558304, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010828661653623512 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.061647771870220795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011365079087437059 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.31937107624477157, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004623821764283096 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09752610184478055, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015891934785872816 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06251543627392657, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011656752479938524 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.32334680308556674, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004688368905057958 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09881610204913661, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016204593561223266 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ba4661b0441ba357068c99be64c7fe3c7e2e18b7 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14094551178968198, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017988042403353308 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2383379873289029, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024508365201313925 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16466297522045426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017464500568992482 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.025826231379801598, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006644756372248472 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04562095099618684, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001260309972555968 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03044265380148028, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007549449327851908 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1141936744607556, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001311074823465258 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20047392294507563, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020851227283842106 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13521621786999796, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013074426897338972 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1281224911907099, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016180585138979911 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2177477559969978, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002237821831406095 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1498377131098679, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015625059702703778 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.150037493962955, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03792522803644501 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f598595fc09194e6ddcb1a0ca34ce5109f814084 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14622799391003813, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0020068025807149733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24101862122339654, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026276208678892242 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1683204053948335, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001892698106994734 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.029667497362948447, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008466619702056509 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.048440765255034476, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012946101473055032 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03354144102579964, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000822566284455867 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1138608269905594, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014746185711284013 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1931547974295735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021274307166620926 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13222515812033397, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013920016810944796 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13544349261022215, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018568387839824677 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22406954780205265, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002449960379940128 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15608955729869492, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017500765734040384 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5968121086484615, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.054851748142751296 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b02e80c19456e2031add3391e2e87c1e4ed15640 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15460966487470837, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002233041531383059 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23977523386714922, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025640624695031644 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17044100733247006, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018672130638160281 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03324641794167163, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010616588597732964 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.051106504151232426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013379696967192748 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03537634555402942, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008649089367972104 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1222092984923369, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017390941193497359 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19463277997734565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021294441696277336 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13554325862504094, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014028716662179363 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14302654547194457, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002060935061365854 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2233107296658696, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024112074184366853 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15795207740196257, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017219827845479745 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.7092164171091249, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08765489082275082 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b33a48ad4d71e45862907672c435e1d0272b35e5 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1406901039188124, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0025666252762842315 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.19970447237610153, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028390196402756584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.14408176000895695, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020016420554769035 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02922353525732899, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011010583273786127 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04191034328930793, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012547885060256734 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.029377172063398457, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008005810773268516 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11281690861703962, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0021122923732267928 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1629060920599739, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023571083502973668 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1153303057335899, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015400634901938468 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13076056418582657, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0024324238744350382 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.1857999771905377, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026706910367050693 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.13347692311901044, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001853011425694174 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5463404291438052, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08984875953099804 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..171c2e508312569b956758d18b2c36830b5a5aba --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.047637385711642166, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019406862995964113 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.06935875426191872, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002476239873059244 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.047912419187255355, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016885974181252042 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.010533587881846619, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006829459294496357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.01575083046773536, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0009533335963566146 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.010490684660423407, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005736260642904359 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.038907290376934564, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015632211619916261 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.058100266035812934, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020878258346479737 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.039331394950418846, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001357076427861084 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04422693909381412, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018055836955325499 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06455710260564228, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023114528926315003 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.0444398924940209, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015649101599922706 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.3661448228518088, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.033027262924505495 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e9d0f2852747a8c862ba5d2d27d0a208871619ff --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.008290393984892647, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0009001034412792107 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.011802367196652718, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011618281791076293 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008313843592026254, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008265470763649947 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0020266217301853685, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0003393709813488467 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0029487651946005756, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004412972611158346 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002040994959246997, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00030407491270912355 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006721799139189244, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0007186545260376111 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.0098857093481712, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009864294742971877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006771006570745668, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006635749098480861 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007648580835406893, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0008266968946583269 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.011070549839007678, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010938104264188817 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007705400987609899, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007633405146045267 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 6.367443124232542e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.2685163547005723e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e0d28273c1f5cc6219a9725e64019a9d64491470 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 3.967183056283888, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0614451409180861 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.17322199542522593, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.001766739101818456 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.3497612117638542, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002145765234933453 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.22316500100906603, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001595359423456744 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.06666478811553239, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001052128094651409 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.13513990600107753, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0016103984793018583 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.08520789194179026, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0010270065001763392 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.15393062571271574, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0014926257950038774 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3136929917594451, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0018044289406178228 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.1988974965351846, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001304080390696196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.14930193885489784, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0016069977963074835 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.30276071858573167, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002055681489475386 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.19244613018340564, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001468684623588083 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..48845b8447cb0d36a7afdbad4a5a99c439a36eda --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 7.24858195158816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12182015441698014 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.40889005404754675, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003409449253825524 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.38260655862871273, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026522545736220606 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3648604782443927, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002228919554367123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.17304656619126002, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024265933354054277 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.15533741505167725, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0017940218081133016 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1492665013164553, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016682679997427913 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.30433231462665566, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028037834853861434 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2870278031145814, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022278844415098828 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.27089646277222484, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017762835796866921 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3368390621347027, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031362360403701063 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3129980401000163, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002411291755571875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2988385773578741, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002083312510474344 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e37e643a6f0fed016eabb85c1ec7cb6d3ca387fa --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.8132898005392, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13889694589808027 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.472247337392176, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003509675155475942 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4109851055076836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.00266754752683629 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.40949266454624667, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002227174072645473 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2221300194890402, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026008629952829765 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18747167156183062, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001966631075668386 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18759073054766637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018155332514371313 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.34810606304380215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029168836617550075 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3037441519487516, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022352968777445397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.30101808824060367, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001845167102197219 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3930359663685668, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032821280577162463 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.34128557450637836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025177617791370846 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.33997209628594915, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021704693429880294 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..337efab23589b86e6880892f0aef77ca028ad3a8 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.606901971322037, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1876717173587565 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4792720578842871, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003435623212611771 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4299540279680867, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002709552589644585 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.423107786753922, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022021533625304172 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.22961096510876788, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025354521714354276 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2028531159711805, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020459562906288337 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19914466926004393, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00183134409853892 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3508612926375425, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028773466225418217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.31576853558586987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023159029356283776 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3089647180477385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018748237534710302 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4010458372923884, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032049720170719783 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36015366099876867, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002587495579628278 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35385970959123086, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021714504772349687 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f8265ea1df741c2d37477adc34c1d11100e170fb --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.637879863244894, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16226309008051826 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4652304352934913, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003337521287505696 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43528505234512976, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026695917030513756 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.42194593310296813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022114287389486177 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.22302025310290544, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002458367724539737 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20597912934683074, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002051470584078235 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19912988966042086, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018245099743948883 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.34089523951143247, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002747821577994244 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3209553243957463, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023209551472440425 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3089991444775559, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018682388377063268 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3927848741866132, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003065974270261921 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3689097427358982, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002571023680832107 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35671544335154326, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002156063389652602 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f4eb32fab8ff1fa9eb8677a46b9ebc35b504551a --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.26475738478149, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.10488019812696231 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4479742544722184, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003108871411245775 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4423554172558611, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025756769738496397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.41955022171167694, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002065255587289289 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2123975185096454, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0022240580364677317 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20778597326112527, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00197971650755932 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19644636492905912, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001708355406787911 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3257902997295537, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0025340439153237536 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3232398560031394, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022135147638730015 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.30489490110399153, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017356656037540608 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.38025656291521354, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002865492941990049 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3766640128082206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002485268728296478 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35648196691681816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020231414730809993 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_0.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c10eb45d629ed8fc8d65e0271e5ebd45d81f0d3f --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14955286652112415, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020266295880405774 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.35543546517620694, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00442547747797648 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20694913889331623, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026118174574717734 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0376041381568334, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001193655014731505 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0933869055501563, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.003010569547553423 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05271536971805359, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016602940533088598 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11702196333102838, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001508489395430335 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.281518689350463, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035793211165099544 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16253221143739943, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019871124537594923 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1163142271090814, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016972579238893975 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2797387075449087, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0039649519854766495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16153438576143062, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002249256594915832 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.1575498448959216, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08919411230958109 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_1.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0ef9ec33781e29d3c6df229139d13262d457a153 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11987004390929652, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017838594123509761 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2966409602445348, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004159126214657732 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1687358123113738, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024129362829470083 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026631555586252555, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010212047218259958 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06832787071429165, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026781644808146748 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03787201010606323, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014498387144822385 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09946412096799201, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014047697344840638 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.248112655710228, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034716802936847493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14027382835276725, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001921605105364016 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09372299032008248, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014604124390732933 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23430014881481423, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036250515591870363 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13228905712132874, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020123169172413372 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5635386724766893, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11199220007541402 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_2.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6d02bef4e9da9f70e17f75ec21800c1b4710125b --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12261802535697702, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001802015575276267 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3042881483021127, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004239856666150261 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17272164395046263, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024442934880362266 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02801123042219147, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010421626554945002 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07221142765808251, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027494039338407683 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03985376122882166, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014771066414781765 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10218618041428032, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014181507052656937 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2550776992609646, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00349622255520093 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14412504060617204, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019378546005162558 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09563780121752037, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001506049442354842 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23952794956934653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036934108853552503 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1350224868091867, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020648079219729885 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5884835216922304, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0694220243258812 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_3.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f26f61862a88a02ae663aca4ff7f3e3cf4a60d --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12058771231639086, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002066164336399918 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.283378982179243, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004430498021847181 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1651398268476812, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025732765693385513 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026878830813233837, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010536649719391797 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06558476547253786, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002641200590918728 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03726421510075795, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014326890233943264 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09972103113703992, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001673601901658887 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23548429603769053, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00364743143336554 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13662385100336102, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020655105556114887 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09474676528107442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001734800385670887 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22375657894123885, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003765688599090495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1296880556548729, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002127865421306681 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.548658255159644, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09243037162628143 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_4.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..28ee15ceb5c01f2b69b5fa9feadf60ad89a2a319 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.03871656302800435, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0023171515461883206 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07297233644463587, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00419731966694904 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04630458791276842, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025747339870623113 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.007010252770233402, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.000677642525994807 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.015453001281963676, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0014999985743029969 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.009197972474873806, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.000868833115217779 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03131649789252053, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0019045755355521208 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05884937656119138, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003409137251073175 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03723052598616332, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020759578853067283 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.030881510184046758, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019314337019311182 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05735625281670475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003380740089049823 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03645148435287092, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002076771980839672 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6621697454846989, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10164971536579874 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_5.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9838ed9c9f6f5556bb8940670d030fc28be11bf6 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0036570101092707552, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0009755024739951457 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.003158552109934381, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.000860982778191664 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0033252826117525294, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008934297630156492 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0006632141135470769, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00022782933435935797 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0006369853770402868, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00023576116891012097 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0006422730362464498, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00022885115664468214 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002516549335872895, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0006650456872731031 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0022033496898103025, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0006061893464627548 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0023002231158666315, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0006174742913966595 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0030601262050967064, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008066078492200342 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.002680985690153414, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0007365936380419417 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0028016428299652346, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0007514162209604014 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.2741760295045995e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 6.398898398772146e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_0.csv b/perplexity25/evaluation/rankeval/perplexity25_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..16f6b613452105119f77631a508a67976955177c --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.01500870618212173,0 +anli_r2,acc,0.335,0.01493311749093257,0 +anli_r3,acc,0.3333333333333333,0.013613950010225601,0 +arc_challenge,acc,0.28242320819112626,0.013155456884097224,0 +arc_challenge,acc_norm,0.30802047781569963,0.013491429517292038,0 +arc_easy,acc,0.6338383838383839,0.009885391390947731,0 +arc_easy,acc_norm,0.5551346801346801,0.010197216690356425,0 +boolq,acc,0.5412844036697247,0.008715193815788284,1 +cb,acc,0.32142857142857145,0.06297362289056341,1 +cb,f1,0.21886695057426764,,1 +copa,acc,0.8,0.04020151261036845,0 +hellaswag,acc,0.4554869547898825,0.00496996845825617,0 +hellaswag,acc_norm,0.5894244174467238,0.004909328992915069,0 +piqa,acc,0.7285092491838956,0.010376251176596135,0 +piqa,acc_norm,0.7279651795429815,0.010382763786247388,0 +rte,acc,0.5631768953068592,0.029855247390314935,0 +sciq,acc,0.828,0.011939788882495321,0 +sciq,acc_norm,0.734,0.013979965645145165,0 +storycloze_2016,acc,0.6889363976483164,0.010705164869803167,0 +winogrande,acc,0.595895816890292,0.013791610664670845,0 diff --git a/perplexity25/evaluation/rankeval/perplexity25_0.json b/perplexity25/evaluation/rankeval/perplexity25_0.json new file mode 100644 index 0000000000000000000000000000000000000000..731528d66fce9c70244fbbdeba9872746a66dd43 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.01493311749093257 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225601 + }, + "cb": { + "acc": 0.32142857142857145, + "acc_stderr": 0.06297362289056341, + "f1": 0.21886695057426764 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036845 + }, + "hellaswag": { + "acc": 0.4554869547898825, + "acc_stderr": 0.00496996845825617, + "acc_norm": 0.5894244174467238, + "acc_norm_stderr": 0.004909328992915069 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314935 + }, + "winogrande": { + "acc": 0.595895816890292, + "acc_stderr": 0.013791610664670845 + }, + "storycloze_2016": { + "acc": 0.6889363976483164, + "acc_stderr": 0.010705164869803167 + }, + "boolq": { + "acc": 0.5412844036697247, + "acc_stderr": 0.008715193815788284 + }, + "arc_easy": { + "acc": 0.6338383838383839, + "acc_stderr": 0.009885391390947731, + "acc_norm": 0.5551346801346801, + "acc_norm_stderr": 0.010197216690356425 + }, + "arc_challenge": { + "acc": 0.28242320819112626, + "acc_stderr": 0.013155456884097224, + "acc_norm": 0.30802047781569963, + "acc_norm_stderr": 0.013491429517292038 + }, + "sciq": { + "acc": 0.828, + "acc_stderr": 0.011939788882495321, + "acc_norm": 0.734, + "acc_norm_stderr": 0.013979965645145165 + }, + "piqa": { + "acc": 0.7285092491838956, + "acc_stderr": 0.010376251176596135, + "acc_norm": 0.7279651795429815, + "acc_norm_stderr": 0.010382763786247388 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_1.csv b/perplexity25/evaluation/rankeval/perplexity25_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..68b1685736b31b7998115d1af474023c7c186671 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.338,0.014965960710224468,0 +anli_r2,acc,0.316,0.01470919305605713,0 +anli_r3,acc,0.3383333333333333,0.013664144006618275,0 +arc_challenge,acc,0.29436860068259385,0.013318528460539426,0 +arc_challenge,acc_norm,0.31313993174061433,0.013552671543623497,0 +arc_easy,acc,0.6380471380471381,0.00986099146668848,0 +arc_easy,acc_norm,0.609006734006734,0.01001299223254063,0 +boolq,acc,0.57217125382263,0.008653474894637178,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.3633879781420766,,1 +copa,acc,0.74,0.044084400227680794,0 +hellaswag,acc,0.45030870344552876,0.004965078477435578,0 +hellaswag,acc_norm,0.5908185620394344,0.0049067795231926645,0 +piqa,acc,0.7181719260065288,0.010496675231258152,0 +piqa,acc_norm,0.7247007616974973,0.010421429277369531,0 +rte,acc,0.5379061371841155,0.030009848912529113,0 +sciq,acc,0.879,0.010318210380946095,0 +sciq,acc_norm,0.864,0.01084535023047299,0 +storycloze_2016,acc,0.6814537680384821,0.01077416522976135,0 +winogrande,acc,0.5737963693764798,0.013898585965412338,0 diff --git a/perplexity25/evaluation/rankeval/perplexity25_1.json b/perplexity25/evaluation/rankeval/perplexity25_1.json new file mode 100644 index 0000000000000000000000000000000000000000..81708d390eda0533dba4f7fb5a5a890936f8b6a6 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224468 + }, + "anli_r2": { + "acc": 0.316, + "acc_stderr": 0.01470919305605713 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618275 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.3633879781420766 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.45030870344552876, + "acc_stderr": 0.004965078477435578, + "acc_norm": 0.5908185620394344, + "acc_norm_stderr": 0.0049067795231926645 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529113 + }, + "winogrande": { + "acc": 0.5737963693764798, + "acc_stderr": 0.013898585965412338 + }, + "storycloze_2016": { + "acc": 0.6814537680384821, + "acc_stderr": 0.01077416522976135 + }, + "boolq": { + "acc": 0.57217125382263, + "acc_stderr": 0.008653474894637178 + }, + "arc_easy": { + "acc": 0.6380471380471381, + "acc_stderr": 0.00986099146668848, + "acc_norm": 0.609006734006734, + "acc_norm_stderr": 0.01001299223254063 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539426, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623497 + }, + "sciq": { + "acc": 0.879, + "acc_stderr": 0.010318210380946095, + "acc_norm": 0.864, + "acc_norm_stderr": 0.01084535023047299 + }, + "piqa": { + "acc": 0.7181719260065288, + "acc_stderr": 0.010496675231258152, + "acc_norm": 0.7247007616974973, + "acc_norm_stderr": 0.010421429277369531 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_2.csv b/perplexity25/evaluation/rankeval/perplexity25_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..46e4dda33f0e2964654a4fb74d39a71302e105f0 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.31,0.014632638658632902,0 +anli_r2,acc,0.345,0.015039986742055238,0 +anli_r3,acc,0.31916666666666665,0.013462309712005136,0 +arc_challenge,acc,0.30119453924914674,0.013406741767847626,0 +arc_challenge,acc_norm,0.3191126279863481,0.013621696119173307,0 +arc_easy,acc,0.6464646464646465,0.00980972894815149,0 +arc_easy,acc_norm,0.6212121212121212,0.009953737656542042,0 +boolq,acc,0.5837920489296636,0.008621380519419276,1 +cb,acc,0.375,0.06527912098338669,1 +cb,f1,0.26053639846743293,,1 +copa,acc,0.8,0.040201512610368445,0 +hellaswag,acc,0.4486158135829516,0.004963362085275558,0 +hellaswag,acc_norm,0.59061939852619,0.004907146229347537,0 +piqa,acc,0.7247007616974973,0.01042142927736953,0 +piqa,acc_norm,0.719260065288357,0.010484325438311827,0 +rte,acc,0.5054151624548736,0.03009469812323996,0 +sciq,acc,0.872,0.010570133761108665,0 +sciq,acc_norm,0.855,0.01113997751789013,0 +storycloze_2016,acc,0.6846606092998396,0.01074498911626067,0 +winogrande,acc,0.5880031570639306,0.013833112857645935,0 diff --git a/perplexity25/evaluation/rankeval/perplexity25_2.json b/perplexity25/evaluation/rankeval/perplexity25_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a3ed41246a160b9222dc0101fc67d7adb9f47578 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.31, + "acc_stderr": 0.014632638658632902 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055238 + }, + "anli_r3": { + "acc": 0.31916666666666665, + "acc_stderr": 0.013462309712005136 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.26053639846743293 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4486158135829516, + "acc_stderr": 0.004963362085275558, + "acc_norm": 0.59061939852619, + "acc_norm_stderr": 0.004907146229347537 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.03009469812323996 + }, + "winogrande": { + "acc": 0.5880031570639306, + "acc_stderr": 0.013833112857645935 + }, + "storycloze_2016": { + "acc": 0.6846606092998396, + "acc_stderr": 0.01074498911626067 + }, + "boolq": { + "acc": 0.5837920489296636, + "acc_stderr": 0.008621380519419276 + }, + "arc_easy": { + "acc": 0.6464646464646465, + "acc_stderr": 0.00980972894815149, + "acc_norm": 0.6212121212121212, + "acc_norm_stderr": 0.009953737656542042 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.013406741767847626, + "acc_norm": 0.3191126279863481, + "acc_norm_stderr": 0.013621696119173307 + }, + "sciq": { + "acc": 0.872, + "acc_stderr": 0.010570133761108665, + "acc_norm": 0.855, + "acc_norm_stderr": 0.01113997751789013 + }, + "piqa": { + "acc": 0.7247007616974973, + "acc_stderr": 0.01042142927736953, + "acc_norm": 0.719260065288357, + "acc_norm_stderr": 0.010484325438311827 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_3.csv b/perplexity25/evaluation/rankeval/perplexity25_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..6cca2bf42d89d6a92f42a19415f4e857ae291037 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.317,0.014721675438880215,0 +anli_r2,acc,0.36,0.015186527932040133,0 +anli_r3,acc,0.3433333333333333,0.01371263383046586,0 +arc_challenge,acc,0.2977815699658703,0.013363080107244484,0 +arc_challenge,acc_norm,0.31569965870307165,0.01358257109581529,0 +arc_easy,acc,0.6405723905723906,0.009845958893373766,0 +arc_easy,acc_norm,0.6237373737373737,0.009940646221513774,0 +boolq,acc,0.5889908256880734,0.008605429733982185,1 +cb,acc,0.375,0.06527912098338669,1 +cb,f1,0.26666666666666666,,1 +copa,acc,0.79,0.04093601807403326,0 +hellaswag,acc,0.4473212507468632,0.004962010338226347,0 +hellaswag,acc_norm,0.5924118701453893,0.004903815885983272,0 +piqa,acc,0.7154515778019587,0.010527218464130612,0 +piqa,acc_norm,0.7268770402611534,0.010395730264453258,0 +rte,acc,0.5631768953068592,0.029855247390314945,0 +sciq,acc,0.877,0.010391293421849877,0 +sciq,acc_norm,0.852,0.01123486636423525,0 +storycloze_2016,acc,0.6926777124532336,0.010669445081866666,0 +winogrande,acc,0.579321231254933,0.013874526372008315,0 diff --git a/perplexity25/evaluation/rankeval/perplexity25_3.json b/perplexity25/evaluation/rankeval/perplexity25_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8fb6290d851b87936587866e9ffbe49c4112fe06 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.317, + "acc_stderr": 0.014721675438880215 + }, + "anli_r2": { + "acc": 0.36, + "acc_stderr": 0.015186527932040133 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.26666666666666666 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.04093601807403326 + }, + "hellaswag": { + "acc": 0.4473212507468632, + "acc_stderr": 0.004962010338226347, + "acc_norm": 0.5924118701453893, + "acc_norm_stderr": 0.004903815885983272 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314945 + }, + "winogrande": { + "acc": 0.579321231254933, + "acc_stderr": 0.013874526372008315 + }, + "storycloze_2016": { + "acc": 0.6926777124532336, + "acc_stderr": 0.010669445081866666 + }, + "boolq": { + "acc": 0.5889908256880734, + "acc_stderr": 0.008605429733982185 + }, + "arc_easy": { + "acc": 0.6405723905723906, + "acc_stderr": 0.009845958893373766, + "acc_norm": 0.6237373737373737, + "acc_norm_stderr": 0.009940646221513774 + }, + "arc_challenge": { + "acc": 0.2977815699658703, + "acc_stderr": 0.013363080107244484, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.01358257109581529 + }, + "sciq": { + "acc": 0.877, + "acc_stderr": 0.010391293421849877, + "acc_norm": 0.852, + "acc_norm_stderr": 0.01123486636423525 + }, + "piqa": { + "acc": 0.7154515778019587, + "acc_stderr": 0.010527218464130612, + "acc_norm": 0.7268770402611534, + "acc_norm_stderr": 0.010395730264453258 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_4.csv b/perplexity25/evaluation/rankeval/perplexity25_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..964e78f05fe2f8affa75d21905255f0f3fa42793 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.326,0.014830507204541037,0 +anli_r2,acc,0.345,0.015039986742055238,0 +anli_r3,acc,0.3258333333333333,0.013535422043417452,0 +arc_challenge,acc,0.2909556313993174,0.013273077865907576,0 +arc_challenge,acc_norm,0.31569965870307165,0.013582571095815288,0 +arc_easy,acc,0.6435185185185185,0.00982804654450442,0 +arc_easy,acc_norm,0.6144781144781145,0.009987250004629007,0 +boolq,acc,0.5767584097859327,0.008641391399113586,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.27476190476190476,,1 +copa,acc,0.77,0.042295258468165065,0 +hellaswag,acc,0.4433379804819757,0.004957637648426472,0 +hellaswag,acc_norm,0.5919139613622785,0.004904747752286929,0 +piqa,acc,0.7159956474428727,0.010521147542454229,0 +piqa,acc_norm,0.7247007616974973,0.01042142927736953,0 +rte,acc,0.5234657039711191,0.030063300411902652,0 +sciq,acc,0.862,0.010912152632504408,0 +sciq,acc_norm,0.85,0.011297239823409301,0 +storycloze_2016,acc,0.692143238909674,0.010674598158758182,0 +winogrande,acc,0.574585635359116,0.013895257666646378,0 diff --git a/perplexity25/evaluation/rankeval/perplexity25_4.json b/perplexity25/evaluation/rankeval/perplexity25_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0d23b7d3b791913c60bc72b4f68c6d2746569511 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541037 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055238 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417452 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.27476190476190476 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.042295258468165065 + }, + "hellaswag": { + "acc": 0.4433379804819757, + "acc_stderr": 0.004957637648426472, + "acc_norm": 0.5919139613622785, + "acc_norm_stderr": 0.004904747752286929 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646378 + }, + "storycloze_2016": { + "acc": 0.692143238909674, + "acc_stderr": 0.010674598158758182 + }, + "boolq": { + "acc": 0.5767584097859327, + "acc_stderr": 0.008641391399113586 + }, + "arc_easy": { + "acc": 0.6435185185185185, + "acc_stderr": 0.00982804654450442, + "acc_norm": 0.6144781144781145, + "acc_norm_stderr": 0.009987250004629007 + }, + "arc_challenge": { + "acc": 0.2909556313993174, + "acc_stderr": 0.013273077865907576, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815288 + }, + "sciq": { + "acc": 0.862, + "acc_stderr": 0.010912152632504408, + "acc_norm": 0.85, + "acc_norm_stderr": 0.011297239823409301 + }, + "piqa": { + "acc": 0.7159956474428727, + "acc_stderr": 0.010521147542454229, + "acc_norm": 0.7247007616974973, + "acc_norm_stderr": 0.01042142927736953 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_5.csv b/perplexity25/evaluation/rankeval/perplexity25_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..caf4184ffe14243049ea9d31cc85c24cafd0d8c9 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.329,0.014865395385928357,0 +anli_r2,acc,0.349,0.015080663991563098,0 +anli_r3,acc,0.33166666666666667,0.013596836729485176,0 +arc_challenge,acc,0.30802047781569963,0.01349142951729204,0 +arc_challenge,acc_norm,0.3216723549488055,0.013650488084494162,0 +arc_easy,acc,0.6401515151515151,0.009848484848484846,0 +arc_easy,acc_norm,0.6136363636363636,0.009991296778159619,0 +boolq,acc,0.5874617737003058,0.008610223886822883,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.2909356725146199,,1 +copa,acc,0.82,0.038612291966536955,0 +hellaswag,acc,0.4449312885879307,0.004959425421382028,0 +hellaswag,acc_norm,0.592212706632145,0.004904189257891276,0 +piqa,acc,0.7236126224156693,0.01043416238827561,0 +piqa,acc_norm,0.7268770402611534,0.010395730264453262,0 +rte,acc,0.5018050541516246,0.030096267148976633,0 +sciq,acc,0.869,0.010674874844837957,0 +sciq,acc_norm,0.863,0.010878848714333316,0 +storycloze_2016,acc,0.6825227151256013,0.010764505409830935,0 +winogrande,acc,0.5706393054459353,0.013911537499969165,0 diff --git a/perplexity25/evaluation/rankeval/perplexity25_5.json b/perplexity25/evaluation/rankeval/perplexity25_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c187058cc2ec54ab161522774a93ebf0b8c1ce5d --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928357 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563098 + }, + "anli_r3": { + "acc": 0.33166666666666667, + "acc_stderr": 0.013596836729485176 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2909356725146199 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.4449312885879307, + "acc_stderr": 0.004959425421382028, + "acc_norm": 0.592212706632145, + "acc_norm_stderr": 0.004904189257891276 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.5706393054459353, + "acc_stderr": 0.013911537499969165 + }, + "storycloze_2016": { + "acc": 0.6825227151256013, + "acc_stderr": 0.010764505409830935 + }, + "boolq": { + "acc": 0.5874617737003058, + "acc_stderr": 0.008610223886822883 + }, + "arc_easy": { + "acc": 0.6401515151515151, + "acc_stderr": 0.009848484848484846, + "acc_norm": 0.6136363636363636, + "acc_norm_stderr": 0.009991296778159619 + }, + "arc_challenge": { + "acc": 0.30802047781569963, + "acc_stderr": 0.01349142951729204, + "acc_norm": 0.3216723549488055, + "acc_norm_stderr": 0.013650488084494162 + }, + "sciq": { + "acc": 0.869, + "acc_stderr": 0.010674874844837957, + "acc_norm": 0.863, + "acc_norm_stderr": 0.010878848714333316 + }, + "piqa": { + "acc": 0.7236126224156693, + "acc_stderr": 0.01043416238827561, + "acc_norm": 0.7268770402611534, + "acc_norm_stderr": 0.010395730264453262 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cfe1371b97e81be38317c15e3f44ebc790a772e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d2196f6de51aceb4e6065cd8c426da87bea495e921978621a5ce52e1873679 +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22dbef80927c932afe73d6692a4d2b4791728430 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23f2a15c2d185a6cfbf74a11dca31c5a40908752a7f6247109abc70698144ba +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..782bc3a248e02b160870980d4730695556fbdf62 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ae1db004ba1b6df6a441bef2f700420843e585f25d2c86769ea6a680b3b443 +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..395700f32d7e7e10f05b07a9a59ee2c72d0a169b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b92213ba48fc6894c6a9c296e4c6df049d8b494e054cac55ae7337d7b54186 +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62b1b7063dfe7818a6289efa96a8ec0829dac723 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:125f2e9dc31eb5f829fa58b576474e815b1e1d22b5fb1548b55717e49060b6d8 +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4dd60750829e036c1b579f967aa6e4748749119 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c0f8756587e0b55042476a727cd6c899a8bca5356294da149ce906be023c5b +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..019b8fbe79195894c91e9bcfdb108f9cc43e2d68 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04e01fdd8ce70410b1063d299c9ccd043f425de47dbd2712a7cfa461e152f8c2 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fc6ba245d2bde3815429983693e8be5f2827147 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef596e8c2f8bc491f203d06f082281eac38a3303de9cf72476f82a26dd0b3b06 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..685034af3b70ed3cdf44af9ad9c2e69f71198564 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc42ea19ea813e4e4cd01a5c935b8ff397e0b4d044365a72a351fb2a2c5756ce +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..774a51af722f7206d71b202f752d9692ec07fa8a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce80041c53ffe63785e39f08e142c2e46faabc3207dbed8fcc1dcb7cb380f8c +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..483f8feb11a6d6d13e0ad20d22cc9732d0909274 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77996049c1f8ecadb1c90e10548c5e38ca65f758695116f61eb7ebd7e655c002 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b19b01d2fe654c95d2d722e4013127574c37a03 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e69fa8af9763cecdcddf0b03499106dcf9ff3acd07b3c0c7c95f6116bc48cf +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bedd214a9e6331b549eb75013d1dcfbc7db94baf --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:affb16cf88ff94988ab576ec6e28c28626dd7f95e3e0e4e1f5805ee3f65c82cc +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d68245c71bec879a18922e2ce144c7c5939cfe --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02bbb021a768892cf211e6e6dce3c376862e4e19e0bd7a9dd0bf5daa8e55e9b8 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2532cfb54775e5a69269db2fd2589c98ce6b500d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b45b941b2022acc62746cb7c61d62144a967d42ba097accdd8461f493d4cea +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a164f86815fd67ee7b0f1455ee61ddb9d9ad7ea --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aba887a5b506d21112be7aa658c93e42957f0f0fd7d29ba9106d3e268910111 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a77075dfb46b5bf9e28329d8e57273113bd868a2 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dcf2f68e9834cbf3b2e069a36ae47c79181b7f2e6f242fdf024fe14ce52b66d +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edcf9cc8ea92f614d94912065bcce438273568ee --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d213610e9b7f1a18c8d7359b6beb2740dc762b6e1dc18ce7ccc95703c72986f +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c1bbf01f89522fdd48b99b28a58d634a0c801b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:442c8b23e6f3d4d17cbaf9f10c888f0101ca024ddc3bdc1605750baf9f4f3f9f +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc4d44dcabbc50003b156adf7032d29cbe30539 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf1a9c8919fb4517d45e538d9f8295bf4b6bd5c175115f590e5e75d7c342e9dc +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4141f12255d711cc49f4717d23ea095deca1d269 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2b0abda6ce4e4b50363e460f285d9cd7634c7d71357926577cb986849764e71 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a933c7f4bfb770f8ec288931a93d021ff7a7f8c9 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ecf9f61a5820412e48ea42e3bc467731ae01586f1e3bde0c997b82a5f8604b0 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f34e594953529fa3be4660beb4574f340d2fe005 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3570f6a915b50b27b45b97e7edb8be72a684fb3633129ec92bb31e6d274564 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..081c17bfbb40b2cebac6c3e222007fa01cb65b43 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae1ad1b13970707b1ecf252d0b48854f9ba78b3fcc41a929fe4ef723f48a4e7 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b9a71d6b9eee9187fd8e4d72ea31beb11727e8 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0705b48d4ccad93c2834bc98ccd1927d07c59d4971dbdcd1c4cda03c8e4fb9 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7151bcae17ebc2cb1c180edc2db23a92b4425991 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8195c6503f83c2c5fa280169ce9e070417267dadc2d410638ab72ceb64c0d8 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a280603ed005def4fc11a686124ab0ec2af01c9f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ad253ebef5ea0cfbc0d165e7ce5d3183d87b1dd8be9fc8061a6374d2c8932e +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce88b88774ee3a1c70aedb94450f634201e44cd --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4cb59945282c18d8889384943874fb5bd176a2b46f9aca61034af280b34d803 +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eab678673c676ea440e72fb3b197f4762dd102b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92dd71e5947ffa9642b7f9c634e48119b22ea34c5cf479f795e885069600054 +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8d37abee51896aa2d347c73d2ecfdaa984e64ef --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a564e278507739cfb3fdfedac0e4a878acd8d2bc59d11d9284c36928b50fa3cc +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..478b82e478c4924563b089fe25b5b10ea66c58fb --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3bbd0981b0ccfd87c2d06600e36148a4febaa4c850bc5b4ad7b2870757f7e20 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78fa3fcf998f920540c3d3809b28b7f36dd3f9de --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caae4a84a0ff532d1add32db24924f6cc60dcb826ecfad5ad7905e7f9582d943 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7f5151151e6cad02b0f86c9290b2fcaa5cea4e2 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e39157b252e0c351322a1b92eaf2fbc127887ccfb9566883ac327e6d437f81 +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3829f2bb70a6ce42693828576fd674f0a8d3325c --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e2f2bb1421035452fe8bad8a730e7e9f10f6927f2d09b0e798b87b29c009cec +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fee217bc239ea3bb3f6954e5859317c707d8adf8 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52dfaf8df0a1edf10d6490fd5531369784c403cf1c4b252c9c53b1f0338f9edf +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5db2d8eaa383822c70330ecbbe92d80766182df4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de452d331bea4f4c62c25e455f78219c0d323ff48634fdecb80da2f69005451 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1428ef97c04e27240785eb8be1732340da08423d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f0526362e0ff4a9cf856830991047ef0e6e625069fb8ab5f26cdc7eea2374e1 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6900592d9f6782421756621fe39cf40e4200de83 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8267ff1be68c4b68c794048b141a86b65dde7a7034935ed680926142fd1a19b0 +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..693e72d7aa7070400a5e63991e230696a39a523a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7700193b707cb933df79319d05fe06d1aff1ff63e5786ba44ef01ddab99ddbbe +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aecb14f000a393451b9cc3a3fa7a3ce465acfbc3 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc66bf9753588fdec4841ff8ba0776a9b1bf259c632109b013f3b88848e57d5 +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28d476fa0b3164b8614563708dd811708a4a458f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e80b2dba1afd492fe34d79fbb2ef0958e4f4db96e6f35f2f88a22b66241f7d5 +size 131963693 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e8bc83a5060e984cabaf4708a686cde55e46737 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73133f07493e17afbb65ccd959b23ac3876eb9d9fb37c8f8777d84ce646438e2 +size 131963693 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11a040f286ebde3f0b97f77d24f7cbb51d1afe95 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb80afb9fa012ece71e929235f652a3dff608034dfc6cd1f6636ef1186493d0 +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a7adaddee7689a31ffa3e73e8e4b14460d1fcc --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6d3b664c3db35543a7a50b2348f6b208e328e758070ad750ecf0e50bc681a5e +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09b9e153df62460900dd68da9e1e493075c90bf6 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08b8263388a4d3471cab2956502814726a9315067f2c11d824557076e12a39a2 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de2f9a54d32c7ee4e5dc167a478ab15eca5d878 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77abca5b7c4b269a3ed8211c229e9df03882562176830be09d051bb5d0361c50 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2301e7650ea2d3d80c79df4612742091d55201d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db3d6e7e6c4911b5cf5cb513d675c952ae73891105a65aec81b2542e10c9a75c +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7e4408012c0a9bc99f03d9bacd9a0bd87705d5 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0405217712131a8a71e3d353ace1dfd54ab86d21ed5b3ee2e8b07ca4d30383b +size 131963565 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23dcb41668fe93efd888671d6922d0feaf522a10 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cc6a77e71cc05633198f3c5a14e1f0cae8ee1ecdff63366a3c6f26d5e8fd1a2 +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e3e08287a63f85be369d35795944ade8ba6263a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b22db1970620a0e808d8bd49ea2b607be370e9e9264b9139267ab7c5b6878ff6 +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13cd32699ba5fabc30484d84b267c859b4d4abb1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef1a1fd89e5e52ffa7567f0c150a39b86e908a659763937cf1909ee012eacd81 +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..567e8c7cd7b11c25a46f86eb4816bad86de12bc1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e48403bb5b661d503556e50cfa5424b8ee4e4c7ebf87bead68e938f6afd84e +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e458f367a55e6dc57bc47ac9201892fd5d8b1682 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c595c7798a9c5200c58ab7e58b38b34673e352e5c41807da06bb0a125c71464e +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9113d97b9a8baab98c3fd02711814679cc584d4b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add5c542b08da75eba99db10c66ca674fb5b1f9cf81818fb7fdc06f827bd88d3 +size 131963629 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a18efdfd7779e27485edde6272d82614af1dc1e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8965f09af057f70e7ebf5b179c143f2ad83092efcff050264a6732d3c31dae +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fdc5b91453820afabb8bc14f6eff03666b5b2de --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bcc0d4dc620fa0a1e7337ae3e5f2629e1172d67762b33e542732037b07c770d +size 131963501 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66642a1a82be0d9c7a5fc22e568e2f453980996e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb76f6c361748b659ebc6bc43c2fc442ab23ddd172b7be80ad89ab44588b69da +size 131963693 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d0051bd1b9faed8c684a97da1ad994d2c150a2d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aca84d24fc59596294d7a2c783dd4576b5eb7bdf39d8c1f8f27a1e7164ecdd87 +size 131963693 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16d550038ca6b9ef56fb3eae44622be9afc12e35 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c871eeafc3df70c8edf4ab117d78f470df8586e84166fec6ccf005c44ca7f4 +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..416dad05a3a70eee6bb3af661923cb59b9ff4cd1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7360e87406a8fdcb36dae0070c2194b9ff2dd2ab170ce1473bf8506aec767217 +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d64b3a82a84957405213bdb3b26a71afef75ff18 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea0db422d98a79de7d257f3775d91117c1e1ab909b016307ff9df8fcce351089 +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8944a1a7068908d205143becd40dd6884c04c913 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:035d6084cf6ef1893f635389857e91e8a1f8b7b4b14343cba9f27931495b3648 +size 131963437 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a860d4462728aed7a6b93309f5860348d830af02 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3656b5d45ea0568a46c84e87f388cbfce30423a20bec690eab6a85b7da8aef3e +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cfd9b7a1c12b51f08c72597c6d138a622edbbcd --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f490da109db91d4b33b31d3b14a563a93d94c0153b233436118bfd7302d633f +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f2bab9ed61a09804947f1c3f374aa3bdfbfe20d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e984af1fa7679c7c3b75b8fc1010e0126cdb72ad528d7239a0962da2e17232 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..683c5a9a5f81af483f2c8432d2cfdcb568451327 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1812b9bd00e5130e56c6160a487b77eb96f97b97b7407171cedc3cc02d6d97a4 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76cf7f67832bebb4d295b635e27b489ca8cf6108 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc91d91e2a9ecd7a20fdb050e0a2a5277a5191dbb6a1394796ecd258c3c5d652 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac4d291681a84a1e84e058baa1c037ab031f054f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268ee63baefe487e5ae872c46e603ea4bfa7cc42d4e180277e42880c0b2d0596 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3449a9b0da65c8f8db596fec96a0e0983389868d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:355a721f64ddbc7b484c4e971839290736caad587ecbc41d09000c6d9605820e +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49564e01a57cd4805eecf6da6e919e777e77267 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:367712ca74b31446a78d59ac4ca6083938e6581ce963427587e6ea02fc25e8ce +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f07d3623bacb2c6f39b6e94063b568e1fbbb2000 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a25719db584e52af37d95855cef085cefc3110f4e17c5a5f3a64f664f1afad +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a68a9dcb5a7baf014f719d85444be0c9c1c6c013 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c7d8afb306e47f78d65a366caaf2dfab6dd5a1d75872a3946740b4379377490 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..110b95acd2e34f31f972477757ebd310c3cdd62d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a38e7c01e2165cbc5374e8a37db07f5b0c56873ce8d5e38608e9b45a5c9324 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5251f254dc9cbd32030e1d1c0a49bd956bc98c9e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ff81453618bcc96b5a68ca776464ea3abdf052e020051c396c262416a856fb +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e7d726fba0b9f1502af9921dd3ef8a9919e98c8 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd24eebcb781f1e7021c9991c2df8e4debcf0bd365139defe677fac2295f257 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99db2cc93f36f320bfec771de4462986de29683c --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23d8f1b7ffac7fb6385d3baf15fbefed2c3bb840fd538503132b1f6f9688bd87 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07032d15585e17cf66f5b176749563983c387844 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a05baacf14259e633e635075d188fc3087c50c23e46f190870d0ebd1eb71bf1 +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f42970231c5159209233e04b5a0707421326fbc8 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df645f86faa36dbfbff7ddf4abe7fa9cc560152019e2758884450220b0ac888 +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..400b0e7430398a05128790f883b3ec2d6823c799 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e54bbb83158bb7b6cbed4584b7afa89a65b2de74b7f5428b00790c6262dcab7c +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58860d3ac807803e0d6990e7a902e1d571159cd7 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:743d19d93df9cca254240ba752dc9e7f0cb96c9af465b95643d93363bf957216 +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31df99c274659dab0b5e6db91407beec52430f4b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1dac032921751e5167bdee8e482c86e0a4e1eb9ca8a1ca55a6d2cf6be3fb29d +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e60952f0e00b9f34e40feb7a660bf5aca691dded --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac2335e4fdb82ae078bfc4b7890117df85d9c09d76742657f92a90805ae08b9 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e211e476090d87a36e9128f29741492bb9b2281 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8dae04c4a52b2a6a4b20c271f88c92cc898f9111134c73b405a6abeb59d5ae8 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b982ce1e248caca7a9c498240b8761d58220531 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d57e4633b7052d42d527e3526d7d145af3405fc247965389bd45ed7918fb49 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a98b071988fb17948fda521e78e4e2ba3e839ccd --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79ebcd23cae18f9c1536a0a2b93d4db6bc63fbba064a30711643da9cdb1252c3 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..260cf0faff41a76a9e15ef772928732428a5a2ed --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de7fd2b94898a5a9621ea6ebc91f4163813db415e7df52601f8e598b8319b876 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ca965f4b012ca40f92d340fd44edc5d03a5eca --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb2314919280c9894ff59ce499b8bfdd150781f201a28524beab1114f927d42b +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eaa40b3f33f551dd2dff05ee17795d4beaaac4b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a2b1e6495dc042be6fc81e2ae49e7018e655b67f4650b30c0cbfb1abc56d79 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6752ef0ba7c11bd3882d7cbc907cabcaa762b47d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a23cfbc88d770fc8ab1bf4562c574821b68ad08905e15156decc3e581a84831 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9efb75ca55e89cf004feb7aadcd6bb0f85775ea --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d35554742930bb4a9ef02e4ab4444a5acd24c5607dfdce43c8560c2e2c995b8 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76e7d30bb5d5849c7b125e2791bdf35c3a417380 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae7ab294fb4731dca4dfb113d412f613174d4edf156ec441387818ccf81a087e +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1265ae6adf941530954b157d184edd4d01417a95 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a6405eae53d6360e983d32827e8df7c31ca68601ca079cf2208d7a2967ebc6 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0773f8728b4b1059aa5f0678dfe8a162374a607d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b21095357332f590bdba75914e137e64854cc6f81dcbbf675f9ac477068931 +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db705e290d3dc73a8da3ea29cd6c506779e4dcdc --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84e02c7ffdf6e8f86f967e97aad0278f728ff720f5cb9af87685e36df497c8fc +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da04553139f40213134fa4a7621e18e6075064ca --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c0233c168d8e44b47de2343e7d421b8929d922ca43e6eab551687acc3587574 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7da549fb87d156bb8b6284ce33981fac5c715cf --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39fb8a6b1b86c932639eeb184dba6ae6f5f95f0dbc6a51f13f6891d4e2bf3f94 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce75e65bdc3eb5eae3f73f789b46352b2dd8341a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f31b6135e851c16061e5675700b09c203aca425241dd587cac4d43ddd360a35 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a68badc2e5ac63ab21897a1e9c0c7f8b0f70014a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3825807c48572e17c3e96228cbde332adb1b588da07fda94a28988fb5f3ffa55 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83147fe4df03baa12b4acde81e5a81fb4ebb541 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bb31dc7acd8124f7d3b84194bfccacc76e4a2738ced3b798b89294f9f402771 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf543b2156ba1a3e612c77c8380e5cdba46e75a3 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63040cc064762b2845d2d1ca2974c38b53be34eab8f0f344768657a7baa44744 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91aab96ab2675f3eafd2f10c71baa548a5ff1b84 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce0c29242a5edc840dc3c3da5c61a3194fc7a51a05a334f121e2cc804f9af02 +size 131963543 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21f97d5a168d3e084198c3d81bebd13491b0698e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5fad30b30eb86dd083021b3180fb4b209b8a89a9e8784ce87d14d463c3ef2f +size 131963543 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a323202d392517d1b7c90eec88f8b936dfb6175d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2793e3715d18f60836ed5ad1b401a697a20b6bd1010a35d7cfc3c95f5ba4f4d3 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b016f905df01e663c77477d62d9ce5c0cf1ebbe5 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa13cbbdb5b6357afff8031c67390735466c11ee9dfcbc8e8fd1ecbd367ed51 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75bae522b403bb7d3c7b37f943513565cfdae02f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a21ab33504127d26f0b16fa26f1bffd884b80ed39b2b72946715f87d1d669ef3 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81859f5283725a052d67d692c33383e06430f6c8 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa0a9fafac96392018ae0899dfa58c8f19caac5fa6d66fb8f853de8de9dc8fba +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d778abaa0fdff7b9e3e844f41cfbca1c60a5ad4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ec58afb5a003a94458df7dd42f530dc16f8605fc9304bdf18998ab1f784b20 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0e504449fefa0c7eabd76546c7eb6384b6e3a1f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88507323e1516a8d108a438fbb104aa1146fa84af18c7c7dbc6a4e54b302073b +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01cfa3ab92795f0258b626d014077aae5f4ad21c --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d4c1abf254003582f4b1385fe3f1f390a23054d9636958f24591da49225a28 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf7b2586fbbd6ce5f0a5697ca089118fe04fc3c3 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7723204a03ae2bd7ec79cad55fbdb7b74967fa8075d04ae7e49b5fb38ba6a7f +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a673efe563bc9fafa32a49cefd1f89b431505c11 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5817748e50bbf855f79fa23e1da74b3b874b91c4e6a9a73433536643784d6a +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d99e5a18d0de1cc8953732b3e9b1596041e0868d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be420abda363abcd9c89642a807639b60521e59407fde1fc8203458cbe44b39 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41ca1f4740829ae220cd2c975cdc62e94961360b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90dd3a7806ca7dffacece727939d02f84303dc1fd9b7ca4f8352bd6a27e1a3fc +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2db25c8bcfbb11e443edd2889d2b2650d6a2876d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19a534a82824838e469b3ab28a438d3d435dd56ae9982f031cad95a07a496d6a +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..138beced59df95890c1472c7c3da3d44bd1e70b8 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:593a693dbde699bfc394ee5b936e2241b2e9efd9534abef64579ad9cc04671a4 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..445437d64ada2ff94b9c3f648ce7ebc0ab35f6d3 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:541d109cc498d0042906ed6742359a385a5c0062745355e0acb4768e1f2b7abe +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb0ddab982eee8dc8a08b478689a319ed2cd6afe --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48f4ce84c7c6634e81497d43a157d59a78995b60665a5902456efd41c1fc679 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..756bb84c2f8f313c97ab28e8c0f7221d691dfbbe --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17da6ea8cfdf6e63d9ce1db7de8ede677214145a728c9e7be4aa0a47a74ed5f8 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec6b15443ee4e561d97f860f14d06114eed7bb66 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445fce5ed864fb16ca6c4254711bf38da9913aa53008aa1d37fab0e84e2bfe84 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e91cf5faba8b6e63988b44e077c406f6199e8e32 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d980c2f1c9c3856419c368473d9d2967ce1fd5d6e41e20edaed5c879251b8d +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f374224009c530746e28c1184e46bb9796b9b3e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790e6d9050042332cbf83d2d766bf8d640957cbc5660d8d3d80e34945701812f +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86da7ad1714ba7ef9056653709376a3eae7d5c52 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c13c41ede8ff1fa5ac0f37b2e27800552faf05bce3d77005679513515bf30906 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4effb87abe13c70a5daac7c381df9cd7d635df4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18cf71854483aaed96ae7fb708e9f330529862d177b2daaf814419ccd35ef534 +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c3ce55f206313dc1f33da8d3528063cf8d20367 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e259d78ff63ee51d4a59a4466e0b62797a2613832a68cbd13ba82af8c9f8469d +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2241931d08ec81312f9c1667e3fd7cf1caacb629 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c054d956bbdaa776b737b2481fc94afda5a36b5ce9764ab3ee45395a86dce39 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f83c3aca594927100f89fb716b155723445d15db --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00060583abc901e77b7d67b885aba0d8c62c217aa93d533200a4b9fdc55aa7be +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb1a1e5d51d6a998dd2d772bc39172ea09c6c4c --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea43f54a5b02d118282a1bea0b5064fd0dcb6ca6e65c37bcd7900f4d0469383 +size 131963746 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f08404188206729c840b163c4e1ddb9ee41fb5a3 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83907ddfcdfa4fe27ffe2e9efc74d20f37bde2c5654ea891698961d7494e0e8c +size 131963746 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..187293c35355eeb8e153ffe3b84659b5d1a4d87f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80f96e25513fdb450defa8e6bf55a206e1772a8cb649abc2b5b6747041dfb096 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c55c00f61230d2c6fe0c58c743db6fb05934b183 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9768558b311319a254fb571ccfd778b9704768cd6f7a4182da2a65a8f4a5e995 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd7ae1695747f652c19763704d78df04c4d060c --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84e0740224f421ed9c298eae31c52daf79e44375fbbabcdafed5f397520ed7f3 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de8ee561addb9d22999f3a272ed609a7e4d45c8d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e74adb36305624f39e02892ba26313287e4f33b1949a67b8fadbd8bd88764657 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b0e8ffd9cd152044d81e8036331879e49f452ae --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1776e09a3020e6c56a1c89b7f5bc2522c9f92db46702cbb60106fd4690933b7e +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..792f38f46c60f650e14c214c6d482a651d7b7df0 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92516722334ab7ee575c8bd27022827eecc5332ac9f86ad087e461131f769b26 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f4e1f49f08f4bde85ddada967510854032d197 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fe6e8c150f02254f73a84da5faba9f9ab7762f7ce7c0849fa5155dcc0a62ed6 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..524dd9aad1070f3de77e97d8ace2f7695e984874 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba20d07aed78829f50a1523588d7f3e9390f57eddad10a44c2fb3ed1dcead639 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c9285d2aec0c7348d519d7defada209bccd00f6 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:441b1b1ad04b07e3af726b3d86fcab7d5eb1cb588d0ec841dc6ae8cb3299ab0d +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ecc696b7bf0a9a8eaecaa645e7b84f2ba497b5e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5306bd8307b374b1c3f85126a55a39b2a458b36812b51df60eb14402e28418a7 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8869bd5de9a040f96ed853bedc6b69be22550392 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f68163aed232f5dcdc54e8da68103dd0316fc352b8f72f532fe04e088be8b0b9 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af26c990e9c5589a198c496a5d5506868561eedc --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48101e2bb2927e496a7ef789d9e2bbfe065b75f7dfff2836e4319112062e6c18 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f15391691ec0385089a95c22b44fd83dae12718d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05fb348a84862c6fa63c881a23a0b31026867b5da84c96d26a098a17a63391a +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d4a7b96c19ad0ec41892682639ed2315754a9b6 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cef1983c12c0deee6f5ecf1a13e59f2d4db3781d7b5adb0a24b0e24c1f985ad +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de87dd5101a580a94cde9403413222a3c8b4d044 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1971206d09b206dec89239d758ad82f37be32e04f63c1ee548b43d75e16f00 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f80e744d5c73b885d56f0dd292b0de9bf4ae1620 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c331b0dcbe099ffd75a2414c1fc636915555d8acb488915ba364e934da1e3b +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4de4534eced05157326097fe8ae4d9d2d4172e5b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68f874525308353cb229427a399080954c0841dd9585cf59b59fed93d5457e3 +size 131963607 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2128b8581a469e2e711f9484482ee4b2034df3c4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71850538dd3f28f0d091dd93d8cce53c7ca471c9173587b4d70b601738195160 +size 131963607 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6052834b841753d4746625af9df3778a1d12ca46 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8d55d5588fe357fa8bf774c20f4c9a8fc4a491314e7287932f9899812817d5 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b71ed5d3ecac677e22519476c8a37bc4f3ab1fa9 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8e4e7220877bfe913845a3151915691009a2204eadd753d0ad3a61e7fbe14f +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27ab4ce964558a6d06d24741cdd6d00a0ba8229b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb50cdc87377816f0c1899bbea43a5f040b5389112e0d6c3503708d4cee2b5c +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..def7296eba78a46aa146bf7a00f46b22414cc8e9 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2e6bad5f57a277349be473f48670b4d6c0032d0a5ddd7b84cecd05b8bfdd49 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d340b8627e7d0e4e9700fbc918bae7d4776b4679 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a414e0d502258070ed0b8ab261488500e66cd2b37b5fcc9a7eefa85dcbbdfa96 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b252d5b30526a1b11d9289dbbde4feae263196b9 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe4c48759c5261a224aee270c51279761d168cc0165df659966b5b5d2a7f700 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31fb50aaf5b05a92e7ba14b64cc2ff7a0622c463 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b86e521a05ac609fc7008751402cd5b63271b1a73ecfeff264eb87723a0bbff3 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9f981791a74323364a0a9d2a2896edc8d5712b0 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32109118246ba830d454e273ac4b459511174bc618e1116d2741621f659fc43b +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..480a60b78e090c27a716b5b6de6b58ae19b8cdd1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c4b8c26ca42af0d31bf729999c68c689b6bf579266314fb43e93c12d8b66bb7 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c6e32269e691b1e27344a67f140d7cd2612c39 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39179693f55e42279a93d0d1eb527e95b88a81c55d99ca6bc9f138830a73b1b6 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed5e59eed11e48905999be84edcb06b505e63ea --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82d779056d2b9580f67e2b08e3f0c08aefbd80b3da8f9ba52b0ff6ff600a6287 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f26b10971ce7ba3b0ac7fc0d3e8ff98d3dfd02a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910293d0d1f66ae0d81b783effb1a5a3d78a2f8ad4b09bae3631795a9940e96b +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..099af98dfef926b63b41d8c8f73cf89a2dba3dfb --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3348b87741918b400d234efec90847ebdbc9348b356c721b8ad013d36cee5ee7 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..832d76d4e49c411c0122dcc3012818b27489653f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fffd1e87bc8196d0e705eac4bbc2cbd92bb9f592b621442f86b2103de3103d99 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa1c28f5653f98294f1f8b9e04200521345d0453 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a117d0424ce30aac21953f52b9d94f6e1931b49c833777895828ed0c0337a56 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0508ffb801091f2e750195323aecd913e465904 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:534f42aef234905804f4c512f481739a67880b1ad774d4143e5fe5ad1dc5118e +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b397e1cdc1b0c6474de8b1e0ae584543f7decfc3 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e44eea559656f9f8a3485efad43547e89314ea451af7f1792f6e8ea408d474 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c068ea24798c01d19924821b76621647ee651e4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e6ace02eb7255c8f6ec888df78cb02ec6f230f695d525002dd864958c4f552 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cc3738c86d17a34eb35f363e04d9879259b6692 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4221c9a05de4bf9dfe76502fc5d95f6401f6cb32fa775f1dbc2bd750d46b5f3 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6637d72633e06469ea6d53c2e738d948fd3c8d61 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db0baea687f66cef6dfb2ff3346fb17e3696e7545275bae845ac5e0c2289f96 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee238d0fbc8ac812a8d95a3f76cf43bfb9fb6ec6 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2023e6e3e4fe312fabf9a95926924dde3a8d1b834bfb2ff6609a489af9d73d98 +size 131963543 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c811eef2ef96bd1f5f7431dc2d5c566b1e5aba53 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a145cdfcd8c4de8aefc7c30918c8f1c081472ed1cf2626c79dacbfe54644cd +size 131963543 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e62f0724fa4b6849aba3aa4ebbfe2d6bdd4f2a9 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f0a0388dac254a5ca4114b2983573bad06086ca371e94b3cbdb73bc21d9cdf +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0acd652c35bcb744cd135b0b62319ab179180b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47c1d6b76ac2b46e667fb254d780040657427a72680ae88bb8e59cb9f19c8aaf +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45ff80a4b5c51497704dd3f41c13a47f3103a7ed --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e70091c1464435b07f11a2f85b0a7b6dc214d64805bb599f53466018bdd230 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f750ab593fdbcdb4eb0e996ae803b7573f85de2 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffd4b2d954ccac750a28603e779e18f8411e0ae696d546ed55cec6ea778f4b9e +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8e36491b53c857fdf5917f74163098f1d04c585 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae9796c6afe67b023f2d5fcf3cae0f44803a176b85bdc12845ceed33d3067908 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c198d1bc9f916bfaec299ea1d05222a9fb00bd8 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f358b2a98c2d70062550ec8cf3cda5042bb45cdb86b499b31cf5bd016f158b0 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36f9779cccb105319c12ff843a93d61112c3d43d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d91484a9f556a730fc5590599e33457f9d88c451be195d104d8289bac065230 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08838a4b57d93779019f0ce3404d150af95779ee --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bfe8d60751a6e45499e61dff850508c0068941dcce2cb5f26cfd59a4795b53e +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9b651193fe87deed1e207075489b0a971452d2 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2db82b44b2e1693dd17449e671516daf6e8d8d31d1545fab2c3b3158651aa57 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97016d8e1c85795571800c0903b000210bde9065 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e3e1645834145624e89457f26ec4be093b8fa6dfeb0b1bb8e72539aa1a5f027 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c41e681b37511994e99696002508f24bcde2f4ba --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97c52ff949d2792c12591375446907af2fb4bebb5199bcd69e69fd1069dd6db +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ebebcb9327f188e0427bca76e30b3974ac6f235 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f3fc1b09d2872539ef95ce43fecb1a2de3fd8883d32ea8ccc21dd13f75f0229 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf1be405c6b80f2ffe93047deece29baac1a7ff1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb949cd3a2cda808f19463adf5cb8b4b9740363429293f3dea144b7f6705541 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..055f5c1b9ac97989950d857587cd94721bb2329d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e28f5185728e8c6bbb47eddee9355fd6dcb09b7585fc9b517fd61e5bbe6591c +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79d5b8a64af86061f265ceb63c21e4f6607835ba --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080526058bb69eb3dc8674e257f156e8461c9a5d0150b024ffb3dd6bf79a4d82 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06e9fe02eb1da0aabe235e2856c5fdff77cfc5db --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:148064dd3d85351c8e229717cd36e3fba32a3711afbcce2a93ac618aebda8654 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37a4412cbf682b5b761e6d209ef18acc81dd58c4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbc9c6a59dbbda5b46f265f2c671f8cfd9cf06087d2693854378a83a7e82a13 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..222c96db2056fdf82bd2d12730e8c41d1dc283ce --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f660420a6653fa3a54522c7bb927621913a075e5d61770bc99eb869051d32ad5 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19b5f511a834b62171d64c55fbe8a8a618feb3b6 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31038afdcb0958b08e44a5ffd2574db025742450d79b4dcb608f91612a739b6 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb17c39d1c8f8fc153d0cf06b7d0be49c04343ed --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ade0ee4a6c315d671fb960f0ec91e4f096bd60b8854a1f0b0a6380515e9764c +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..246922cc171ff91b22e74ed9271674dc62c591cb --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73bc60f43df978a62e66f01106542803439f319a37ec9764ee1208cef0eeeec +size 131963415 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..deb8a89c33ca21ab4514f82454196ab5d62f9145 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2adcbd2d2a0309f118d92128f434ee9160bec50e1c028154f40fec2512a14f3a +size 131963415 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..149f10667429a2a84f809acadc5ac9a9d3bbd0f3 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23b9415c53afff2a4b9c556dc9c6a679cbc7dcd2e9dcd2f0d6a6429e0a89fea +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcfdfc8b85f7baff00c4abf27d0be02601da072d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41448b745e64a93cde2b315daaea17c2af9a85d00ef785f3ed23fb99ca291e9d +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c482fc36d1034fcc427d53ea81dd6ba100eb9d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08f39b83810e9d747a6012bc8ea370874bbaa77a804b4aadf1cb4a3adf644c5 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..948a25b3473259972f3044bf1a7d141aabdb2191 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9c33627723cb67d73709a95ab8d5c467e17cf2b7e1d8371b5dc48f13841fb0 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2179b2525f371a019661056658114b56ede2947f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:280dd84d3ab2e944d2af98f938c3048a2c5823e4d630589d740ec46405aefe5e +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b598acc37dec7f710541da2be35c0a5e558ea0 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:273c42987bad6b79885fa6c42fcd100b304cfc90c6609fe0b738db9e6126117f +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b906ecf9577d36a931cbbf7e34bed9856fa68a16 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d394de74f6b581b92159d69e464337b5c4ebb91df8a9d719d85353ab97cf77f6 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c480d76460c96ba6b0c671bb664d5423d0ce5b5 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440b69872559808440d27308d0a1e122af2e07e88b742790619f137deb72128f +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1216e7afc2d6a167bd2d285ca28cf23fa5dd594 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2fa7bf61971c2a86b7966a26336c9b1cb33ad75427d685c7e5f87145f5f10ff +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..896f20420d171fe94b965e94ad842e88500aa4e4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c020c386e05c3a25367f7263bb59843705f99de5b658564fb704f3d5f3fc6ac6 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c869bbdd6f098f4cdbc1d84a0394e85f5bd8f2 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4b6297d89239646e1000f0bc1aec7a8973faab0da6c7256fd190d7c529e697 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f238d007fa6a8af9d7e2cb9017aa613c10e467f7 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd493e4f976571b6c433b7d835bba4095bb4cc0b72020b383acd5b0db1dc1fa4 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad0e2bcae6f361be0bce60354f767eae4cb3b2c --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac3eda011001e3d445d5ef831fd15dcdeb69af35349fa3cc016ba72792031951 +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f81eb370ccbbdf544247a9b0208d5c98b5c93724 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32be01b63d3c38236bba41ebdec756b708d6db76ccbfdea01ed294dce4ea87d3 +size 131963682 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7e460c640609a35aa81006d4e9d345c48da0429 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2025c4e581f6ff38e622035b5ad8e6b6a7b948842e73951af5d9e2fb903225c0 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd77015d3955ff1768d1c1e8c52eb5d177147b12 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac24419528e8790685bdd4df7163df0c0bc9ce9f315a50180bcd30d9b611bf5 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..738dfac85d7f9798d10bd1c4f65e229f33b35c5a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6ae61a90b3bad9937774fcb22713162215734931ed85d5761cc99c3adfbd83 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6398033550681898128fe7262de79e282277ed5d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36a19461238390d14f76b417fa529aa45e6247a9946d0b7cf459c4aa8088447 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ae502032c17bf101cecf61edb63503a7b265e03 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26ecadd873a42972da81a316850e8f8124947482dc12f7df6294807d11f38f2 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0c29ee5fbd8b5fec85cce28c4ca42f101efa563 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbee0b7f9e08b1eca98cfadd56b936eaab1005b6a08b38c43ed593f63da97d5a +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a59086dfc1f03b8c4d0d20f36a8c009c857cb1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b694e87fd22d75b10446007143bf5fc757040f17d82928d411a3dfa0d53e112 +size 131963543 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39e508953eea8c5b178388249d7f2a2d66260ca0 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d569c786809e81d6711f8c0f2826e61e0f4fc4b571185980442cf0f58939480 +size 131963543 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f34d35263adf04df96367889df72b6da7bf1499 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a77a63a6a3aa98156ce4fcb5d5f2601f9290605119413fbc88a502765fac738 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7e95dec20ac2f7a3e243e5fc2afcb3cb1bb46c2 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08763b58013cb90fe5e29644b87fa6756c35a1917c3d59fc6a1eb5d42aa72eae +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8adf767a62bb53c3b53744e09585e9d095836aaf --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:866d82f87aa62dd587770ec8320c79c4ba9a01b3a8d0c3e7a2302efb5d9ab0ad +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3771e3a3f03495eab9b18f3ce35614cf723e7935 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5fbe88840a0a5f13244340d92cd4b992f0c5fbe551a20a774f1d6fb37b249a2 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ff7db329c4058f7c35edab677866df2412c4a5 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3063757421672a9395f5336ad94c7fb942719436f4b2cdd0393106aa24ca2722 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d20f33261ba1ca0349edc9eb3655a69fb1ad5ec --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967012b12e11d9376807090bfa45a224c34280c11ccc8f83f1c51c179f122bc7 +size 131963426 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..999194cd292445c57cdac7c05a311ddabe80c29f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b3bfa0baa7b36be293214ca960b6a6c0dd488f0182189814acf87969788c6b +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59fcc861a31f8e3c39f5a2d497049848c24225b5 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b140e4588788af9a758e524c8ca47ef80e9de4a435619d0ac0c8385192d49486 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82c7d82625d93ecfb11b881c996daaac97dd2a95 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33117bcad865583046d6518904ee41036e7c1a892dca8389826fae455bd78b1e +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b98d2dc77284842aa57a82550ba67ff2ef7d6e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d0e1e3dc76b491168aa9be968b85fcf023271473e783a30980a2ca31219af8 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87c4f37ee1f894aaefa330b16b3d5d4aad25660e --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97e3e92aa6e644195904d856d45d969530949b433978b1f45959181ed09b0cb4 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df2809b52c546402fd7d6cd91b7b28077da9fc25 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2cd67de2d77117cbadfdd94230ba94a09ae4091e1415faba066e893898930d +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6851b88a72bd36997f95c74f177551e571672a1a --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb3e5ea373fa3f4cdb2420088b411604fdf62a465efcbfcf29ca0b56da5b7ee +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..853ee19104ee8c6ed8f4d94d8db9c177153c3e1f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0abb1be28c5cc2dd773286871b2cdcdf0c6e1b148cae16cadff0c98cb703a3a6 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4daef96ef3f5f6de8036f77dd290e8c82b981669 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f69360c1b01082d128dfdf839c30371fc88989d782fdee1b5ff0ce960c5329 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7bcfe7fdff3de2f75c52d870091267c6d895372 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51049c8a3ee624b676dc6fd51186b8db1e73fab6a4b3413f0aee505d53f094b +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d885fbdbce606fe285323e473c864576aeafdabd --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd59f99ca8826cf53430c8fbd7f686f6668b4b1b19c8f85120f1a3e74e74f54 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b5d57ea846ff7cec66f8f76d9ed03aafe47959 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b89fa9a19b0fe209c492ad9ab1604cd03b8bc673a9d684c78c718357534deaf +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca3ba1c73455c497f411ece1772d116623001a87 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364dee987372940574c26d87e6f71321837b9caac8d375392f82f59dd2d394a9 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17d71dde68920997d12be07ee37af5abec478012 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6877490364d3a771f71ef7e5f306ff3bdcb9f2fb3d0051fa4e0280073e3f4d5 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4babb52f1d53fa11627238817946f786e82df05 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b946fbeed806a4927fb6e6fd887bc71d4d6e482af9a75fcaefd8081e713e177 +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dbd267967cf3298479dca361cce9a0aa798b935 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618b7d3033cfdbcee1c0d2e5d65272f4f16d8d5ee6edd2656d779229a5ac701f +size 131963479 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da9b2459584ad3f434aabbd0edc44b433efa7e5 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e302131c6d30ef2a6b87d8cdc9b115372c8921ed361aeed243f68cc098ab012 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b7bdbf9359171f0f77c17134fe577aef4d618f4 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1321af2235c3b726b67d968642879e21b53574b84a4306c73afc51a84967802d +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9116ef24a037f4c3d4827e9f06ca2fe2ae8cc32b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7431dd0f1866dee8dddfdaff231cdce8e3aa3e471f1fc48ddd1e9f3ffa2bec54 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb898438fa66009b037e325614c2ce9b1b796382 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f7b9a06736fce49656f38f997708758e7a8a60b54db298a4840abefc893f7d +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..471e945a94bbaac0ca1e28c320259b90472c2b16 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f9f0b730d5ee1db27a4a31b6e80750d6ae55fe9140677ffd5f0a894498fbdc +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d333b1ea3f1cef549ba5cdf4f7b28ac8053911a1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7e3123b824ebe812fd07aa066ee0b89d14126dc874dd569e3c830b0fabe64d +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce6c856b7264d983b90918dcb20f26dbc13cd8d7 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b279189a0f57207e8ac4a69aee9e4448eaeac97ecaa080565801a932dfef5a +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a8356f7ee00b6f7e75713c3a34b661fe61f828 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4ae68c83f4214187bf557179b1bdf79c361332adf8996789331eacabf30664 +size 131963618 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c57d76fd6dd4f79907ddbc608ec580b1e41242b --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6503619d5599b846e737927dc26527e9e392119ae5378a248ac8806573c6b787 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e8da6c07ffb74c56d71f8dea3b4e801f22d70f --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:216de80780e11fcc13579d6bbffd27f72e8f039bb428c6f97e1085f15c74eede +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..084ed81d77f43ea44773ffbbe713028d9d36af45 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a4480b8b1721b6d87edbd0cc7c56b8a76a9161972bc201d42e7ef860fa83c54 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f08adc9759848262350da72ec54ff62ba76acc --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f53b54915eaf682f82b7ebad4ccc47af49ec7caa05d7a0a1bb2409448c1dd07 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2703f96984f0c9701dd87569896a15f342bdc952 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24569a18bd7c2313383bdf0df8d0535aed3b368920a69d618050346f55d30063 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6651eb8ecc81fa40693ad3daa1b5ad9d5c261974 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304d0f56fc14a28326e58a00e49739738bd4e4b948062b9b359e12e0db52cc15 +size 131963490 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b46856bffff96b30c9ddd397a9ed24425127924 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee00d92f4ba2b7bc6128a3ecf194abd128fe720f0ead9963c5a99ae22cb52f8 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b6ff3c6d041bde7272caa35996727a616b543d --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0becd5b42b903da887b552e83a09e9925f97def043855449b3158c81b12072e5 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7ecd1687affbb560e1d09107d56d25676a037a1 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9fd6c58ca34fae816b07c8519519a0b1a6bfa1d9063a66f4d8e1fa997883c74 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..880217ecc5cca6c96f5f3c4e66f6dc9ac0876ff6 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1769c45b059d2d8dbda7b0bb3c43f9961342cffb1a8be19700af768019f99242 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2752594fa343c45f4049631e745d411f5b8107c --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6536b7e9a3353026064dad776fbcbaec91108e729cab31262c0b95d38434e67 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbcc180c65143746489414c4e26ba97bf4fa8f63 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9357aa1ab1a0033a9dec107240190ac28095aa7fbbf22c5c67fbf8bdc01583 +size 131963554 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4098ff06e879bc509427e0b57a785ca902bce4eb --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:705bf534bf0a87250d950c3c31c7a5ceac7526b1739449377fd07007a3654426 +size 131963543 diff --git a/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9caa9982333101b439f4b076c413ec03987fcd16 --- /dev/null +++ b/perplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e4d6e50d1ac9c8097fb1a10ad6bdf1ee1c7e6607a611dc5883cc5634551ec5f +size 131963543 diff --git a/perplexity25/global_step80108/layer_01-model_00-model_states.pt b/perplexity25/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccd4119393d0fb929d54e32d6a4bd90f4127393a --- /dev/null +++ b/perplexity25/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49c57a59363ca227926039fd33f2063473b284b8cc41bd8787afce3576cbf0f7 +size 139592963 diff --git a/perplexity25/global_step80108/layer_01-model_01-model_states.pt b/perplexity25/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9f985c1ea2c5fc3a7b2573edb0f1539e28965fb --- /dev/null +++ b/perplexity25/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c95c345b3c724c120ca3743eafa430f7ab15357227e97360865f92d39df823 +size 139592963 diff --git a/perplexity25/global_step80108/layer_03-model_00-model_states.pt b/perplexity25/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97667b66cca5fc0a2a57245cbbafdbeff61a89ef --- /dev/null +++ b/perplexity25/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00666d317f44d0b68f8607b2512a39f8dda52239c075433a071c15d68f515a4 +size 78696195 diff --git a/perplexity25/global_step80108/layer_03-model_01-model_states.pt b/perplexity25/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bd5cde6ba780b418486c16fe4ae9b14c19f1582 --- /dev/null +++ b/perplexity25/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19417fdccc3e88df3f929c27a2ad80b01cbc6a06b2b009d5d595ab2e3a3655cf +size 78696195 diff --git a/perplexity25/global_step80108/layer_04-model_00-model_states.pt b/perplexity25/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9034cdd188559279d69df6652ac9604dde7a2729 --- /dev/null +++ b/perplexity25/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3605abb875836cc909c0ceb5a6c4cc86b956026ef7a103ff82b9ca3a1b0b3d0 +size 78696195 diff --git a/perplexity25/global_step80108/layer_04-model_01-model_states.pt b/perplexity25/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a652c8bb3a0cee27ea97d2c25fecd55b2fa1db85 --- /dev/null +++ b/perplexity25/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e67236f5a3bdf8b2939d62e5e9dbbe8621ac7810757bd512bb68babee30700c +size 78696195 diff --git a/perplexity25/global_step80108/layer_05-model_00-model_states.pt b/perplexity25/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4a9b5d40ec48645bda61ea74ae5ad002dd0c6ed --- /dev/null +++ b/perplexity25/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0ad8d8226680a3e959303f6cb3f0db6370318dab7057dd40ef95cd79adbd35 +size 78696195 diff --git a/perplexity25/global_step80108/layer_05-model_01-model_states.pt b/perplexity25/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad79c3cb199791a1c8c25884e8ca1660238a4ee --- /dev/null +++ b/perplexity25/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef09861d191ce185cb3be9eed4da0039e6e5d71b6ab68aec3b7ac30e2f45d0a +size 78696195 diff --git a/perplexity25/global_step80108/layer_06-model_00-model_states.pt b/perplexity25/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea6b15084b645fe5edc8ea0bb01309cf42321bdb --- /dev/null +++ b/perplexity25/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61e5961b430bfa772d012f5c6ba1b2ea224bf960ea71c68890feb5e5f4d011f +size 78696195 diff --git a/perplexity25/global_step80108/layer_06-model_01-model_states.pt b/perplexity25/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d1dd6ea3bb18e7f43af9d42db8cb11f001160d6 --- /dev/null +++ b/perplexity25/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925886874b27b779bf10db0fe9a7bc178f1cdacbdb256d8aa93a55723e526608 +size 78696195 diff --git a/perplexity25/global_step80108/layer_07-model_00-model_states.pt b/perplexity25/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66db9ffd1b03a7c9c955a4dac89e1942c99cab3a --- /dev/null +++ b/perplexity25/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f82f2934f83a703fed79e1215bfb929c5a2beb0c3874bc3f639b3cf2d358a92a +size 78696195 diff --git a/perplexity25/global_step80108/layer_07-model_01-model_states.pt b/perplexity25/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..255281a120a55118ea6734b1d1811b3bd59aef0f --- /dev/null +++ b/perplexity25/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae57dba75564e400b5e2eaea99774892258e2f606fdda9b123652af3d8b28888 +size 78696195 diff --git a/perplexity25/global_step80108/layer_08-model_00-model_states.pt b/perplexity25/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeef25a322118794aca8828c34e9a12b8c614a03 --- /dev/null +++ b/perplexity25/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657e072a11786ec583a91c61acc4ad72aeaa1a4949bf4b426d1be09eeb87684a +size 78696195 diff --git a/perplexity25/global_step80108/layer_08-model_01-model_states.pt b/perplexity25/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..854af888526414d49bf683acc66cc121d9cc5766 --- /dev/null +++ b/perplexity25/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa61ad569c990d20b7c3999d4215e9bfda99a87d6a0869e64fd1be89bfee0b4d +size 78696195 diff --git a/perplexity25/global_step80108/layer_09-model_00-model_states.pt b/perplexity25/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a61e6fbd98750d5445e2f84cfda277009a6fe64 --- /dev/null +++ b/perplexity25/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10737466536f51811bab5c4382189be291133bdd482dbea12c131781df923677 +size 78696195 diff --git a/perplexity25/global_step80108/layer_09-model_01-model_states.pt b/perplexity25/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25e19bfc1ea33f30d72b63d48a049050c9f4ca3e --- /dev/null +++ b/perplexity25/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44c0b47961dacc1bd735da828f6842f9ed60bc9f4887da258ae0acc45c0d46b +size 78696195 diff --git a/perplexity25/global_step80108/layer_10-model_00-model_states.pt b/perplexity25/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f13dcf1401946f446d3044d5a8ba5a067aa56b7 --- /dev/null +++ b/perplexity25/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c46b80c2b2e90944290336c8635204dc3c95457a576c86ebed2f96ad8c4f3ee +size 78696195 diff --git a/perplexity25/global_step80108/layer_10-model_01-model_states.pt b/perplexity25/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e1369386fc429206ac6fdbb1de0a5b917d00db6 --- /dev/null +++ b/perplexity25/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e4dc9f2cda10effdcf3e64614e1b8e24881de24e6f6951136c41ad7741e0fc +size 78696195 diff --git a/perplexity25/global_step80108/layer_11-model_00-model_states.pt b/perplexity25/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12abdcc7485bd09e7ce520e93554bfdcc74b1efc --- /dev/null +++ b/perplexity25/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368819880bc24647af3a6af594c56dbcfbf986d09ee4847914fa0181cb02a41c +size 78696195 diff --git a/perplexity25/global_step80108/layer_11-model_01-model_states.pt b/perplexity25/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bea9a1eaffa35d8c7e9b1326d03b8cbe41a661d --- /dev/null +++ b/perplexity25/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c38064e86c9148e3de2ff0e9492ad8fb743fcb0db503eed5966d67191cc9855 +size 78696195 diff --git a/perplexity25/global_step80108/layer_12-model_00-model_states.pt b/perplexity25/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca158ae88a710771fe69253e3cefc6f61b999798 --- /dev/null +++ b/perplexity25/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a30761afbf29ce98bed2482e00727da6b4a6cbc7a9526e9a69d1ba2c1ce209 +size 78696195 diff --git a/perplexity25/global_step80108/layer_12-model_01-model_states.pt b/perplexity25/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbc843edbc1077c43582fdc20ced3dcac0a0905f --- /dev/null +++ b/perplexity25/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d413f14c05008ccec297eec7fc38ae1716a7d662080f250a77f15fe18ce090 +size 78696195 diff --git a/perplexity25/global_step80108/layer_13-model_00-model_states.pt b/perplexity25/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06c179c3a4adb3c1bb8b2cda7efc7e44a52fc8fd --- /dev/null +++ b/perplexity25/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d6cda7b90781c3bb741d97413b09503e23e2f9376a909e520133a844d287ff +size 78696195 diff --git a/perplexity25/global_step80108/layer_13-model_01-model_states.pt b/perplexity25/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d22958ce4dd9221f07ffb3de0a8ce5d99943500 --- /dev/null +++ b/perplexity25/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c7a123088eac11be88a0991a600c00ed66600f0402e3fabdb676ae083f73a95 +size 78696195 diff --git a/perplexity25/global_step80108/layer_14-model_00-model_states.pt b/perplexity25/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2f4daee83efaba92bb4ec2ef7109dcce5d49f54 --- /dev/null +++ b/perplexity25/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968a930d9fdd0baa3837a099e8f0acf15f413e6d61b10b4838d91e4f7d335a50 +size 78696195 diff --git a/perplexity25/global_step80108/layer_14-model_01-model_states.pt b/perplexity25/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73d2862c8282d3389a1c6235f8712bc09d25839c --- /dev/null +++ b/perplexity25/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a1deaab3d7249874d48e8d3ab2b9b1ce135ee6486eef95b426d6dc7e3e3e78 +size 78696195 diff --git a/perplexity25/global_step80108/layer_15-model_00-model_states.pt b/perplexity25/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4da50541735317758902cda582f1630a9ef907c9 --- /dev/null +++ b/perplexity25/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2dd92f91390df075dd45567de93207571991690df6f032971a8972dd94af2c3 +size 78696195 diff --git a/perplexity25/global_step80108/layer_15-model_01-model_states.pt b/perplexity25/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f5bfd55219ec43331c0c4d101e01514c776f7fe --- /dev/null +++ b/perplexity25/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d0032b02196a708f84168923d598d74a296fc425cbb2f3fc908cbcb29cf0a0 +size 78696195 diff --git a/perplexity25/global_step80108/layer_16-model_00-model_states.pt b/perplexity25/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..941c782b91a199ad364158566c395314b0edbebf --- /dev/null +++ b/perplexity25/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8300a1f560ff13a656adb2f45543971635018d1d964a6ef3d2a312f6f527d739 +size 78696195 diff --git a/perplexity25/global_step80108/layer_16-model_01-model_states.pt b/perplexity25/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fd06ee8b57c512e450139514a59acbc749e4bad --- /dev/null +++ b/perplexity25/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8190a95a57805a278b3f519a425d394faf8821f8a80fb01dda06e3f7f4a43df5 +size 78696195 diff --git a/perplexity25/global_step80108/layer_17-model_00-model_states.pt b/perplexity25/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7911b579a9bf2487bc74d6e5a0b25babac4e130 --- /dev/null +++ b/perplexity25/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf6f5debd2fdf64807b807e35d9d7a10f3e17715bf6fed509f9ed6250278d7c +size 78696195 diff --git a/perplexity25/global_step80108/layer_17-model_01-model_states.pt b/perplexity25/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e563ff84fee57409caac95b2bdc54de34858c8d9 --- /dev/null +++ b/perplexity25/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c7e5f84625dccf4cc8637639f9082a9d1c19676fdc54c8c79d47c0d02873e9 +size 78696195 diff --git a/perplexity25/global_step80108/layer_18-model_00-model_states.pt b/perplexity25/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f326d25789f1c1def1e1b1631584e02c500f11f --- /dev/null +++ b/perplexity25/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb40b1cb78a04adea01f55b3294edf2453fdce8dde0fd1f56d3bb8bf12e53303 +size 78696195 diff --git a/perplexity25/global_step80108/layer_18-model_01-model_states.pt b/perplexity25/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3caa2e5c65f4bee84ef3e4b7859ad290e582f2c7 --- /dev/null +++ b/perplexity25/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07658d0d335ca03f4fd465bade251d8c8cc8d01aaf2456dc5da1726bb565311d +size 78696195 diff --git a/perplexity25/global_step80108/layer_19-model_00-model_states.pt b/perplexity25/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c9b679eb38834769f143369228b5e576d0104f5 --- /dev/null +++ b/perplexity25/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b269d035a347cb7936f5758d9b8a14de86690be897adbf2b4d006f18d170e1f +size 78696195 diff --git a/perplexity25/global_step80108/layer_19-model_01-model_states.pt b/perplexity25/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d07b63e969b4fa1ce3d178714b601ea843de341a --- /dev/null +++ b/perplexity25/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dcc335b775e5b2ea1cca3001ba1eace3e2fb5a91bec045177afa5e9e2d4668 +size 78696195 diff --git a/perplexity25/global_step80108/layer_20-model_00-model_states.pt b/perplexity25/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff310b4a407f443f9c0a17c797cb24671b7d15a --- /dev/null +++ b/perplexity25/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d8d4b8481316ba3d9cfc7ba57f95a3cbc85fa1a6a56810889f3febabaddcf4b +size 78696195 diff --git a/perplexity25/global_step80108/layer_20-model_01-model_states.pt b/perplexity25/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..929a4e5e9f1b5492c545bfe695af87601edef16f --- /dev/null +++ b/perplexity25/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ae80c3abd6d11cd4524f064a3d88a78146ef6818d906b85e6620b28acdfe91d +size 78696195 diff --git a/perplexity25/global_step80108/layer_21-model_00-model_states.pt b/perplexity25/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c657bc98b37d55bc733a98380b7d2f5f380ada5 --- /dev/null +++ b/perplexity25/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec236ea83e78cacd4f86d80b5c58d009d0a950da68273c24f1dcc48a04eb69a +size 78696195 diff --git a/perplexity25/global_step80108/layer_21-model_01-model_states.pt b/perplexity25/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff8da0e208ab350f0de7176b01dea5b89a1bf7ce --- /dev/null +++ b/perplexity25/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6c3d782f9cac5d0ec8814b24f31b59a5191391d4b50e5550137d0e3f402289 +size 78696195 diff --git a/perplexity25/global_step80108/layer_22-model_00-model_states.pt b/perplexity25/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb6c91fa7ff444f4e4d81a6b96e4a377211ae52b --- /dev/null +++ b/perplexity25/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80bc0787038e6498576832dd7ed0dc8ef94c4d5011de7e7c5195bd077bde2dca +size 78696195 diff --git a/perplexity25/global_step80108/layer_22-model_01-model_states.pt b/perplexity25/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f4278e28881896ac4c2bcaf6948137cd62e82e7 --- /dev/null +++ b/perplexity25/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de52e6dc9d2100acbfddfb1967db8c709e440d7cf8095bf3eb09af76ecf00eb4 +size 78696195 diff --git a/perplexity25/global_step80108/layer_23-model_00-model_states.pt b/perplexity25/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23c3717fb3267065928d1fac641d124b8b79eb87 --- /dev/null +++ b/perplexity25/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa37268853dab5e006669a7a85a6246ddba0b8432a287f3a159073c2f7c03c2 +size 78696195 diff --git a/perplexity25/global_step80108/layer_23-model_01-model_states.pt b/perplexity25/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d190bf160a9466910f8d91403e4414ac9c64aba --- /dev/null +++ b/perplexity25/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74095f564806866b6069b4744292ae5f8ce998d90b1b03a2dd340d7bb1347d57 +size 78696195 diff --git a/perplexity25/global_step80108/layer_24-model_00-model_states.pt b/perplexity25/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ad590fbc20cb356304b4949440dcf82f66f2f23 --- /dev/null +++ b/perplexity25/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d295f6ac9b159596e9d07470fd0f1cdcc6a0ada5931189865366f76a17bf0e +size 78696195 diff --git a/perplexity25/global_step80108/layer_24-model_01-model_states.pt b/perplexity25/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abc1f6282cd6639e73bd268a24cae3cf8a79374e --- /dev/null +++ b/perplexity25/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f2f651e03b92ff5a8d8da8036cbb3ccd37e79734b95cb3ba032a3da93ddcc1 +size 78696195 diff --git a/perplexity25/global_step80108/layer_25-model_00-model_states.pt b/perplexity25/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30623d322cd326c44de55415dd6b3a7270d1b7d5 --- /dev/null +++ b/perplexity25/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fa2a00d3540beb6554366885909aed6aaaa791bc872429d83bff03306532bc +size 78696195 diff --git a/perplexity25/global_step80108/layer_25-model_01-model_states.pt b/perplexity25/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9330f8210c45e2d27b90c349a077a517132d5fd --- /dev/null +++ b/perplexity25/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b1a86d6f6f0bb6058b39f0ee6ece765c7ec03ffddb0bb49ea1940c2a43cf7b9 +size 78696195 diff --git a/perplexity25/global_step80108/layer_26-model_00-model_states.pt b/perplexity25/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c34ddfa84a264d0bc1a335b6847bc4f64cc14af --- /dev/null +++ b/perplexity25/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc62cf22b3bf3f48662c8cbad4f8a0681ae015dd5846cfd58ec9bd93d1d2c833 +size 78696195 diff --git a/perplexity25/global_step80108/layer_26-model_01-model_states.pt b/perplexity25/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f9611f77145cc8a0c6ed33f4caf08833e7cb3e4 --- /dev/null +++ b/perplexity25/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c94f4f738b1c3d0c635141509a55f09041eb61ceb132494a899058880fb382a +size 78696195 diff --git a/perplexity25/global_step80108/layer_27-model_00-model_states.pt b/perplexity25/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2762596454a4a86d5e7be4d9d234ad253f627c8b --- /dev/null +++ b/perplexity25/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3cdc38918abb1147495250ef4cb858f3fc968150dd3b375ac95f6a1f53f9643 +size 78696195 diff --git a/perplexity25/global_step80108/layer_27-model_01-model_states.pt b/perplexity25/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b9e7df2fbccab853c66c073583cc31a0d5f72ab --- /dev/null +++ b/perplexity25/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e3c7a2ed1c8066e3a128faa759d9026c714f6cb622316c1a4afabf51e8040f2 +size 78696195 diff --git a/perplexity25/global_step80108/layer_28-model_00-model_states.pt b/perplexity25/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0acb474fbb0215a4519f1a9e475108b8f105ee2 --- /dev/null +++ b/perplexity25/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac45cd37cddd48c8533381f33b36fdb759bcdfd1ab895619d2b99d2235ac5d7 +size 78696195 diff --git a/perplexity25/global_step80108/layer_28-model_01-model_states.pt b/perplexity25/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..134b9932507a3961c72692281d72555b26afc6c9 --- /dev/null +++ b/perplexity25/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98e4ca06fec7b3d4d95192089893c80c22bee5d349afcc3ea643ecccf9de791 +size 78696195 diff --git a/perplexity25/global_step80108/layer_29-model_00-model_states.pt b/perplexity25/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef42b05711fc4341684b485223d353a5e343340a --- /dev/null +++ b/perplexity25/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6baebaf9e81593699c7f643ea88013baac347916375e2371e3ef558c2e1141 +size 78696195 diff --git a/perplexity25/global_step80108/layer_29-model_01-model_states.pt b/perplexity25/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8716b5f9d410c17bcc1ca3b71a27a448ffe2c939 --- /dev/null +++ b/perplexity25/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a466458545fa8cdf98ae1bda2c786fcc633ab1f8c283474ae3fcb5ce02fe23 +size 78696195 diff --git a/perplexity25/global_step80108/layer_30-model_00-model_states.pt b/perplexity25/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0447ee6c7d02299ee9da09e58e58148a96f457d8 --- /dev/null +++ b/perplexity25/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1394bd57f87a5c7abacc24ffe34ceba6433c0f93a1c3cf8b64148a54817d38b1 +size 78696195 diff --git a/perplexity25/global_step80108/layer_30-model_01-model_states.pt b/perplexity25/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe558fceab1111b61634c8e814194d54cdcfd974 --- /dev/null +++ b/perplexity25/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e84625fa1340140fedce60d603bc18d3cb51b4f1bfd872ed2224ffb8a7ec56 +size 78696195 diff --git a/perplexity25/global_step80108/layer_31-model_00-model_states.pt b/perplexity25/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c50bbfe54088d4aa9a996e35d9d8995a113d28f6 --- /dev/null +++ b/perplexity25/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e5c77a4911db4d9c8d4ef5d800b443b27f9fd3c41213c1188c96ade016c39a +size 78696195 diff --git a/perplexity25/global_step80108/layer_31-model_01-model_states.pt b/perplexity25/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9712e953e6c7304c9418cd6c6e11d51569b20875 --- /dev/null +++ b/perplexity25/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd324ac249345dd93b17c440021c7e84fba3a6e827f49bd51af14f705f84f74 +size 78696195 diff --git a/perplexity25/global_step80108/layer_32-model_00-model_states.pt b/perplexity25/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b8a44c6f8aeaa3955be24adf56c68bec53c19ab --- /dev/null +++ b/perplexity25/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0705c0124823726da9ec9d7c4a21a560d74ce7311a5d64e0dd8397c3645a3278 +size 78696195 diff --git a/perplexity25/global_step80108/layer_32-model_01-model_states.pt b/perplexity25/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d098e5c21a36fc85fef743aad3fd993079dfef78 --- /dev/null +++ b/perplexity25/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd360f16e4f83a3b16d9e58907f0f63c70c4c6772aa2e1eb5091752f21600d1b +size 78696195 diff --git a/perplexity25/global_step80108/layer_33-model_00-model_states.pt b/perplexity25/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad32a75c8a562287a569ce940c0601a6a625fa94 --- /dev/null +++ b/perplexity25/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3faf57fff5a61bbf0470a1f7e97a4dfec61704e49bcc899c8532351e024e7756 +size 78696195 diff --git a/perplexity25/global_step80108/layer_33-model_01-model_states.pt b/perplexity25/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefd67763fc039a3581ae3978f73af1dbf9cc42f --- /dev/null +++ b/perplexity25/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7351750f2561107d6dcfd3223ea72676c53f7e958214ec53858b1431581526f2 +size 78696195 diff --git a/perplexity25/global_step80108/layer_34-model_00-model_states.pt b/perplexity25/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0c6590a67eb7a071c8f6d6176175462c7409877 --- /dev/null +++ b/perplexity25/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a0b3f69e0955a8a342497dcc8672bab7f6b3319c6a9c2ef436315132f5e9bb +size 78696195 diff --git a/perplexity25/global_step80108/layer_34-model_01-model_states.pt b/perplexity25/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9c155afdff7bb45f5081ad21d0dc838425b826 --- /dev/null +++ b/perplexity25/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a53da4269f01bf9e2c41328a3bde3fa826ce2ab07b64526309b47ee942a06686 +size 78696195 diff --git a/perplexity25/global_step80108/layer_35-model_00-model_states.pt b/perplexity25/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40f1486135c7abd6352fc4b1b320add72baeefa2 --- /dev/null +++ b/perplexity25/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b46e84fb8823a82cefa94cada92cd7f801a2a8acd66903d1a447057cb63377f +size 78696195 diff --git a/perplexity25/global_step80108/layer_35-model_01-model_states.pt b/perplexity25/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03443baaf98fda48c08ee2edf14572b39389db4c --- /dev/null +++ b/perplexity25/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6b8c892cd92257deaaf97fe19e86c2685ea912d6bf766f08c20489250115516 +size 78696195 diff --git a/perplexity25/global_step80108/layer_36-model_00-model_states.pt b/perplexity25/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4efa86f914e0fd78712cb71ab7505ca17ee7719b --- /dev/null +++ b/perplexity25/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9446f1ed07fd37cd360fcadb0b1f39e0b40e3aa9536dcbb34adbce068092b79 +size 78696195 diff --git a/perplexity25/global_step80108/layer_36-model_01-model_states.pt b/perplexity25/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea05cb91970fc84b4fd84adb7eeeb2268811b5ab --- /dev/null +++ b/perplexity25/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56f693e45be46e13ec044d376cbc37db27e60c9977eecb1aa22a4db544e5541b +size 78696195 diff --git a/perplexity25/global_step80108/layer_38-model_00-model_states.pt b/perplexity25/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb22f75d8a574a92b76791ecfdd26eb6c1507fd0 --- /dev/null +++ b/perplexity25/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78869a56fc80c150a40eeb135b0d86921c281ae6a5dbf1efb7dc5242459d34d8 +size 11459 diff --git a/perplexity25/global_step80108/layer_38-model_01-model_states.pt b/perplexity25/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9947d305a9ae42d9ba5a5139eae957c7f0a65cae --- /dev/null +++ b/perplexity25/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d60e7abdf675ab34fd4d3233b6af21b0acc619c681601209273872f18edb6a +size 11459 diff --git a/perplexity25/global_step80108/mp_rank_00_model_states.pt b/perplexity25/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..947760f5aa54b876e8a914ad0ce830883fc5c7ba --- /dev/null +++ b/perplexity25/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7117a0bb2d6b82b4c06d9abeb3da2a807bf51ff1855d8a2c2c3325dc849432 +size 49971 diff --git a/perplexity25/global_step80108/mp_rank_01_model_states.pt b/perplexity25/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09f38bcba2f08ea3be5dc0bd0a67aab54146f9be --- /dev/null +++ b/perplexity25/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de44a95b2b2f22ba5e191ae2e68b6123906731036c21f26c3aab6591360149d6 +size 49971 diff --git a/transformers/config.json b/perplexity25/transformers/config.json similarity index 100% rename from transformers/config.json rename to perplexity25/transformers/config.json diff --git a/perplexity25/transformers/pytorch_model.bin b/perplexity25/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ad4777935ba76ee14f4ec523d1c09b730f2b1bd --- /dev/null +++ b/perplexity25/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ac55f0258e990222162bdd779b6ae070dc193a76f7ca8934c5a87568f3f694 +size 5904072781 diff --git a/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/agg.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json diff --git a/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json b/perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json similarity index 100% rename from evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json rename to perplexity2575/evaluation/generation/agg.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json diff --git a/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl b/perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl similarity index 100% rename from evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl rename to perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl diff --git a/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl b/perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl similarity index 100% rename from evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl rename to perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl diff --git a/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl b/perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl similarity index 100% rename from evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl rename to perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl diff --git a/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl b/perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl similarity index 100% rename from evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl rename to perplexity2575/evaluation/generation/examples.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.jsonl diff --git a/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.jsonl b/perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.jsonl similarity index 100% rename from evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.jsonl rename to perplexity2575/evaluation/generation/examples.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.jsonl diff --git a/evaluation/generation/merged.csv b/perplexity2575/evaluation/generation/merged.csv similarity index 100% rename from evaluation/generation/merged.csv rename to perplexity2575/evaluation/generation/merged.csv diff --git a/evaluation/generation/merged.json b/perplexity2575/evaluation/generation/merged.json similarity index 100% rename from evaluation/generation/merged.json rename to perplexity2575/evaluation/generation/merged.json diff --git a/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-web_nlg_en.templates=PALM_prompt.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=GEM-wiki_lingua_en.templates=tldr_en.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=e2e_nlg_cleaned.templates=generate_text_restaurant.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json b/perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json similarity index 100% rename from evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json rename to perplexity2575/evaluation/generation/slim.limited=3000.model=lm1-4b2-84b-c4-perplexity.task=gem_xsum.templates=article_DOC_summary.fewshot=5.batchsize=16.seed=1234.timestamp=2023-01-26T10:29:52.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_0.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_1.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_2.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_3.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_4.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-web_nlg_en_PALM_prompt_5.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_0.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_1.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_2.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_3.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_4.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_GEM-wiki_lingua_en_tldr_en_5.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_0.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_1.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_2.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_3.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_4.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_e2e_nlg_cleaned_generate_text_restaurant_5.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_0.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_1.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_2.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_3.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_4.json diff --git a/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json b/perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json similarity index 100% rename from evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json rename to perplexity2575/evaluation/generation/slim.lm1-4b2-84b-c4-perplexity_gem_xsum_article_DOC_summary_5.json diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.csv b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.csv similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.csv rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.csv diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.json b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.json similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.json rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_0.json diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.csv b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.csv similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.csv rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.csv diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.json b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.json similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.json rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_1.json diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.csv b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.csv similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.csv rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.csv diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.json b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.json similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.json rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_2.json diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.csv b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.csv similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.csv rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.csv diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.json b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.json similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.json rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_3.json diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.csv b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.csv similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.csv rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.csv diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.json b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.json similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.json rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_4.json diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.csv b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.csv similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.csv rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.csv diff --git a/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.json b/perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.json similarity index 100% rename from evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.json rename to perplexity2575/evaluation/rankeval/lm1-4b2-84b-c4-perplexity_5.json diff --git a/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt diff --git a/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt similarity index 100% rename from global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt rename to perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt diff --git a/global_step80108/layer_01-model_00-model_states.pt b/perplexity2575/global_step80108/layer_01-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_01-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_01-model_00-model_states.pt diff --git a/global_step80108/layer_01-model_01-model_states.pt b/perplexity2575/global_step80108/layer_01-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_01-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_01-model_01-model_states.pt diff --git a/global_step80108/layer_03-model_00-model_states.pt b/perplexity2575/global_step80108/layer_03-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_03-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_03-model_00-model_states.pt diff --git a/global_step80108/layer_03-model_01-model_states.pt b/perplexity2575/global_step80108/layer_03-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_03-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_03-model_01-model_states.pt diff --git a/global_step80108/layer_04-model_00-model_states.pt b/perplexity2575/global_step80108/layer_04-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_04-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_04-model_00-model_states.pt diff --git a/global_step80108/layer_04-model_01-model_states.pt b/perplexity2575/global_step80108/layer_04-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_04-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_04-model_01-model_states.pt diff --git a/global_step80108/layer_05-model_00-model_states.pt b/perplexity2575/global_step80108/layer_05-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_05-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_05-model_00-model_states.pt diff --git a/global_step80108/layer_05-model_01-model_states.pt b/perplexity2575/global_step80108/layer_05-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_05-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_05-model_01-model_states.pt diff --git a/global_step80108/layer_06-model_00-model_states.pt b/perplexity2575/global_step80108/layer_06-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_06-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_06-model_00-model_states.pt diff --git a/global_step80108/layer_06-model_01-model_states.pt b/perplexity2575/global_step80108/layer_06-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_06-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_06-model_01-model_states.pt diff --git a/global_step80108/layer_07-model_00-model_states.pt b/perplexity2575/global_step80108/layer_07-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_07-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_07-model_00-model_states.pt diff --git a/global_step80108/layer_07-model_01-model_states.pt b/perplexity2575/global_step80108/layer_07-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_07-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_07-model_01-model_states.pt diff --git a/global_step80108/layer_08-model_00-model_states.pt b/perplexity2575/global_step80108/layer_08-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_08-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_08-model_00-model_states.pt diff --git a/global_step80108/layer_08-model_01-model_states.pt b/perplexity2575/global_step80108/layer_08-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_08-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_08-model_01-model_states.pt diff --git a/global_step80108/layer_09-model_00-model_states.pt b/perplexity2575/global_step80108/layer_09-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_09-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_09-model_00-model_states.pt diff --git a/global_step80108/layer_09-model_01-model_states.pt b/perplexity2575/global_step80108/layer_09-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_09-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_09-model_01-model_states.pt diff --git a/global_step80108/layer_10-model_00-model_states.pt b/perplexity2575/global_step80108/layer_10-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_10-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_10-model_00-model_states.pt diff --git a/global_step80108/layer_10-model_01-model_states.pt b/perplexity2575/global_step80108/layer_10-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_10-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_10-model_01-model_states.pt diff --git a/global_step80108/layer_11-model_00-model_states.pt b/perplexity2575/global_step80108/layer_11-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_11-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_11-model_00-model_states.pt diff --git a/global_step80108/layer_11-model_01-model_states.pt b/perplexity2575/global_step80108/layer_11-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_11-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_11-model_01-model_states.pt diff --git a/global_step80108/layer_12-model_00-model_states.pt b/perplexity2575/global_step80108/layer_12-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_12-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_12-model_00-model_states.pt diff --git a/global_step80108/layer_12-model_01-model_states.pt b/perplexity2575/global_step80108/layer_12-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_12-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_12-model_01-model_states.pt diff --git a/global_step80108/layer_13-model_00-model_states.pt b/perplexity2575/global_step80108/layer_13-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_13-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_13-model_00-model_states.pt diff --git a/global_step80108/layer_13-model_01-model_states.pt b/perplexity2575/global_step80108/layer_13-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_13-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_13-model_01-model_states.pt diff --git a/global_step80108/layer_14-model_00-model_states.pt b/perplexity2575/global_step80108/layer_14-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_14-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_14-model_00-model_states.pt diff --git a/global_step80108/layer_14-model_01-model_states.pt b/perplexity2575/global_step80108/layer_14-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_14-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_14-model_01-model_states.pt diff --git a/global_step80108/layer_15-model_00-model_states.pt b/perplexity2575/global_step80108/layer_15-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_15-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_15-model_00-model_states.pt diff --git a/global_step80108/layer_15-model_01-model_states.pt b/perplexity2575/global_step80108/layer_15-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_15-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_15-model_01-model_states.pt diff --git a/global_step80108/layer_16-model_00-model_states.pt b/perplexity2575/global_step80108/layer_16-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_16-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_16-model_00-model_states.pt diff --git a/global_step80108/layer_16-model_01-model_states.pt b/perplexity2575/global_step80108/layer_16-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_16-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_16-model_01-model_states.pt diff --git a/global_step80108/layer_17-model_00-model_states.pt b/perplexity2575/global_step80108/layer_17-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_17-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_17-model_00-model_states.pt diff --git a/global_step80108/layer_17-model_01-model_states.pt b/perplexity2575/global_step80108/layer_17-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_17-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_17-model_01-model_states.pt diff --git a/global_step80108/layer_18-model_00-model_states.pt b/perplexity2575/global_step80108/layer_18-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_18-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_18-model_00-model_states.pt diff --git a/global_step80108/layer_18-model_01-model_states.pt b/perplexity2575/global_step80108/layer_18-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_18-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_18-model_01-model_states.pt diff --git a/global_step80108/layer_19-model_00-model_states.pt b/perplexity2575/global_step80108/layer_19-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_19-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_19-model_00-model_states.pt diff --git a/global_step80108/layer_19-model_01-model_states.pt b/perplexity2575/global_step80108/layer_19-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_19-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_19-model_01-model_states.pt diff --git a/global_step80108/layer_20-model_00-model_states.pt b/perplexity2575/global_step80108/layer_20-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_20-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_20-model_00-model_states.pt diff --git a/global_step80108/layer_20-model_01-model_states.pt b/perplexity2575/global_step80108/layer_20-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_20-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_20-model_01-model_states.pt diff --git a/global_step80108/layer_21-model_00-model_states.pt b/perplexity2575/global_step80108/layer_21-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_21-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_21-model_00-model_states.pt diff --git a/global_step80108/layer_21-model_01-model_states.pt b/perplexity2575/global_step80108/layer_21-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_21-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_21-model_01-model_states.pt diff --git a/global_step80108/layer_22-model_00-model_states.pt b/perplexity2575/global_step80108/layer_22-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_22-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_22-model_00-model_states.pt diff --git a/global_step80108/layer_22-model_01-model_states.pt b/perplexity2575/global_step80108/layer_22-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_22-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_22-model_01-model_states.pt diff --git a/global_step80108/layer_23-model_00-model_states.pt b/perplexity2575/global_step80108/layer_23-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_23-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_23-model_00-model_states.pt diff --git a/global_step80108/layer_23-model_01-model_states.pt b/perplexity2575/global_step80108/layer_23-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_23-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_23-model_01-model_states.pt diff --git a/global_step80108/layer_24-model_00-model_states.pt b/perplexity2575/global_step80108/layer_24-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_24-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_24-model_00-model_states.pt diff --git a/global_step80108/layer_24-model_01-model_states.pt b/perplexity2575/global_step80108/layer_24-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_24-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_24-model_01-model_states.pt diff --git a/global_step80108/layer_25-model_00-model_states.pt b/perplexity2575/global_step80108/layer_25-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_25-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_25-model_00-model_states.pt diff --git a/global_step80108/layer_25-model_01-model_states.pt b/perplexity2575/global_step80108/layer_25-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_25-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_25-model_01-model_states.pt diff --git a/global_step80108/layer_26-model_00-model_states.pt b/perplexity2575/global_step80108/layer_26-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_26-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_26-model_00-model_states.pt diff --git a/global_step80108/layer_26-model_01-model_states.pt b/perplexity2575/global_step80108/layer_26-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_26-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_26-model_01-model_states.pt diff --git a/global_step80108/layer_27-model_00-model_states.pt b/perplexity2575/global_step80108/layer_27-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_27-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_27-model_00-model_states.pt diff --git a/global_step80108/layer_27-model_01-model_states.pt b/perplexity2575/global_step80108/layer_27-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_27-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_27-model_01-model_states.pt diff --git a/global_step80108/layer_28-model_00-model_states.pt b/perplexity2575/global_step80108/layer_28-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_28-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_28-model_00-model_states.pt diff --git a/global_step80108/layer_28-model_01-model_states.pt b/perplexity2575/global_step80108/layer_28-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_28-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_28-model_01-model_states.pt diff --git a/global_step80108/layer_29-model_00-model_states.pt b/perplexity2575/global_step80108/layer_29-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_29-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_29-model_00-model_states.pt diff --git a/global_step80108/layer_29-model_01-model_states.pt b/perplexity2575/global_step80108/layer_29-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_29-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_29-model_01-model_states.pt diff --git a/global_step80108/layer_30-model_00-model_states.pt b/perplexity2575/global_step80108/layer_30-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_30-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_30-model_00-model_states.pt diff --git a/global_step80108/layer_30-model_01-model_states.pt b/perplexity2575/global_step80108/layer_30-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_30-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_30-model_01-model_states.pt diff --git a/global_step80108/layer_31-model_00-model_states.pt b/perplexity2575/global_step80108/layer_31-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_31-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_31-model_00-model_states.pt diff --git a/global_step80108/layer_31-model_01-model_states.pt b/perplexity2575/global_step80108/layer_31-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_31-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_31-model_01-model_states.pt diff --git a/global_step80108/layer_32-model_00-model_states.pt b/perplexity2575/global_step80108/layer_32-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_32-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_32-model_00-model_states.pt diff --git a/global_step80108/layer_32-model_01-model_states.pt b/perplexity2575/global_step80108/layer_32-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_32-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_32-model_01-model_states.pt diff --git a/global_step80108/layer_33-model_00-model_states.pt b/perplexity2575/global_step80108/layer_33-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_33-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_33-model_00-model_states.pt diff --git a/global_step80108/layer_33-model_01-model_states.pt b/perplexity2575/global_step80108/layer_33-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_33-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_33-model_01-model_states.pt diff --git a/global_step80108/layer_34-model_00-model_states.pt b/perplexity2575/global_step80108/layer_34-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_34-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_34-model_00-model_states.pt diff --git a/global_step80108/layer_34-model_01-model_states.pt b/perplexity2575/global_step80108/layer_34-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_34-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_34-model_01-model_states.pt diff --git a/global_step80108/layer_35-model_00-model_states.pt b/perplexity2575/global_step80108/layer_35-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_35-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_35-model_00-model_states.pt diff --git a/global_step80108/layer_35-model_01-model_states.pt b/perplexity2575/global_step80108/layer_35-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_35-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_35-model_01-model_states.pt diff --git a/global_step80108/layer_36-model_00-model_states.pt b/perplexity2575/global_step80108/layer_36-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_36-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_36-model_00-model_states.pt diff --git a/global_step80108/layer_36-model_01-model_states.pt b/perplexity2575/global_step80108/layer_36-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_36-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_36-model_01-model_states.pt diff --git a/global_step80108/layer_38-model_00-model_states.pt b/perplexity2575/global_step80108/layer_38-model_00-model_states.pt similarity index 100% rename from global_step80108/layer_38-model_00-model_states.pt rename to perplexity2575/global_step80108/layer_38-model_00-model_states.pt diff --git a/global_step80108/layer_38-model_01-model_states.pt b/perplexity2575/global_step80108/layer_38-model_01-model_states.pt similarity index 100% rename from global_step80108/layer_38-model_01-model_states.pt rename to perplexity2575/global_step80108/layer_38-model_01-model_states.pt diff --git a/global_step80108/mp_rank_00_model_states.pt b/perplexity2575/global_step80108/mp_rank_00_model_states.pt similarity index 100% rename from global_step80108/mp_rank_00_model_states.pt rename to perplexity2575/global_step80108/mp_rank_00_model_states.pt diff --git a/global_step80108/mp_rank_01_model_states.pt b/perplexity2575/global_step80108/mp_rank_01_model_states.pt similarity index 100% rename from global_step80108/mp_rank_01_model_states.pt rename to perplexity2575/global_step80108/mp_rank_01_model_states.pt diff --git a/tensorboard_4b284bc4perplexity/events.out.tfevents.1674457654.nid005494.105619.0 b/perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674457654.nid005494.105619.0 similarity index 100% rename from tensorboard_4b284bc4perplexity/events.out.tfevents.1674457654.nid005494.105619.0 rename to perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674457654.nid005494.105619.0 diff --git a/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616098.nid006152.42129.0 b/perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616098.nid006152.42129.0 similarity index 100% rename from tensorboard_4b284bc4perplexity/events.out.tfevents.1674616098.nid006152.42129.0 rename to perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616098.nid006152.42129.0 diff --git a/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616323.nid005494.8381.0 b/perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616323.nid005494.8381.0 similarity index 100% rename from tensorboard_4b284bc4perplexity/events.out.tfevents.1674616323.nid005494.8381.0 rename to perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616323.nid005494.8381.0 diff --git a/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616542.nid005494.13319.0 b/perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616542.nid005494.13319.0 similarity index 100% rename from tensorboard_4b284bc4perplexity/events.out.tfevents.1674616542.nid005494.13319.0 rename to perplexity2575/tensorboard_4b284bc4perplexity/events.out.tfevents.1674616542.nid005494.13319.0 diff --git a/perplexity2575/transformers/config.json b/perplexity2575/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c8d973cca6c303d39373fc10106af26358b0ef51 --- /dev/null +++ b/perplexity2575/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 2560, "n_layer": 34, "n_head": 20, "n_inner": 10240, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/transformers/pytorch_model.bin b/perplexity2575/transformers/pytorch_model.bin similarity index 100% rename from transformers/pytorch_model.bin rename to perplexity2575/transformers/pytorch_model.bin diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9fbe17087447d833362dc91b180e9b283e07c931 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.36676283856494113, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0474507783379639}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.062332014806189766, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016383703848229427}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.293777806984314, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005252782658193723}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09441575378592391, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020680531546244394}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028711966510953046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000984576654338761}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1322458599845081, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003314534134287909}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04314501248705826, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001258246183189075}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.057942425405580346, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014255082882140484}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2776785385893423, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0049436461818446135}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.0882116048398588, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018389749448658346}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.058934717518613434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001525972938212972}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.27624443355923034, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004852154002930374}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08927510610731734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001938092014044731}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..60ba5985ad07a33e6b017c47d1ff61a0cf50cee6 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.42447490695849177, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.031118881647332453}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07242166849415733, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013848386081542273}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3588660487979018, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005213387725734495}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11353731182395607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019319506260635304}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03288701360932817, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000839098109533103}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17107042365285788, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036083953475667513}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.051698558921326514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012001219460540538}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0670061822698939, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001227160746048086}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3346245385921824, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004814146748998719}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10521613042548694, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017181082493525662}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06851784863794814, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013044655089246824}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.33834197646314856, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004780908665148567}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10736276773335406, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018148053880352902}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9f803690c1b4d07212aeb7080753e73190d16767 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5078474394915784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04940313819145897}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07524299617261106, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013542247809418073}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3789792715638066, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005087267508547312}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11839194985760551, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018550236570084812}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03451419278556197, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008480461582178029}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18485893110508558, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037439432130783046}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05453717672261224, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012063786187369366}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06970631509385179, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012132144640462751}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35342460023270555, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0047409890816951}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10986668151378429, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016757644991035844}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07085029048321866, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001272417656582146}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35589542269045665, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004677996287698992}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11142211614255489, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017402016546960485}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a7bcf308134219de8d53b29a20b7ff9e4c0fa1e6 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5321467980679849, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.030789259184486762}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07467739697980223, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013056742555484042}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3765931475512988, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005136827785933215}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11775282391938749, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018121209623013599}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03425895499250951, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007949938460894235}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1857701112713038, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037899558051587997}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05437250272050667, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011494478736656965}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0691367241290362, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011898077979863157}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35044113186494674, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004789067731865496}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.109142035871985, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016567099883848363}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07016534933559325, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001231446670361234}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3527313952049522, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004720204023911692}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11055745133283143, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017021172309438397}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..88ef49299a3bda728d37f308e70243f95d94bb21 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5836215112044281, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0373980578845506}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07814979242067882, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013719481084767942}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3904381500627582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005108365571685621}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12273951831524596, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018568477885135075}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.036278020218023364, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008590667413980339}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19568480085429035, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037894995606282777}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05731193809218633, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012015065055436362}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07184600146882388, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012338794593141857}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.361289411306646, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004721144658086456}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11294640173282941, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016715462444065227}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07360622983361918, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012935410743410267}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3670374936279833, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004716543868495296}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11548902373578677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017405908622108689}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b88a129702e655817437823fa134a4782549bc05 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.594609825520194, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04115839696833975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07606093952092045, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012363342608298056}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3956239968710567, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005142405199368944}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12086027376047605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017433543864987184}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.034848706116865254, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007661213026779092}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1971845061377734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003781803943041313}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.055825671549297295, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011219041594589493}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06988703720341218, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001122929060032178}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3647605769777058, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0047210888757834}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11109358926885284, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001582946667660359}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07150521311673122, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011539037542073426}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3721409413587192, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047326985289146365}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11358138097063522, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016202519807538079}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..43847797b200a12eadd3c6954a037d9b2334fd6a --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1319714359255099, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018067861281345137}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.22663257957285188, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002733984829707475}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.15459597826273924, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018270611999879997}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02346568721104801, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006971468696509421}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04305065808208426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013646495534821036}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.027936413268100608, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007972095177959765}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1050094945336366, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012983078223279439}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18568833868889176, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022086628996599916}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12417210909685761, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013302228377918145}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1211307288912133, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001638963005635593}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.20936613117867833, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025285661065844287}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1422075831554883, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016619749917407194}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.318952551089346, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04329525521577347}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..12deb20ee304d78df42a4f185a14afef7b85f490 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17493391960845747, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019881056363054072}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.30039251220979346, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027564678289120448}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20579895579192997, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019171748643174895}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.040554616651465696, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008659890131539827}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07316485920387228, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016147073802019601}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04823668695482641, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009745669933822557}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.124842470774516, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001319051588032341}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22232295572810765, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00218343118232531}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1484222303241806, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013020741099865607}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16389878356035073, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018573417662959208}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2828415570261487, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002627261412365232}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.19302273540773426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001789695068656324}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.4993327349018104, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.060039405630241266}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f4fd7de7a4ac8cf7b022d8bc4f045f6b76a29164 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.18456973112779013, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002015516204243605}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.31320510678716973, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026816066901912826}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.215446597689823, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018467682989689277}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04451908592886625, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009130557961238952}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07879022976243907, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016883257356260532}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05230636200823752, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009952603118013488}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1316268882646582, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013690654713722978}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23148383110872217, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002153117823688896}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15530146813359313, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012696789175546876}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.17349312338034656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018858372860279045}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.29539552159407584, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025507540114149945}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20267202658830938, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001723884821520709}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.848425645647928, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07632604642356548}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1033316b2d16850d4f2b6d5325f6cf1911e601b0 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1616397163764498, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023460161842419813}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.26019267483379616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032056026696719647}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18186666197279194, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002214876076414925}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03925295558880392, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009449386730106019}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06561949094566538, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016314095494124245}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04453744596750722, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009892511091368977}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11667604287371745, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016762280786544305}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19390457934260266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025516384846018345}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13202316706879197, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001565731448359357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.15230978309868673, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022054724157184874}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2461258416944667, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003046019155993613}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17153352468735855, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020795362207751736}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.803251560776854, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0956254167064949}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a07ce2bbb45867ba4e85608de8f0f62e03ef822f --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.0540655546367526, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019863598257229935}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08630893835073304, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028923078072790034}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05848926036885533, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001947796388751384}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.013419788420821602, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007196640004372746}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.022948179606902694, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011746702031675198}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.014698290853528981, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006960360254178698}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.04061005184395829, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015089448751204634}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06684826672013897, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023100255832951676}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.044046354099571715, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014521599460521}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.05070517916237353, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018676632653238442}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08116451423168446, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027292176658861946}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05480556417744295, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018205484087403967}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.6541873598701015, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04137927662792639}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d0188fffc94b92fbc96c44696bb1d95780f59c32 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009622620991293292, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009755776848685625}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.014660623303221735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013738443681724601}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009922885274947888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00091535752249209}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0025945823584633773, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003550261333440917}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.004296371055249484, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000576258075124869}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0027535231928660694, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00034248340049010525}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.007418445736015545, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007597278932642448}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.01150875523797143, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001083700258541403}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007698903693431021, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0007102473355679709}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.008921009893079637, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009010991448249183}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.01368434519987409, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012818488127390474}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.009228479004212309, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008517809180671035}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.8017672277263173e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 3.4167644481328265e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e88538405b6fb9d21a313dc91d24149ec599a624 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 3.2944515852286527, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0687957809640445}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.13683365368832767, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014688301287434024}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.28316158012799547, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025200608344027693}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.1814799362167216, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017831836075280368}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.046755060522420185, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008806060921358351}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.09586697768686785, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001719510820833045}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.06187846081562434, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001129424676101297}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.12660643084306702, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00126456533149021}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.264267984967182, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022332757179524803}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.16841364171833556, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015464664247715663}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.11737623006499737, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013285621448530893}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.24349593138163397, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002354566720998469}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.15579956125425456, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016372102304097094}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f3bacb4af65bf838c3e754dd55baeecf1c508410 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 8.52641209830111, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12582983777195597}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.44140716426798104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032213924886028253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4052286843296632, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002639166874418895}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3977363846975939, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022382388166838187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.18864819780738046, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0022621645695871918}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.16963873808583682, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001847799566651559}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.16696906460089045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017222149044682246}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.31455069215794823, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025903719800358703}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2903012525772825, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002143374874342348}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2829785990744798, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001784528829213968}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3567420815242637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029468018540509057}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3256533312057627, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023856069656370727}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3201857670611568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002098087765270582}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9312d7ea35f79fc6b02be4b4fada0ee1e5ecb2f1 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.630291369867987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13549753046024302}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.44886308747052966, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030653689427961226}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4345078703253225, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025475650430768814}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4181223330310302, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020232576936325647}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.20393782443251954, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0022988281035972273}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19337736914798762, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00185489954602544}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18635767606167977, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016723047591652514}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.31607957889707133, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002589473433632966}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3043881139321235, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002132304038142002}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2928097571700884, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017552966978288125}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3695227255731898, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00282070031070788}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3571271332319229, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023658526732539117}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3438100939181177, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019679894394683483}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..dbbf993cb0ee5d1da59d4d13722cbee15a303d02 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.771336904004668, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15312208049452972}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.47121262761824606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031706802673694546}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4285131204444559, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00259084813925993}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4246139438060347, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002068822985960878}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.22192545824696955, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024446292469949274}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19735042748477633, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001962335262395526}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19583480506260798, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017745784799472742}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.33776452672838364, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002772013880864643}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3053908517936716, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022386749143566537}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3025604202708821, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018763118742909542}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3904903633666419, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029686040326820764}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3552152361692601, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002487386620131327}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35175775657317715, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020815737481426283}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..349cba586a79f640cea37d942a02dab7f19c2655 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.267530539514095, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1677573231958913}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4875664382154273, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003185218088206128}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4282782601002331, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024811809614885827}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43249984090343835, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002029303339376666}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.23104550813725375, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024366019088569594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19888718264029498, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001882516080327131}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20132801941812545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017679869293689926}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3469917638960595, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027307278162448678}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.30357116962664776, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002153172746913521}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3066167803857757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001864747310583765}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4016050584122585, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029687484050154784}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35340408132516204, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024203053725328372}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.356433479440808, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002068322803762821}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0aab1ed5b97e1e930db50786cffb4d7514ccd28c --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.805990819642968, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11545747726371132}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.46998019703375354, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031239647333913445}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43070572612561325, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002457470355676941}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.42703858045940735, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002035276652428456}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.22095953832665552, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002353597555734135}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1987243871558035, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018784818554072877}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19734778489236487, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017398333866025894}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3325206520940773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002612965421345996}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3056110355009581, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002176897829405239}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3017510704812495, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018231271871051772}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3883766916064333, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002916081958006691}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35559042723108397, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023422683169970725}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3526562252374031, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002039422626192226}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_0.json b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..fa0adc2b5a2ae6b78a5011844b9f98fe56ffe25b --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1682140354361548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024311651181596846}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.35168988214341523, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004257802996267162}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2188247155119966, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026101698852964428}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03791114624887027, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001430715346143808}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08181326285418697, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027684668080112493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.049755066362456114, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001711057906744696}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12558538899658162, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019306618262220862}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.26406296625514597, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034141022743443975}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16347253111222268, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020596404700326306}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13072162961307798, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019975037472617324}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.27675311185951984, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003756707707901523}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1707786995081715, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002220764586073378}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.1814410356065763, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11929627005647012}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_1.json b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a4884c9be4ee2a379df11153c73fe07c3ae19add --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12394690078102485, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017820854664639617}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.30883381009085337, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004143617002757454}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17485668915463046, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024040861492345958}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02454039849295794, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009642339010215241}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06338989802824146, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025845302772511}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.034970894707131765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013750874506006509}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09759605191150027, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013546647766234851}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24498653012258598, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032922471031046553}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13792484720753254, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00184311444020864}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09975522247129645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001443168667820945}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.25068739231214776, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003536217595269335}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14106410762921118, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00197754854435336}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4164772106615187, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08503842048783962}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_2.json b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..94c0802e935df29c463726fef5d387d4853b3702 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1212713815463862, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001783930979666327}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3027696164744973, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004069720967342189}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17119896569207846, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023973191304758746}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.022526851037537605, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009300320053962364}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05803699224106711, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002478507440389671}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.032088581665832575, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013254566404233465}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09410711927777662, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013305323171338883}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2369780862526828, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032212483252820195}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1331419291803311, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018112812768873992}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0973756908203134, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014271599181187183}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24589465344432024, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035007571446406256}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1378737759652496, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019533435435502575}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3211406116055093, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05632158339691826}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_3.json b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..84b471537dcad80e769f523ce78a83c69166088f --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12267341712650358, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00207297750674979}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.29346318087456813, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004412522962315509}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16908880821212016, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025898440173812076}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.023615304490600033, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010046076586988078}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05931770918646783, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002583579920531965}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03314896853957152, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013908257283640876}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09519232603078606, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015734855162649944}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.22996956742200556, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00356629562100884}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13158510148593067, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020014770100106496}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0987948573594369, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001680092786160822}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23916103459926824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003841293731139315}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13667047371150057, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021600836418570976}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4406275619553672, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.058943511303575426}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_4.json b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5220f3d4d9d3925f8256c5a2c4d8d786c48d98d3 --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.036834822457244766, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022079340145582244}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07337453869001616, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004314314932527252}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04566365412307027, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002608741489638274}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.006497191357163194, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006016918414205361}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.014978313036291765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014510780480090683}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00874385192747724, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008092464001035177}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.028775879177447013, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017095958814072434}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05725787803054188, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003351554553300089}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03550416488438028, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020020706708868776}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03052315595597832, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018382248537160094}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.06056408978110664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035955665511950294}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03770504825258967, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021688966924711204}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6685820712764758, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11003965221099908}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_5.json b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..76d6667ff058e75477636c00c28ae9637395016d --- /dev/null +++ b/perplexity50/evaluation/generation/agg.perplexity50_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0025092290685345187, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008065208895136817}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.00204279104163942, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005925317015988438}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002202987774184108, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006658652488222124}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00031845928766017557, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002726745419818294}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00021032426692804053, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00016342749062440463}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00024851863402463746, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00020210817841172796}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0018256414840619524, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005744051717215062}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0015255275808323426, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004364013489751857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0016217715192546416, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00048067108652986303}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0020224773879338985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0006369133276637897}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.001658634237434707, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0004694737360395629}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0017788861730293213, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005248009571798277}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.330855196908569e-39, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.2953575552071226e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_0.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0996b5def8ff12ec5cb6ea0c2cca79aaa750faa6 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e620220cc3aa61f829ac5bb3c71b71a9bed8a1e0c9b44f35894b417f1f481660 +size 4263648 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_1.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e2d318b56bab49810eeb471c1019ca1968c99055 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7c884222c6d10ea11ca3be75fa1231fa0524d2dc0295a56492fa4beecc4ae5 +size 5106949 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_2.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..682f0a6b390ce087fe4fc10050fdd665b6660a3f --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa28f0f72ffe7380cb46e6a2da8e33843569d2a921430776d243f51ab60eb37d +size 5962625 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_3.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3055dea2c94ef34fe6b927de44ee9a4dd66d6e74 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc43a76c578855b89c99a8a5694b45fdd67655cb96e9f01a26a6db9c91875225 +size 6863646 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_4.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..213e7b102bb1a29b1f42302a0c48b3ec0d3c9ffe --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfa3a476f7709fd55cc6af55d579da88f750d5eada7db26446ccfd04e23255d +size 7766389 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_5.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fceab456baa218549f51a3119974bb7020703d3c --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738826be149d489fe04faaabb639ed702466a76a8fbf8fb5683812926a906c9a +size 8671280 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_0.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cc6a04279a82d0a7bee8908712e42feccd9d7b6b --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2840b2e5d26d3ba2ef3462e2a9d611b30f20a1845fa335e421d906449e63ae44 +size 7668865 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_1.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2ecec5e1fafbb8ea741a7843da6c3ff6efcabb89 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6f3403bb9c74cc309f66346717bde5c25e20ceb53ebcc38cdbf21fd9052e81 +size 13321479 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_2.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5c006741eb54f181ed586ca3197b9bb6cca24c8f --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb02316f86bcdbb2a68ce281561ca2c62b6f72dab3d830d5ba60bffe1f31fdaf +size 18922508 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_3.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..113e790da2be2dbd6ef7739c7eb849e2e39c9e89 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea0264a15e3ad34e9eb08284cfb77709abd44672fbbad544beaa58b9664dc6c9 +size 24340207 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_4.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e679aadb4c3231296007177d22dbdc4387bed333 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59b01670d7eea5cf43277b387dfa958ccf3d9c66852b694d34997fe123558ab +size 29473696 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_5.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1f9c3443415094bdb560a9c5e4c9d75715d72555 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13e3253fb750807fc2e2e0b9a8251b361251ac7c35b0133959b51113bf41972e +size 34799683 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..34672bd684558313424c8a9732a95ae3c6dab521 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda954416c2af5aa56238666a6dfed8a7f60a453e0e37d3c876019abeee2779e +size 4450274 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c86f41c4b0096533586c7b9e354397d259c741b9 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ccea9347e67765129f1a9c957d5b9ff43a77fd2f34e58db803c4428877fd841 +size 5113794 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6c7a5bce4995d3f1fac57b8a32fe397acf4ae68f --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be248223894f5d8bc6610f01251c5ff1d03476bdfaad6f4fc86a09b7c0152687 +size 6240105 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4a3b46f9bfa40b5728e5e7cf3a7301defb0db567 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4698b0dea10463a1fd25a89ec98c6cbb61495a1722ab5502c857ff0f5f5b81d1 +size 7285174 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8f7805d2fb8e9c84a0b483fa48512e2c5b8d87e7 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c521924ebd153d23d9366736483edb4cd3e25398e12edbe8d0a596b8701fe4c0 +size 8340914 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..23bbb00bf9e2413e058be59467d31bcf0993d8b4 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bed778f2cbea542d90689699ef68c7646486dbc9a36779ec7d9bb391b0c66f76 +size 9452170 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_0.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..19adc6a6b7b2f254323fcffe773f4c1430ae4873 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ab7d82964dc511e9da6147efafb82356230a62874b28d6b9ffe1e4102ee14c +size 2804470 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_1.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f8b21ac5098b493eb89c7b96ef202b032ba7bf82 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e74d26cb846c7b502af297283ef4dd92547d125bd058e0c74be454942e12feb3 +size 5099192 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_2.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c6cc15966f75690f37447027c5a8bc9c6bee9891 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:587141e51fa17c277711faef0fe391c902d9e7340f3b6fb04854eb32106e6d37 +size 7373647 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_3.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..42901b4eaf45ef30791001034bc7b38ef163e855 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2007ada9eae54de0ba2ea3d72738577c011d6c758c252a5965e29359846e8ae1 +size 9642517 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_4.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ede51f821b106b354cc39f6ecd709b71abdf8014 --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e8bb61a8ad068d62d4d423e7eaf5e77916dafc531f432b029f27f4f7a0f82b +size 11671279 diff --git a/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_5.jsonl b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..aa7cd64e57441639cfbae912a3a637c9568f1a7e --- /dev/null +++ b/perplexity50/evaluation/generation/examples.perplexity50_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7561501df2b06a5b965bed0c074b6584fd6c2f91f5af76dee32c8d4ea2bd62bb +size 13897502 diff --git a/perplexity50/evaluation/generation/merged.csv b/perplexity50/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..ee971d943eb4f65dbbbc7e05c669a6be2541e4ea --- /dev/null +++ b/perplexity50/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.06187846081562434 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.06187846081562434 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.16696906460089045 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.16696906460089045 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.18635767606167977 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.18635767606167977 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.19583480506260798 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.19583480506260798 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.20132801941812545 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.20132801941812545 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.19734778489236487 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.19734778489236487 +e2e_nlg_cleaned,5,average,multiple,0.16828596847521549 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.049755066362456114 +gem_xsum,0,median,rouge2_fmeasure,0.049755066362456114 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.034970894707131765 +gem_xsum,1,median,rouge2_fmeasure,0.034970894707131765 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.032088581665832575 +gem_xsum,2,median,rouge2_fmeasure,0.032088581665832575 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03314896853957152 +gem_xsum,3,median,rouge2_fmeasure,0.03314896853957152 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.00874385192747724 +gem_xsum,4,median,rouge2_fmeasure,0.00874385192747724 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00024851863402463746 +gem_xsum,5,median,rouge2_fmeasure,0.00024851863402463746 +gem_xsum,5,average,multiple,0.026492646972748977 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04314501248705826 +web_nlg_en,0,median,rouge2_fmeasure,0.04314501248705826 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.051698558921326514 +web_nlg_en,1,median,rouge2_fmeasure,0.051698558921326514 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.05453717672261224 +web_nlg_en,2,median,rouge2_fmeasure,0.05453717672261224 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05437250272050667 +web_nlg_en,3,median,rouge2_fmeasure,0.05437250272050667 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05731193809218633 +web_nlg_en,4,median,rouge2_fmeasure,0.05731193809218633 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.055825671549297295 +web_nlg_en,5,median,rouge2_fmeasure,0.055825671549297295 +web_nlg_en,5,average,multiple,0.05281514341549788 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.027936413268100608 +wiki_lingua_en,0,median,rouge2_fmeasure,0.027936413268100608 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.04823668695482641 +wiki_lingua_en,1,median,rouge2_fmeasure,0.04823668695482641 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.05230636200823752 +wiki_lingua_en,2,median,rouge2_fmeasure,0.05230636200823752 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.04453744596750722 +wiki_lingua_en,3,median,rouge2_fmeasure,0.04453744596750722 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.014698290853528981 +wiki_lingua_en,4,median,rouge2_fmeasure,0.014698290853528981 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0027535231928660694 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0027535231928660694 +wiki_lingua_en,5,average,multiple,0.03174478704084447 diff --git a/perplexity50/evaluation/generation/merged.json b/perplexity50/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..e3bb2f6cff870060fc149ba1ed98cdd4ef38168d --- /dev/null +++ b/perplexity50/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.36676283856494113, "bleu_stderr": 0.0474507783379639, "rouge1_fmeasure": 0.09441575378592391, "rouge1_fmeasure_stderr": 0.0020680531546244394, "rouge1_precision": 0.062332014806189766, "rouge1_precision_stderr": 0.0016383703848229427, "rouge1_recall": 0.293777806984314, "rouge1_recall_stderr": 0.005252782658193723, "rouge2_fmeasure": 0.04314501248705826, "rouge2_fmeasure_stderr": 0.001258246183189075, "rouge2_precision": 0.028711966510953046, "rouge2_precision_stderr": 0.000984576654338761, "rouge2_recall": 0.1322458599845081, "rouge2_recall_stderr": 0.003314534134287909, "rougeL_fmeasure": 0.0882116048398588, "rougeL_fmeasure_stderr": 0.0018389749448658346, "rougeL_precision": 0.057942425405580346, "rougeL_precision_stderr": 0.0014255082882140484, "rougeL_recall": 0.2776785385893423, "rougeL_recall_stderr": 0.0049436461818446135, "rougeLsum_fmeasure": 0.08927510610731734, "rougeLsum_fmeasure_stderr": 0.001938092014044731, "rougeLsum_precision": 0.058934717518613434, "rougeLsum_precision_stderr": 0.001525972938212972, "rougeLsum_recall": 0.27624443355923034, "rougeLsum_recall_stderr": 0.004852154002930374}}, "1": {"PALM_prompt": {"bleu": 0.42447490695849177, "bleu_stderr": 0.031118881647332453, "rouge1_fmeasure": 0.11353731182395607, "rouge1_fmeasure_stderr": 0.0019319506260635304, "rouge1_precision": 0.07242166849415733, "rouge1_precision_stderr": 0.0013848386081542273, "rouge1_recall": 0.3588660487979018, "rouge1_recall_stderr": 0.005213387725734495, "rouge2_fmeasure": 0.051698558921326514, "rouge2_fmeasure_stderr": 0.0012001219460540538, "rouge2_precision": 0.03288701360932817, "rouge2_precision_stderr": 0.000839098109533103, "rouge2_recall": 0.17107042365285788, "rouge2_recall_stderr": 0.0036083953475667513, "rougeL_fmeasure": 0.10521613042548694, "rougeL_fmeasure_stderr": 0.0017181082493525662, "rougeL_precision": 0.0670061822698939, "rougeL_precision_stderr": 0.001227160746048086, "rougeL_recall": 0.3346245385921824, "rougeL_recall_stderr": 0.004814146748998719, "rougeLsum_fmeasure": 0.10736276773335406, "rougeLsum_fmeasure_stderr": 0.0018148053880352902, "rougeLsum_precision": 0.06851784863794814, "rougeLsum_precision_stderr": 0.0013044655089246824, "rougeLsum_recall": 0.33834197646314856, "rougeLsum_recall_stderr": 0.004780908665148567}}, "2": {"PALM_prompt": {"bleu": 0.5078474394915784, "bleu_stderr": 0.04940313819145897, "rouge1_fmeasure": 0.11839194985760551, "rouge1_fmeasure_stderr": 0.0018550236570084812, "rouge1_precision": 0.07524299617261106, "rouge1_precision_stderr": 0.0013542247809418073, "rouge1_recall": 0.3789792715638066, "rouge1_recall_stderr": 0.005087267508547312, "rouge2_fmeasure": 0.05453717672261224, "rouge2_fmeasure_stderr": 0.0012063786187369366, "rouge2_precision": 0.03451419278556197, "rouge2_precision_stderr": 0.0008480461582178029, "rouge2_recall": 0.18485893110508558, "rouge2_recall_stderr": 0.0037439432130783046, "rougeL_fmeasure": 0.10986668151378429, "rougeL_fmeasure_stderr": 0.0016757644991035844, "rougeL_precision": 0.06970631509385179, "rougeL_precision_stderr": 0.0012132144640462751, "rougeL_recall": 0.35342460023270555, "rougeL_recall_stderr": 0.0047409890816951, "rougeLsum_fmeasure": 0.11142211614255489, "rougeLsum_fmeasure_stderr": 0.0017402016546960485, "rougeLsum_precision": 0.07085029048321866, "rougeLsum_precision_stderr": 0.001272417656582146, "rougeLsum_recall": 0.35589542269045665, "rougeLsum_recall_stderr": 0.004677996287698992}}, "3": {"PALM_prompt": {"bleu": 0.5321467980679849, "bleu_stderr": 0.030789259184486762, "rouge1_fmeasure": 0.11775282391938749, "rouge1_fmeasure_stderr": 0.0018121209623013599, "rouge1_precision": 0.07467739697980223, "rouge1_precision_stderr": 0.0013056742555484042, "rouge1_recall": 0.3765931475512988, "rouge1_recall_stderr": 0.005136827785933215, "rouge2_fmeasure": 0.05437250272050667, "rouge2_fmeasure_stderr": 0.0011494478736656965, "rouge2_precision": 0.03425895499250951, "rouge2_precision_stderr": 0.0007949938460894235, "rouge2_recall": 0.1857701112713038, "rouge2_recall_stderr": 0.0037899558051587997, "rougeL_fmeasure": 0.109142035871985, "rougeL_fmeasure_stderr": 0.0016567099883848363, "rougeL_precision": 0.0691367241290362, "rougeL_precision_stderr": 0.0011898077979863157, "rougeL_recall": 0.35044113186494674, "rougeL_recall_stderr": 0.004789067731865496, "rougeLsum_fmeasure": 0.11055745133283143, "rougeLsum_fmeasure_stderr": 0.0017021172309438397, "rougeLsum_precision": 0.07016534933559325, "rougeLsum_precision_stderr": 0.001231446670361234, "rougeLsum_recall": 0.3527313952049522, "rougeLsum_recall_stderr": 0.004720204023911692}}, "4": {"PALM_prompt": {"bleu": 0.5836215112044281, "bleu_stderr": 0.0373980578845506, "rouge1_fmeasure": 0.12273951831524596, "rouge1_fmeasure_stderr": 0.0018568477885135075, "rouge1_precision": 0.07814979242067882, "rouge1_precision_stderr": 0.0013719481084767942, "rouge1_recall": 0.3904381500627582, "rouge1_recall_stderr": 0.005108365571685621, "rouge2_fmeasure": 0.05731193809218633, "rouge2_fmeasure_stderr": 0.0012015065055436362, "rouge2_precision": 0.036278020218023364, "rouge2_precision_stderr": 0.0008590667413980339, "rouge2_recall": 0.19568480085429035, "rouge2_recall_stderr": 0.0037894995606282777, "rougeL_fmeasure": 0.11294640173282941, "rougeL_fmeasure_stderr": 0.0016715462444065227, "rougeL_precision": 0.07184600146882388, "rougeL_precision_stderr": 0.0012338794593141857, "rougeL_recall": 0.361289411306646, "rougeL_recall_stderr": 0.004721144658086456, "rougeLsum_fmeasure": 0.11548902373578677, "rougeLsum_fmeasure_stderr": 0.0017405908622108689, "rougeLsum_precision": 0.07360622983361918, "rougeLsum_precision_stderr": 0.0012935410743410267, "rougeLsum_recall": 0.3670374936279833, "rougeLsum_recall_stderr": 0.004716543868495296}}, "5": {"PALM_prompt": {"bleu": 0.594609825520194, "bleu_stderr": 0.04115839696833975, "rouge1_fmeasure": 0.12086027376047605, "rouge1_fmeasure_stderr": 0.0017433543864987184, "rouge1_precision": 0.07606093952092045, "rouge1_precision_stderr": 0.0012363342608298056, "rouge1_recall": 0.3956239968710567, "rouge1_recall_stderr": 0.005142405199368944, "rouge2_fmeasure": 0.055825671549297295, "rouge2_fmeasure_stderr": 0.0011219041594589493, "rouge2_precision": 0.034848706116865254, "rouge2_precision_stderr": 0.0007661213026779092, "rouge2_recall": 0.1971845061377734, "rouge2_recall_stderr": 0.003781803943041313, "rougeL_fmeasure": 0.11109358926885284, "rougeL_fmeasure_stderr": 0.001582946667660359, "rougeL_precision": 0.06988703720341218, "rougeL_precision_stderr": 0.001122929060032178, "rougeL_recall": 0.3647605769777058, "rougeL_recall_stderr": 0.0047210888757834, "rougeLsum_fmeasure": 0.11358138097063522, "rougeLsum_fmeasure_stderr": 0.0016202519807538079, "rougeLsum_precision": 0.07150521311673122, "rougeLsum_precision_stderr": 0.0011539037542073426, "rougeLsum_recall": 0.3721409413587192, "rougeLsum_recall_stderr": 0.0047326985289146365}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.318952551089346, "bleu_stderr": 0.04329525521577347, "rouge1_fmeasure": 0.15459597826273924, "rouge1_fmeasure_stderr": 0.0018270611999879997, "rouge1_precision": 0.1319714359255099, "rouge1_precision_stderr": 0.0018067861281345137, "rouge1_recall": 0.22663257957285188, "rouge1_recall_stderr": 0.002733984829707475, "rouge2_fmeasure": 0.027936413268100608, "rouge2_fmeasure_stderr": 0.0007972095177959765, "rouge2_precision": 0.02346568721104801, "rouge2_precision_stderr": 0.0006971468696509421, "rouge2_recall": 0.04305065808208426, "rouge2_recall_stderr": 0.0013646495534821036, "rougeL_fmeasure": 0.12417210909685761, "rougeL_fmeasure_stderr": 0.0013302228377918145, "rougeL_precision": 0.1050094945336366, "rougeL_precision_stderr": 0.0012983078223279439, "rougeL_recall": 0.18568833868889176, "rougeL_recall_stderr": 0.0022086628996599916, "rougeLsum_fmeasure": 0.1422075831554883, "rougeLsum_fmeasure_stderr": 0.0016619749917407194, "rougeLsum_precision": 0.1211307288912133, "rougeLsum_precision_stderr": 0.001638963005635593, "rougeLsum_recall": 0.20936613117867833, "rougeLsum_recall_stderr": 0.0025285661065844287}}, "1": {"tldr_en": {"bleu": 2.4993327349018104, "bleu_stderr": 0.060039405630241266, "rouge1_fmeasure": 0.20579895579192997, "rouge1_fmeasure_stderr": 0.0019171748643174895, "rouge1_precision": 0.17493391960845747, "rouge1_precision_stderr": 0.0019881056363054072, "rouge1_recall": 0.30039251220979346, "rouge1_recall_stderr": 0.0027564678289120448, "rouge2_fmeasure": 0.04823668695482641, "rouge2_fmeasure_stderr": 0.0009745669933822557, "rouge2_precision": 0.040554616651465696, "rouge2_precision_stderr": 0.0008659890131539827, "rouge2_recall": 0.07316485920387228, "rouge2_recall_stderr": 0.0016147073802019601, "rougeL_fmeasure": 0.1484222303241806, "rougeL_fmeasure_stderr": 0.0013020741099865607, "rougeL_precision": 0.124842470774516, "rougeL_precision_stderr": 0.001319051588032341, "rougeL_recall": 0.22232295572810765, "rougeL_recall_stderr": 0.00218343118232531, "rougeLsum_fmeasure": 0.19302273540773426, "rougeLsum_fmeasure_stderr": 0.001789695068656324, "rougeLsum_precision": 0.16389878356035073, "rougeLsum_precision_stderr": 0.0018573417662959208, "rougeLsum_recall": 0.2828415570261487, "rougeLsum_recall_stderr": 0.002627261412365232}}, "2": {"tldr_en": {"bleu": 2.848425645647928, "bleu_stderr": 0.07632604642356548, "rouge1_fmeasure": 0.215446597689823, "rouge1_fmeasure_stderr": 0.0018467682989689277, "rouge1_precision": 0.18456973112779013, "rouge1_precision_stderr": 0.002015516204243605, "rouge1_recall": 0.31320510678716973, "rouge1_recall_stderr": 0.0026816066901912826, "rouge2_fmeasure": 0.05230636200823752, "rouge2_fmeasure_stderr": 0.0009952603118013488, "rouge2_precision": 0.04451908592886625, "rouge2_precision_stderr": 0.0009130557961238952, "rouge2_recall": 0.07879022976243907, "rouge2_recall_stderr": 0.0016883257356260532, "rougeL_fmeasure": 0.15530146813359313, "rougeL_fmeasure_stderr": 0.0012696789175546876, "rougeL_precision": 0.1316268882646582, "rougeL_precision_stderr": 0.0013690654713722978, "rougeL_recall": 0.23148383110872217, "rougeL_recall_stderr": 0.002153117823688896, "rougeLsum_fmeasure": 0.20267202658830938, "rougeLsum_fmeasure_stderr": 0.001723884821520709, "rougeLsum_precision": 0.17349312338034656, "rougeLsum_precision_stderr": 0.0018858372860279045, "rougeLsum_recall": 0.29539552159407584, "rougeLsum_recall_stderr": 0.0025507540114149945}}, "3": {"tldr_en": {"bleu": 2.803251560776854, "bleu_stderr": 0.0956254167064949, "rouge1_fmeasure": 0.18186666197279194, "rouge1_fmeasure_stderr": 0.002214876076414925, "rouge1_precision": 0.1616397163764498, "rouge1_precision_stderr": 0.0023460161842419813, "rouge1_recall": 0.26019267483379616, "rouge1_recall_stderr": 0.0032056026696719647, "rouge2_fmeasure": 0.04453744596750722, "rouge2_fmeasure_stderr": 0.0009892511091368977, "rouge2_precision": 0.03925295558880392, "rouge2_precision_stderr": 0.0009449386730106019, "rouge2_recall": 0.06561949094566538, "rouge2_recall_stderr": 0.0016314095494124245, "rougeL_fmeasure": 0.13202316706879197, "rougeL_fmeasure_stderr": 0.001565731448359357, "rougeL_precision": 0.11667604287371745, "rougeL_precision_stderr": 0.0016762280786544305, "rougeL_recall": 0.19390457934260266, "rougeL_recall_stderr": 0.0025516384846018345, "rougeLsum_fmeasure": 0.17153352468735855, "rougeLsum_fmeasure_stderr": 0.0020795362207751736, "rougeLsum_precision": 0.15230978309868673, "rougeLsum_precision_stderr": 0.0022054724157184874, "rougeLsum_recall": 0.2461258416944667, "rougeLsum_recall_stderr": 0.003046019155993613}}, "4": {"tldr_en": {"bleu": 0.6541873598701015, "bleu_stderr": 0.04137927662792639, "rouge1_fmeasure": 0.05848926036885533, "rouge1_fmeasure_stderr": 0.001947796388751384, "rouge1_precision": 0.0540655546367526, "rouge1_precision_stderr": 0.0019863598257229935, "rouge1_recall": 0.08630893835073304, "rouge1_recall_stderr": 0.0028923078072790034, "rouge2_fmeasure": 0.014698290853528981, "rouge2_fmeasure_stderr": 0.0006960360254178698, "rouge2_precision": 0.013419788420821602, "rouge2_precision_stderr": 0.0007196640004372746, "rouge2_recall": 0.022948179606902694, "rouge2_recall_stderr": 0.0011746702031675198, "rougeL_fmeasure": 0.044046354099571715, "rougeL_fmeasure_stderr": 0.0014521599460521, "rougeL_precision": 0.04061005184395829, "rougeL_precision_stderr": 0.0015089448751204634, "rougeL_recall": 0.06684826672013897, "rougeL_recall_stderr": 0.0023100255832951676, "rougeLsum_fmeasure": 0.05480556417744295, "rougeLsum_fmeasure_stderr": 0.0018205484087403967, "rougeLsum_precision": 0.05070517916237353, "rougeLsum_precision_stderr": 0.0018676632653238442, "rougeLsum_recall": 0.08116451423168446, "rougeLsum_recall_stderr": 0.0027292176658861946}}, "5": {"tldr_en": {"bleu": 1.8017672277263173e-06, "bleu_stderr": 3.4167644481328265e-06, "rouge1_fmeasure": 0.009922885274947888, "rouge1_fmeasure_stderr": 0.00091535752249209, "rouge1_precision": 0.009622620991293292, "rouge1_precision_stderr": 0.0009755776848685625, "rouge1_recall": 0.014660623303221735, "rouge1_recall_stderr": 0.0013738443681724601, "rouge2_fmeasure": 0.0027535231928660694, "rouge2_fmeasure_stderr": 0.00034248340049010525, "rouge2_precision": 0.0025945823584633773, "rouge2_precision_stderr": 0.0003550261333440917, "rouge2_recall": 0.004296371055249484, "rouge2_recall_stderr": 0.000576258075124869, "rougeL_fmeasure": 0.007698903693431021, "rougeL_fmeasure_stderr": 0.0007102473355679709, "rougeL_precision": 0.007418445736015545, "rougeL_precision_stderr": 0.0007597278932642448, "rougeL_recall": 0.01150875523797143, "rougeL_recall_stderr": 0.001083700258541403, "rougeLsum_fmeasure": 0.009228479004212309, "rougeLsum_fmeasure_stderr": 0.0008517809180671035, "rougeLsum_precision": 0.008921009893079637, "rougeLsum_precision_stderr": 0.0009010991448249183, "rougeLsum_recall": 0.01368434519987409, "rougeLsum_recall_stderr": 0.0012818488127390474}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 3.2944515852286527, "bleu_stderr": 0.0687957809640445, "rouge1_fmeasure": 0.1814799362167216, "rouge1_fmeasure_stderr": 0.0017831836075280368, "rouge1_precision": 0.13683365368832767, "rouge1_precision_stderr": 0.0014688301287434024, "rouge1_recall": 0.28316158012799547, "rouge1_recall_stderr": 0.0025200608344027693, "rouge2_fmeasure": 0.06187846081562434, "rouge2_fmeasure_stderr": 0.001129424676101297, "rouge2_precision": 0.046755060522420185, "rouge2_precision_stderr": 0.0008806060921358351, "rouge2_recall": 0.09586697768686785, "rouge2_recall_stderr": 0.001719510820833045, "rougeL_fmeasure": 0.16841364171833556, "rougeL_fmeasure_stderr": 0.0015464664247715663, "rougeL_precision": 0.12660643084306702, "rougeL_precision_stderr": 0.00126456533149021, "rougeL_recall": 0.264267984967182, "rougeL_recall_stderr": 0.0022332757179524803, "rougeLsum_fmeasure": 0.15579956125425456, "rougeLsum_fmeasure_stderr": 0.0016372102304097094, "rougeLsum_precision": 0.11737623006499737, "rougeLsum_precision_stderr": 0.0013285621448530893, "rougeLsum_recall": 0.24349593138163397, "rougeLsum_recall_stderr": 0.002354566720998469}}, "1": {"generate_text_restaurant": {"bleu": 8.52641209830111, "bleu_stderr": 0.12582983777195597, "rouge1_fmeasure": 0.3977363846975939, "rouge1_fmeasure_stderr": 0.0022382388166838187, "rouge1_precision": 0.44140716426798104, "rouge1_precision_stderr": 0.0032213924886028253, "rouge1_recall": 0.4052286843296632, "rouge1_recall_stderr": 0.002639166874418895, "rouge2_fmeasure": 0.16696906460089045, "rouge2_fmeasure_stderr": 0.0017222149044682246, "rouge2_precision": 0.18864819780738046, "rouge2_precision_stderr": 0.0022621645695871918, "rouge2_recall": 0.16963873808583682, "rouge2_recall_stderr": 0.001847799566651559, "rougeL_fmeasure": 0.2829785990744798, "rougeL_fmeasure_stderr": 0.001784528829213968, "rougeL_precision": 0.31455069215794823, "rougeL_precision_stderr": 0.0025903719800358703, "rougeL_recall": 0.2903012525772825, "rougeL_recall_stderr": 0.002143374874342348, "rougeLsum_fmeasure": 0.3201857670611568, "rougeLsum_fmeasure_stderr": 0.002098087765270582, "rougeLsum_precision": 0.3567420815242637, "rougeLsum_precision_stderr": 0.0029468018540509057, "rougeLsum_recall": 0.3256533312057627, "rougeLsum_recall_stderr": 0.0023856069656370727}}, "2": {"generate_text_restaurant": {"bleu": 9.630291369867987, "bleu_stderr": 0.13549753046024302, "rouge1_fmeasure": 0.4181223330310302, "rouge1_fmeasure_stderr": 0.0020232576936325647, "rouge1_precision": 0.44886308747052966, "rouge1_precision_stderr": 0.0030653689427961226, "rouge1_recall": 0.4345078703253225, "rouge1_recall_stderr": 0.0025475650430768814, "rouge2_fmeasure": 0.18635767606167977, "rouge2_fmeasure_stderr": 0.0016723047591652514, "rouge2_precision": 0.20393782443251954, "rouge2_precision_stderr": 0.0022988281035972273, "rouge2_recall": 0.19337736914798762, "rouge2_recall_stderr": 0.00185489954602544, "rougeL_fmeasure": 0.2928097571700884, "rougeL_fmeasure_stderr": 0.0017552966978288125, "rougeL_precision": 0.31607957889707133, "rougeL_precision_stderr": 0.002589473433632966, "rougeL_recall": 0.3043881139321235, "rougeL_recall_stderr": 0.002132304038142002, "rougeLsum_fmeasure": 0.3438100939181177, "rougeLsum_fmeasure_stderr": 0.0019679894394683483, "rougeLsum_precision": 0.3695227255731898, "rougeLsum_precision_stderr": 0.00282070031070788, "rougeLsum_recall": 0.3571271332319229, "rougeLsum_recall_stderr": 0.0023658526732539117}}, "3": {"generate_text_restaurant": {"bleu": 10.771336904004668, "bleu_stderr": 0.15312208049452972, "rouge1_fmeasure": 0.4246139438060347, "rouge1_fmeasure_stderr": 0.002068822985960878, "rouge1_precision": 0.47121262761824606, "rouge1_precision_stderr": 0.0031706802673694546, "rouge1_recall": 0.4285131204444559, "rouge1_recall_stderr": 0.00259084813925993, "rouge2_fmeasure": 0.19583480506260798, "rouge2_fmeasure_stderr": 0.0017745784799472742, "rouge2_precision": 0.22192545824696955, "rouge2_precision_stderr": 0.0024446292469949274, "rouge2_recall": 0.19735042748477633, "rouge2_recall_stderr": 0.001962335262395526, "rougeL_fmeasure": 0.3025604202708821, "rougeL_fmeasure_stderr": 0.0018763118742909542, "rougeL_precision": 0.33776452672838364, "rougeL_precision_stderr": 0.002772013880864643, "rougeL_recall": 0.3053908517936716, "rougeL_recall_stderr": 0.0022386749143566537, "rougeLsum_fmeasure": 0.35175775657317715, "rougeLsum_fmeasure_stderr": 0.0020815737481426283, "rougeLsum_precision": 0.3904903633666419, "rougeLsum_precision_stderr": 0.0029686040326820764, "rougeLsum_recall": 0.3552152361692601, "rougeLsum_recall_stderr": 0.002487386620131327}}, "4": {"generate_text_restaurant": {"bleu": 11.267530539514095, "bleu_stderr": 0.1677573231958913, "rouge1_fmeasure": 0.43249984090343835, "rouge1_fmeasure_stderr": 0.002029303339376666, "rouge1_precision": 0.4875664382154273, "rouge1_precision_stderr": 0.003185218088206128, "rouge1_recall": 0.4282782601002331, "rouge1_recall_stderr": 0.0024811809614885827, "rouge2_fmeasure": 0.20132801941812545, "rouge2_fmeasure_stderr": 0.0017679869293689926, "rouge2_precision": 0.23104550813725375, "rouge2_precision_stderr": 0.0024366019088569594, "rouge2_recall": 0.19888718264029498, "rouge2_recall_stderr": 0.001882516080327131, "rougeL_fmeasure": 0.3066167803857757, "rougeL_fmeasure_stderr": 0.001864747310583765, "rougeL_precision": 0.3469917638960595, "rougeL_precision_stderr": 0.0027307278162448678, "rougeL_recall": 0.30357116962664776, "rougeL_recall_stderr": 0.002153172746913521, "rougeLsum_fmeasure": 0.356433479440808, "rougeLsum_fmeasure_stderr": 0.002068322803762821, "rougeLsum_precision": 0.4016050584122585, "rougeLsum_precision_stderr": 0.0029687484050154784, "rougeLsum_recall": 0.35340408132516204, "rougeLsum_recall_stderr": 0.0024203053725328372}}, "5": {"generate_text_restaurant": {"bleu": 10.805990819642968, "bleu_stderr": 0.11545747726371132, "rouge1_fmeasure": 0.42703858045940735, "rouge1_fmeasure_stderr": 0.002035276652428456, "rouge1_precision": 0.46998019703375354, "rouge1_precision_stderr": 0.0031239647333913445, "rouge1_recall": 0.43070572612561325, "rouge1_recall_stderr": 0.002457470355676941, "rouge2_fmeasure": 0.19734778489236487, "rouge2_fmeasure_stderr": 0.0017398333866025894, "rouge2_precision": 0.22095953832665552, "rouge2_precision_stderr": 0.002353597555734135, "rouge2_recall": 0.1987243871558035, "rouge2_recall_stderr": 0.0018784818554072877, "rougeL_fmeasure": 0.3017510704812495, "rougeL_fmeasure_stderr": 0.0018231271871051772, "rougeL_precision": 0.3325206520940773, "rougeL_precision_stderr": 0.002612965421345996, "rougeL_recall": 0.3056110355009581, "rougeL_recall_stderr": 0.002176897829405239, "rougeLsum_fmeasure": 0.3526562252374031, "rougeLsum_fmeasure_stderr": 0.002039422626192226, "rougeLsum_precision": 0.3883766916064333, "rougeLsum_precision_stderr": 0.002916081958006691, "rougeLsum_recall": 0.35559042723108397, "rougeLsum_recall_stderr": 0.0023422683169970725}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.1814410356065763, "bleu_stderr": 0.11929627005647012, "rouge1_fmeasure": 0.2188247155119966, "rouge1_fmeasure_stderr": 0.0026101698852964428, "rouge1_precision": 0.1682140354361548, "rouge1_precision_stderr": 0.0024311651181596846, "rouge1_recall": 0.35168988214341523, "rouge1_recall_stderr": 0.004257802996267162, "rouge2_fmeasure": 0.049755066362456114, "rouge2_fmeasure_stderr": 0.001711057906744696, "rouge2_precision": 0.03791114624887027, "rouge2_precision_stderr": 0.001430715346143808, "rouge2_recall": 0.08181326285418697, "rouge2_recall_stderr": 0.0027684668080112493, "rougeL_fmeasure": 0.16347253111222268, "rougeL_fmeasure_stderr": 0.0020596404700326306, "rougeL_precision": 0.12558538899658162, "rougeL_precision_stderr": 0.0019306618262220862, "rougeL_recall": 0.26406296625514597, "rougeL_recall_stderr": 0.0034141022743443975, "rougeLsum_fmeasure": 0.1707786995081715, "rougeLsum_fmeasure_stderr": 0.002220764586073378, "rougeLsum_precision": 0.13072162961307798, "rougeLsum_precision_stderr": 0.0019975037472617324, "rougeLsum_recall": 0.27675311185951984, "rougeLsum_recall_stderr": 0.003756707707901523}}, "1": {"article_DOC_summary": {"bleu": 1.4164772106615187, "bleu_stderr": 0.08503842048783962, "rouge1_fmeasure": 0.17485668915463046, "rouge1_fmeasure_stderr": 0.0024040861492345958, "rouge1_precision": 0.12394690078102485, "rouge1_precision_stderr": 0.0017820854664639617, "rouge1_recall": 0.30883381009085337, "rouge1_recall_stderr": 0.004143617002757454, "rouge2_fmeasure": 0.034970894707131765, "rouge2_fmeasure_stderr": 0.0013750874506006509, "rouge2_precision": 0.02454039849295794, "rouge2_precision_stderr": 0.0009642339010215241, "rouge2_recall": 0.06338989802824146, "rouge2_recall_stderr": 0.0025845302772511, "rougeL_fmeasure": 0.13792484720753254, "rougeL_fmeasure_stderr": 0.00184311444020864, "rougeL_precision": 0.09759605191150027, "rougeL_precision_stderr": 0.0013546647766234851, "rougeL_recall": 0.24498653012258598, "rougeL_recall_stderr": 0.0032922471031046553, "rougeLsum_fmeasure": 0.14106410762921118, "rougeLsum_fmeasure_stderr": 0.00197754854435336, "rougeLsum_precision": 0.09975522247129645, "rougeLsum_precision_stderr": 0.001443168667820945, "rougeLsum_recall": 0.25068739231214776, "rougeLsum_recall_stderr": 0.003536217595269335}}, "2": {"article_DOC_summary": {"bleu": 1.3211406116055093, "bleu_stderr": 0.05632158339691826, "rouge1_fmeasure": 0.17119896569207846, "rouge1_fmeasure_stderr": 0.0023973191304758746, "rouge1_precision": 0.1212713815463862, "rouge1_precision_stderr": 0.001783930979666327, "rouge1_recall": 0.3027696164744973, "rouge1_recall_stderr": 0.004069720967342189, "rouge2_fmeasure": 0.032088581665832575, "rouge2_fmeasure_stderr": 0.0013254566404233465, "rouge2_precision": 0.022526851037537605, "rouge2_precision_stderr": 0.0009300320053962364, "rouge2_recall": 0.05803699224106711, "rouge2_recall_stderr": 0.002478507440389671, "rougeL_fmeasure": 0.1331419291803311, "rougeL_fmeasure_stderr": 0.0018112812768873992, "rougeL_precision": 0.09410711927777662, "rougeL_precision_stderr": 0.0013305323171338883, "rougeL_recall": 0.2369780862526828, "rougeL_recall_stderr": 0.0032212483252820195, "rougeLsum_fmeasure": 0.1378737759652496, "rougeLsum_fmeasure_stderr": 0.0019533435435502575, "rougeLsum_precision": 0.0973756908203134, "rougeLsum_precision_stderr": 0.0014271599181187183, "rougeLsum_recall": 0.24589465344432024, "rougeLsum_recall_stderr": 0.0035007571446406256}}, "3": {"article_DOC_summary": {"bleu": 1.4406275619553672, "bleu_stderr": 0.058943511303575426, "rouge1_fmeasure": 0.16908880821212016, "rouge1_fmeasure_stderr": 0.0025898440173812076, "rouge1_precision": 0.12267341712650358, "rouge1_precision_stderr": 0.00207297750674979, "rouge1_recall": 0.29346318087456813, "rouge1_recall_stderr": 0.004412522962315509, "rouge2_fmeasure": 0.03314896853957152, "rouge2_fmeasure_stderr": 0.0013908257283640876, "rouge2_precision": 0.023615304490600033, "rouge2_precision_stderr": 0.0010046076586988078, "rouge2_recall": 0.05931770918646783, "rouge2_recall_stderr": 0.002583579920531965, "rougeL_fmeasure": 0.13158510148593067, "rougeL_fmeasure_stderr": 0.0020014770100106496, "rougeL_precision": 0.09519232603078606, "rougeL_precision_stderr": 0.0015734855162649944, "rougeL_recall": 0.22996956742200556, "rougeL_recall_stderr": 0.00356629562100884, "rougeLsum_fmeasure": 0.13667047371150057, "rougeLsum_fmeasure_stderr": 0.0021600836418570976, "rougeLsum_precision": 0.0987948573594369, "rougeLsum_precision_stderr": 0.001680092786160822, "rougeLsum_recall": 0.23916103459926824, "rougeLsum_recall_stderr": 0.003841293731139315}}, "4": {"article_DOC_summary": {"bleu": 0.6685820712764758, "bleu_stderr": 0.11003965221099908, "rouge1_fmeasure": 0.04566365412307027, "rouge1_fmeasure_stderr": 0.002608741489638274, "rouge1_precision": 0.036834822457244766, "rouge1_precision_stderr": 0.0022079340145582244, "rouge1_recall": 0.07337453869001616, "rouge1_recall_stderr": 0.004314314932527252, "rouge2_fmeasure": 0.00874385192747724, "rouge2_fmeasure_stderr": 0.0008092464001035177, "rouge2_precision": 0.006497191357163194, "rouge2_precision_stderr": 0.0006016918414205361, "rouge2_recall": 0.014978313036291765, "rouge2_recall_stderr": 0.0014510780480090683, "rougeL_fmeasure": 0.03550416488438028, "rougeL_fmeasure_stderr": 0.0020020706708868776, "rougeL_precision": 0.028775879177447013, "rougeL_precision_stderr": 0.0017095958814072434, "rougeL_recall": 0.05725787803054188, "rougeL_recall_stderr": 0.003351554553300089, "rougeLsum_fmeasure": 0.03770504825258967, "rougeLsum_fmeasure_stderr": 0.0021688966924711204, "rougeLsum_precision": 0.03052315595597832, "rougeLsum_precision_stderr": 0.0018382248537160094, "rougeLsum_recall": 0.06056408978110664, "rougeLsum_recall_stderr": 0.0035955665511950294}}, "5": {"article_DOC_summary": {"bleu": 3.330855196908569e-39, "bleu_stderr": 2.2953575552071226e-33, "rouge1_fmeasure": 0.002202987774184108, "rouge1_fmeasure_stderr": 0.0006658652488222124, "rouge1_precision": 0.0025092290685345187, "rouge1_precision_stderr": 0.0008065208895136817, "rouge1_recall": 0.00204279104163942, "rouge1_recall_stderr": 0.0005925317015988438, "rouge2_fmeasure": 0.00024851863402463746, "rouge2_fmeasure_stderr": 0.00020210817841172796, "rouge2_precision": 0.00031845928766017557, "rouge2_precision_stderr": 0.0002726745419818294, "rouge2_recall": 0.00021032426692804053, "rouge2_recall_stderr": 0.00016342749062440463, "rougeL_fmeasure": 0.0016217715192546416, "rougeL_fmeasure_stderr": 0.00048067108652986303, "rougeL_precision": 0.0018256414840619524, "rougeL_precision_stderr": 0.0005744051717215062, "rougeL_recall": 0.0015255275808323426, "rougeL_recall_stderr": 0.0004364013489751857, "rougeLsum_fmeasure": 0.0017788861730293213, "rougeLsum_fmeasure_stderr": 0.0005248009571798277, "rougeLsum_precision": 0.0020224773879338985, "rougeLsum_precision_stderr": 0.0006369133276637897, "rougeLsum_recall": 0.001658634237434707, "rougeLsum_recall_stderr": 0.0004694737360395629}}}} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..82c1b85464d5e513ce4bf1b1af35e573da894af1 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.36676283856494113, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0474507783379639 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.062332014806189766, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0016383703848229427 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.293777806984314, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005252782658193723 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09441575378592391, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020680531546244394 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028711966510953046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000984576654338761 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1322458599845081, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003314534134287909 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04314501248705826, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001258246183189075 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.057942425405580346, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014255082882140484 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2776785385893423, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0049436461818446135 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.0882116048398588, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018389749448658346 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.058934717518613434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001525972938212972 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.27624443355923034, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004852154002930374 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08927510610731734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001938092014044731 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7322d96c8e7df06944cfdb0123154f88c361e546 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.42447490695849177, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.031118881647332453 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07242166849415733, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013848386081542273 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3588660487979018, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005213387725734495 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11353731182395607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019319506260635304 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03288701360932817, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000839098109533103 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17107042365285788, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036083953475667513 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.051698558921326514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012001219460540538 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0670061822698939, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001227160746048086 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3346245385921824, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004814146748998719 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10521613042548694, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017181082493525662 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06851784863794814, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013044655089246824 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.33834197646314856, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004780908665148567 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10736276773335406, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018148053880352902 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..be69c5c1525e943335e437401b3e80e4cbb92b68 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5078474394915784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04940313819145897 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07524299617261106, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013542247809418073 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3789792715638066, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005087267508547312 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11839194985760551, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018550236570084812 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03451419278556197, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008480461582178029 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18485893110508558, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037439432130783046 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05453717672261224, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012063786187369366 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06970631509385179, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012132144640462751 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35342460023270555, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0047409890816951 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10986668151378429, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016757644991035844 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07085029048321866, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001272417656582146 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35589542269045665, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004677996287698992 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11142211614255489, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017402016546960485 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1177c560cd0899940a0d569f61c94fd83ae80a96 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5321467980679849, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.030789259184486762 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07467739697980223, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013056742555484042 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3765931475512988, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005136827785933215 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11775282391938749, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018121209623013599 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03425895499250951, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007949938460894235 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1857701112713038, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037899558051587997 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05437250272050667, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011494478736656965 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0691367241290362, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011898077979863157 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35044113186494674, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004789067731865496 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.109142035871985, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016567099883848363 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07016534933559325, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001231446670361234 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3527313952049522, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004720204023911692 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11055745133283143, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017021172309438397 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ba4a91655fc4d4ffb68a2d6fdf6002054a96d743 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5836215112044281, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0373980578845506 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07814979242067882, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013719481084767942 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3904381500627582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005108365571685621 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12273951831524596, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018568477885135075 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.036278020218023364, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008590667413980339 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19568480085429035, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037894995606282777 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05731193809218633, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012015065055436362 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07184600146882388, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012338794593141857 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.361289411306646, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004721144658086456 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11294640173282941, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016715462444065227 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07360622983361918, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012935410743410267 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3670374936279833, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004716543868495296 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11548902373578677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017405908622108689 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c907f6bbc1cc6e015bdad63209c2506a5793bf64 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.594609825520194, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04115839696833975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07606093952092045, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012363342608298056 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3956239968710567, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005142405199368944 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12086027376047605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017433543864987184 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.034848706116865254, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007661213026779092 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1971845061377734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003781803943041313 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.055825671549297295, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011219041594589493 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06988703720341218, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001122929060032178 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3647605769777058, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0047210888757834 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11109358926885284, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001582946667660359 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07150521311673122, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011539037542073426 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3721409413587192, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047326985289146365 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11358138097063522, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016202519807538079 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f37dc3a437198fb90e0cc5a6ade3296090136f53 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1319714359255099, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018067861281345137 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.22663257957285188, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002733984829707475 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.15459597826273924, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018270611999879997 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02346568721104801, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006971468696509421 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04305065808208426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013646495534821036 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.027936413268100608, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007972095177959765 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1050094945336366, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012983078223279439 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18568833868889176, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022086628996599916 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12417210909685761, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013302228377918145 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1211307288912133, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001638963005635593 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.20936613117867833, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025285661065844287 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1422075831554883, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016619749917407194 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.318952551089346, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04329525521577347 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f2a46c53f78304e6980ad8b8902c266041843d87 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17493391960845747, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019881056363054072 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.30039251220979346, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027564678289120448 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20579895579192997, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019171748643174895 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.040554616651465696, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008659890131539827 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07316485920387228, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016147073802019601 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04823668695482641, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009745669933822557 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.124842470774516, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001319051588032341 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22232295572810765, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00218343118232531 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1484222303241806, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013020741099865607 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16389878356035073, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018573417662959208 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2828415570261487, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002627261412365232 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.19302273540773426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001789695068656324 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.4993327349018104, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.060039405630241266 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..61a51672c3ad707bdedf05467386e462f321f48c --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.18456973112779013, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002015516204243605 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.31320510678716973, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026816066901912826 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.215446597689823, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018467682989689277 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04451908592886625, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009130557961238952 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07879022976243907, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016883257356260532 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05230636200823752, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009952603118013488 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1316268882646582, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013690654713722978 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23148383110872217, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002153117823688896 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15530146813359313, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012696789175546876 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.17349312338034656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018858372860279045 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.29539552159407584, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025507540114149945 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20267202658830938, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001723884821520709 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.848425645647928, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07632604642356548 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..aae941e3bef4f9d91e8cd58b9fea833ddfd2d992 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1616397163764498, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023460161842419813 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.26019267483379616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032056026696719647 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18186666197279194, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002214876076414925 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03925295558880392, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009449386730106019 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06561949094566538, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016314095494124245 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04453744596750722, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009892511091368977 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11667604287371745, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016762280786544305 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19390457934260266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025516384846018345 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13202316706879197, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001565731448359357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.15230978309868673, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0022054724157184874 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2461258416944667, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.003046019155993613 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17153352468735855, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020795362207751736 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.803251560776854, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0956254167064949 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..66d57ed9cefda4336fd9bd1b8a59be90c718325c --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.0540655546367526, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019863598257229935 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08630893835073304, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028923078072790034 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05848926036885533, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001947796388751384 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.013419788420821602, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007196640004372746 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.022948179606902694, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011746702031675198 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.014698290853528981, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0006960360254178698 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.04061005184395829, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015089448751204634 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06684826672013897, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023100255832951676 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.044046354099571715, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014521599460521 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.05070517916237353, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018676632653238442 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08116451423168446, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027292176658861946 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05480556417744295, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018205484087403967 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.6541873598701015, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04137927662792639 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b25913cc1399c670a1fc94db4f0236e8a58aaaed --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009622620991293292, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0009755776848685625 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.014660623303221735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013738443681724601 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009922885274947888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00091535752249209 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0025945823584633773, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0003550261333440917 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.004296371055249484, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.000576258075124869 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0027535231928660694, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00034248340049010525 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.007418445736015545, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0007597278932642448 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.01150875523797143, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001083700258541403 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007698903693431021, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0007102473355679709 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.008921009893079637, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0009010991448249183 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.01368434519987409, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012818488127390474 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.009228479004212309, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008517809180671035 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.8017672277263173e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 3.4167644481328265e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..56c8bd0fe00e6d2b7cfa0221536b3f6fcd88c0c3 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 3.2944515852286527, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0687957809640445 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.13683365368832767, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0014688301287434024 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.28316158012799547, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025200608344027693 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.1814799362167216, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0017831836075280368 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.046755060522420185, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0008806060921358351 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.09586697768686785, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001719510820833045 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.06187846081562434, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001129424676101297 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.12660643084306702, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00126456533149021 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.264267984967182, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022332757179524803 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.16841364171833556, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015464664247715663 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.11737623006499737, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0013285621448530893 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.24349593138163397, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002354566720998469 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.15579956125425456, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016372102304097094 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c43f4995aaa53184e1e51d339596c11b074c6fed --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 8.52641209830111, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12582983777195597 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.44140716426798104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032213924886028253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4052286843296632, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002639166874418895 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3977363846975939, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022382388166838187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.18864819780738046, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0022621645695871918 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.16963873808583682, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001847799566651559 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.16696906460089045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017222149044682246 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.31455069215794823, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0025903719800358703 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2903012525772825, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002143374874342348 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2829785990744798, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001784528829213968 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3567420815242637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0029468018540509057 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3256533312057627, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0023856069656370727 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3201857670611568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002098087765270582 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4e518f60dfd89dc71f90066dcd36402b6ddd9c07 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.630291369867987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13549753046024302 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.44886308747052966, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0030653689427961226 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4345078703253225, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025475650430768814 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4181223330310302, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020232576936325647 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.20393782443251954, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0022988281035972273 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19337736914798762, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00185489954602544 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18635767606167977, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016723047591652514 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.31607957889707133, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002589473433632966 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3043881139321235, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002132304038142002 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2928097571700884, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017552966978288125 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3695227255731898, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00282070031070788 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3571271332319229, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0023658526732539117 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3438100939181177, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019679894394683483 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fe313dec5698245740ceaf8a88ed78ae1cae72bd --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.771336904004668, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15312208049452972 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.47121262761824606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031706802673694546 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4285131204444559, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.00259084813925993 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4246139438060347, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002068822985960878 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.22192545824696955, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024446292469949274 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19735042748477633, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001962335262395526 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19583480506260798, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017745784799472742 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.33776452672838364, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002772013880864643 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3053908517936716, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022386749143566537 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3025604202708821, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018763118742909542 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3904903633666419, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0029686040326820764 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3552152361692601, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002487386620131327 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35175775657317715, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020815737481426283 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..7cb54c5c0be681ac296fd9a0b93a8a01a5fb6051 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.267530539514095, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1677573231958913 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4875664382154273, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003185218088206128 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4282782601002331, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0024811809614885827 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43249984090343835, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002029303339376666 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.23104550813725375, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024366019088569594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19888718264029498, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001882516080327131 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20132801941812545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017679869293689926 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3469917638960595, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0027307278162448678 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.30357116962664776, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002153172746913521 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3066167803857757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001864747310583765 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4016050584122585, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0029687484050154784 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35340408132516204, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024203053725328372 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.356433479440808, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002068322803762821 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1e4d2e781f376ae0889166547def2c9c074f8bca --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.805990819642968, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11545747726371132 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.46998019703375354, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031239647333913445 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43070572612561325, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002457470355676941 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.42703858045940735, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002035276652428456 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.22095953832665552, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002353597555734135 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1987243871558035, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0018784818554072877 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19734778489236487, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017398333866025894 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3325206520940773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002612965421345996 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3056110355009581, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002176897829405239 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3017510704812495, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018231271871051772 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3883766916064333, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002916081958006691 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35559042723108397, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0023422683169970725 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3526562252374031, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002039422626192226 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_0.json b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..402e6676ee9240e646d86f33cac3abd2f672ed58 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1682140354361548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0024311651181596846 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.35168988214341523, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004257802996267162 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2188247155119966, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026101698852964428 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03791114624887027, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001430715346143808 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08181326285418697, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027684668080112493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.049755066362456114, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001711057906744696 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12558538899658162, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0019306618262220862 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.26406296625514597, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034141022743443975 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16347253111222268, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020596404700326306 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13072162961307798, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019975037472617324 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.27675311185951984, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003756707707901523 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1707786995081715, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002220764586073378 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.1814410356065763, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11929627005647012 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_1.json b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f10a5428df56a31eafc499e45e9938a67fcd22f2 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12394690078102485, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017820854664639617 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.30883381009085337, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004143617002757454 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17485668915463046, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024040861492345958 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02454039849295794, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009642339010215241 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06338989802824146, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025845302772511 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.034970894707131765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013750874506006509 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09759605191150027, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013546647766234851 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24498653012258598, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032922471031046553 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13792484720753254, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00184311444020864 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09975522247129645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001443168667820945 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.25068739231214776, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003536217595269335 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14106410762921118, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00197754854435336 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4164772106615187, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08503842048783962 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_2.json b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b37ac234756e72cee9f5a371f3068fc12b4d49f7 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1212713815463862, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001783930979666327 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3027696164744973, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004069720967342189 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17119896569207846, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023973191304758746 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.022526851037537605, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009300320053962364 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05803699224106711, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002478507440389671 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.032088581665832575, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013254566404233465 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09410711927777662, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013305323171338883 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2369780862526828, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032212483252820195 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1331419291803311, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018112812768873992 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0973756908203134, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014271599181187183 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24589465344432024, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035007571446406256 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1378737759652496, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019533435435502575 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3211406116055093, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05632158339691826 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_3.json b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..32d475e6dd0c651d42d2517400bf0d929f220bd1 --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12267341712650358, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00207297750674979 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.29346318087456813, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004412522962315509 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16908880821212016, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025898440173812076 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.023615304490600033, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010046076586988078 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05931770918646783, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002583579920531965 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03314896853957152, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013908257283640876 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09519232603078606, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015734855162649944 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.22996956742200556, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00356629562100884 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13158510148593067, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020014770100106496 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0987948573594369, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001680092786160822 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23916103459926824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003841293731139315 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13667047371150057, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021600836418570976 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4406275619553672, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.058943511303575426 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_4.json b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..78e94dde69c0e5fb7674bca696e244e8aa2fa4dc --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.036834822457244766, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0022079340145582244 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07337453869001616, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004314314932527252 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04566365412307027, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002608741489638274 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.006497191357163194, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006016918414205361 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.014978313036291765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0014510780480090683 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00874385192747724, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0008092464001035177 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.028775879177447013, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017095958814072434 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05725787803054188, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003351554553300089 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03550416488438028, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020020706708868776 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03052315595597832, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018382248537160094 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.06056408978110664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035955665511950294 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03770504825258967, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021688966924711204 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6685820712764758, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11003965221099908 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_5.json b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f91b475386b598ac1cf8956ae8be487217cd7f9f --- /dev/null +++ b/perplexity50/evaluation/generation/slim.perplexity50_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0025092290685345187, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008065208895136817 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.00204279104163942, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005925317015988438 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002202987774184108, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0006658652488222124 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00031845928766017557, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0002726745419818294 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00021032426692804053, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00016342749062440463 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00024851863402463746, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00020210817841172796 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0018256414840619524, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005744051717215062 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0015255275808323426, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004364013489751857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0016217715192546416, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00048067108652986303 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0020224773879338985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0006369133276637897 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.001658634237434707, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0004694737360395629 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0017788861730293213, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005248009571798277 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.330855196908569e-39, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 2.2953575552071226e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4-perplexity/perplexity50/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/rankeval/perplexity50_0.csv b/perplexity50/evaluation/rankeval/perplexity50_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..e973a4734e58e66af876bfceab785bd6e3e2996d --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.332,0.014899597242811483,0 +anli_r2,acc,0.335,0.014933117490932572,0 +anli_r3,acc,0.3383333333333333,0.013664144006618275,0 +arc_challenge,acc,0.28071672354948807,0.013131238126975576,0 +arc_challenge,acc_norm,0.28498293515358364,0.013191348179838793,0 +arc_easy,acc,0.6106902356902357,0.01000521278287814,0 +arc_easy,acc_norm,0.5315656565656566,0.010239317603199509,0 +boolq,acc,0.5675840978593272,0.008664798701065799,1 +cb,acc,0.44642857142857145,0.06703189227942398,1 +cb,f1,0.24357864357864356,,1 +copa,acc,0.81,0.03942772444036623,0 +hellaswag,acc,0.46703843855805616,0.0049789271647928835,0 +hellaswag,acc_norm,0.6088428599880502,0.004870121051762726,0 +piqa,acc,0.7524483133841132,0.010069703966857102,0 +piqa,acc_norm,0.7540805223068553,0.010047331865625184,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.838,0.011657267771304405,0 +sciq,acc_norm,0.734,0.01397996564514516,0 +storycloze_2016,acc,0.7140566541956174,0.010449259851345843,0 +winogrande,acc,0.590370955011839,0.013821049109655462,0 diff --git a/perplexity50/evaluation/rankeval/perplexity50_0.json b/perplexity50/evaluation/rankeval/perplexity50_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ef4719fd907c0588f2820f7e735f6f57e464746c --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811483 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932572 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618275 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.24357864357864356 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.46703843855805616, + "acc_stderr": 0.0049789271647928835, + "acc_norm": 0.6088428599880502, + "acc_norm_stderr": 0.004870121051762726 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655462 + }, + "storycloze_2016": { + "acc": 0.7140566541956174, + "acc_stderr": 0.010449259851345843 + }, + "boolq": { + "acc": 0.5675840978593272, + "acc_stderr": 0.008664798701065799 + }, + "arc_easy": { + "acc": 0.6106902356902357, + "acc_stderr": 0.01000521278287814, + "acc_norm": 0.5315656565656566, + "acc_norm_stderr": 0.010239317603199509 + }, + "arc_challenge": { + "acc": 0.28071672354948807, + "acc_stderr": 0.013131238126975576, + "acc_norm": 0.28498293515358364, + "acc_norm_stderr": 0.013191348179838793 + }, + "sciq": { + "acc": 0.838, + "acc_stderr": 0.011657267771304405, + "acc_norm": 0.734, + "acc_norm_stderr": 0.01397996564514516 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.010069703966857102, + "acc_norm": 0.7540805223068553, + "acc_norm_stderr": 0.010047331865625184 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/rankeval/perplexity50_1.csv b/perplexity50/evaluation/rankeval/perplexity50_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..6d0ab3f3a056236c2e77a81a3b9e17ed00fa2256 --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.332,0.014899597242811485,0 +anli_r2,acc,0.339,0.014976758771620344,0 +anli_r3,acc,0.3358333333333333,0.013639261190932882,0 +arc_challenge,acc,0.28668941979522183,0.013214986329274777,0 +arc_challenge,acc_norm,0.3122866894197952,0.013542598541688065,0 +arc_easy,acc,0.6123737373737373,0.009997307914447614,0 +arc_easy,acc_norm,0.5669191919191919,0.010167478013701796,0 +boolq,acc,0.5522935779816514,0.008697094687974059,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.255050505050505,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.46395140410276836,0.004976796060456438,0 +hellaswag,acc_norm,0.6121290579565823,0.004862690594815717,0 +piqa,acc,0.7377584330794341,0.010262502565172449,0 +piqa,acc_norm,0.7383025027203483,0.01025563077270823,0 +rte,acc,0.5306859205776173,0.030039730592197812,0 +sciq,acc,0.886,0.01005510343582333,0 +sciq,acc_norm,0.863,0.01087884871433332,0 +storycloze_2016,acc,0.7071084981293426,0.010523873293246304,0 +winogrande,acc,0.5840568271507498,0.013852485356798266,0 diff --git a/perplexity50/evaluation/rankeval/perplexity50_1.json b/perplexity50/evaluation/rankeval/perplexity50_1.json new file mode 100644 index 0000000000000000000000000000000000000000..50cc2cb638634042655ad66d9f426ac4d1b4ad71 --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811485 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932882 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.255050505050505 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.46395140410276836, + "acc_stderr": 0.004976796060456438, + "acc_norm": 0.6121290579565823, + "acc_norm_stderr": 0.004862690594815717 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197812 + }, + "winogrande": { + "acc": 0.5840568271507498, + "acc_stderr": 0.013852485356798266 + }, + "storycloze_2016": { + "acc": 0.7071084981293426, + "acc_stderr": 0.010523873293246304 + }, + "boolq": { + "acc": 0.5522935779816514, + "acc_stderr": 0.008697094687974059 + }, + "arc_easy": { + "acc": 0.6123737373737373, + "acc_stderr": 0.009997307914447614, + "acc_norm": 0.5669191919191919, + "acc_norm_stderr": 0.010167478013701796 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.013214986329274777, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688065 + }, + "sciq": { + "acc": 0.886, + "acc_stderr": 0.01005510343582333, + "acc_norm": 0.863, + "acc_norm_stderr": 0.01087884871433332 + }, + "piqa": { + "acc": 0.7377584330794341, + "acc_stderr": 0.010262502565172449, + "acc_norm": 0.7383025027203483, + "acc_norm_stderr": 0.01025563077270823 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/rankeval/perplexity50_2.csv b/perplexity50/evaluation/rankeval/perplexity50_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..ee1e97d97a57a2c263a541826c37350e35c597be --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.341,0.014998131348402706,0 +anli_r2,acc,0.336,0.014944140233795027,0 +anli_r3,acc,0.33,0.013579531277800918,0 +arc_challenge,acc,0.302901023890785,0.013428241573185349,0 +arc_challenge,acc_norm,0.30631399317406144,0.013470584417276513,0 +arc_easy,acc,0.6287878787878788,0.009913599001845737,0 +arc_easy,acc_norm,0.5938552188552189,0.010077409815364058,0 +boolq,acc,0.5694189602446483,0.008660360145988744,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.293715318105562,,1 +copa,acc,0.81,0.03942772444036623,0 +hellaswag,acc,0.4645488946425015,0.004977223485342026,0 +hellaswag,acc_norm,0.6143198566022705,0.004857607641160633,0 +piqa,acc,0.7426550598476604,0.01019992106479251,0 +piqa,acc_norm,0.7486398258977149,0.010121156016819245,0 +rte,acc,0.555956678700361,0.029907396333795994,0 +sciq,acc,0.885,0.010093407594904617,0 +sciq,acc_norm,0.856,0.01110798754893915,0 +storycloze_2016,acc,0.7071084981293426,0.010523873293246304,0 +winogrande,acc,0.5966850828729282,0.013787257285896236,0 diff --git a/perplexity50/evaluation/rankeval/perplexity50_2.json b/perplexity50/evaluation/rankeval/perplexity50_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c6238594c1a4bed3ee0b5e80d2bcf54dc61c6904 --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.341, + "acc_stderr": 0.014998131348402706 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.33, + "acc_stderr": 0.013579531277800918 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.293715318105562 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.4645488946425015, + "acc_stderr": 0.004977223485342026, + "acc_norm": 0.6143198566022705, + "acc_norm_stderr": 0.004857607641160633 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795994 + }, + "winogrande": { + "acc": 0.5966850828729282, + "acc_stderr": 0.013787257285896236 + }, + "storycloze_2016": { + "acc": 0.7071084981293426, + "acc_stderr": 0.010523873293246304 + }, + "boolq": { + "acc": 0.5694189602446483, + "acc_stderr": 0.008660360145988744 + }, + "arc_easy": { + "acc": 0.6287878787878788, + "acc_stderr": 0.009913599001845737, + "acc_norm": 0.5938552188552189, + "acc_norm_stderr": 0.010077409815364058 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.30631399317406144, + "acc_norm_stderr": 0.013470584417276513 + }, + "sciq": { + "acc": 0.885, + "acc_stderr": 0.010093407594904617, + "acc_norm": 0.856, + "acc_norm_stderr": 0.01110798754893915 + }, + "piqa": { + "acc": 0.7426550598476604, + "acc_stderr": 0.01019992106479251, + "acc_norm": 0.7486398258977149, + "acc_norm_stderr": 0.010121156016819245 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/rankeval/perplexity50_3.csv b/perplexity50/evaluation/rankeval/perplexity50_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..08e1006cb59ac33f194923f4f6de87e6350cd33a --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.015008706182121733,0 +anli_r2,acc,0.331,0.014888272588203943,0 +anli_r3,acc,0.3233333333333333,0.013508372867300226,0 +arc_challenge,acc,0.295221843003413,0.013329750293382318,0 +arc_challenge,acc_norm,0.31313993174061433,0.013552671543623503,0 +arc_easy,acc,0.6317340067340067,0.009897286209010892,0 +arc_easy,acc_norm,0.6127946127946128,0.009995312065890341,0 +boolq,acc,0.5758409785932722,0.008643869023388125,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.32495309568480296,,1 +copa,acc,0.79,0.040936018074033256,0 +hellaswag,acc,0.46106353316072496,0.004974628903829131,0 +hellaswag,acc_norm,0.6156144194383589,0.004854555294017531,0 +piqa,acc,0.7388465723612623,0.010248738649935576,0 +piqa,acc_norm,0.7431991294885746,0.010192864802278039,0 +rte,acc,0.51985559566787,0.030072723167317184,0 +sciq,acc,0.89,0.009899393819724428,0 +sciq,acc_norm,0.872,0.010570133761108665,0 +storycloze_2016,acc,0.7167290219134153,0.010419760409155363,0 +winogrande,acc,0.5864246250986582,0.0138409717631953,0 diff --git a/perplexity50/evaluation/rankeval/perplexity50_3.json b/perplexity50/evaluation/rankeval/perplexity50_3.json new file mode 100644 index 0000000000000000000000000000000000000000..978fd56fe1aa43934b2c1b13bc81e74bdf6251ce --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.015008706182121733 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.014888272588203943 + }, + "anli_r3": { + "acc": 0.3233333333333333, + "acc_stderr": 0.013508372867300226 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.32495309568480296 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.46106353316072496, + "acc_stderr": 0.004974628903829131, + "acc_norm": 0.6156144194383589, + "acc_norm_stderr": 0.004854555294017531 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317184 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.0138409717631953 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.5758409785932722, + "acc_stderr": 0.008643869023388125 + }, + "arc_easy": { + "acc": 0.6317340067340067, + "acc_stderr": 0.009897286209010892, + "acc_norm": 0.6127946127946128, + "acc_norm_stderr": 0.009995312065890341 + }, + "arc_challenge": { + "acc": 0.295221843003413, + "acc_stderr": 0.013329750293382318, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623503 + }, + "sciq": { + "acc": 0.89, + "acc_stderr": 0.009899393819724428, + "acc_norm": 0.872, + "acc_norm_stderr": 0.010570133761108665 + }, + "piqa": { + "acc": 0.7388465723612623, + "acc_stderr": 0.010248738649935576, + "acc_norm": 0.7431991294885746, + "acc_norm_stderr": 0.010192864802278039 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/rankeval/perplexity50_4.csv b/perplexity50/evaluation/rankeval/perplexity50_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..fb43cdf0a830a23495946315b6232e4ec2f21737 --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.324,0.014806864733738859,0 +anli_r2,acc,0.341,0.014998131348402702,0 +anli_r3,acc,0.3283333333333333,0.013562032919529026,0 +arc_challenge,acc,0.30204778156996587,0.01341751914471642,0 +arc_challenge,acc_norm,0.3242320819112628,0.013678810399518819,0 +arc_easy,acc,0.6342592592592593,0.009882988069418829,0 +arc_easy,acc_norm,0.6056397306397306,0.01002817603839299,0 +boolq,acc,0.5691131498470948,0.008661108320775369,1 +cb,acc,0.4642857142857143,0.0672477765493766,1 +cb,f1,0.32666666666666666,,1 +copa,acc,0.85,0.03588702812826373,0 +hellaswag,acc,0.4640509858593906,0.004976867796583557,0 +hellaswag,acc_norm,0.6164110734913364,0.004852658876775374,0 +piqa,acc,0.7426550598476604,0.01019992106479251,0 +piqa,acc_norm,0.7464635473340587,0.010150090834551786,0 +rte,acc,0.4981949458483754,0.030096267148976633,0 +sciq,acc,0.891,0.009859828407037183,0 +sciq,acc_norm,0.882,0.01020686926438179,0 +storycloze_2016,acc,0.7204703367183325,0.01037770209970486,0 +winogrande,acc,0.5880031570639306,0.013833112857645935,0 diff --git a/perplexity50/evaluation/rankeval/perplexity50_4.json b/perplexity50/evaluation/rankeval/perplexity50_4.json new file mode 100644 index 0000000000000000000000000000000000000000..52620066adec9c5d2e7ecd413967e5987638b279 --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.014806864733738859 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402702 + }, + "anli_r3": { + "acc": 0.3283333333333333, + "acc_stderr": 0.013562032919529026 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.32666666666666666 + }, + "copa": { + "acc": 0.85, + "acc_stderr": 0.03588702812826373 + }, + "hellaswag": { + "acc": 0.4640509858593906, + "acc_stderr": 0.004976867796583557, + "acc_norm": 0.6164110734913364, + "acc_norm_stderr": 0.004852658876775374 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.5880031570639306, + "acc_stderr": 0.013833112857645935 + }, + "storycloze_2016": { + "acc": 0.7204703367183325, + "acc_stderr": 0.01037770209970486 + }, + "boolq": { + "acc": 0.5691131498470948, + "acc_stderr": 0.008661108320775369 + }, + "arc_easy": { + "acc": 0.6342592592592593, + "acc_stderr": 0.009882988069418829, + "acc_norm": 0.6056397306397306, + "acc_norm_stderr": 0.01002817603839299 + }, + "arc_challenge": { + "acc": 0.30204778156996587, + "acc_stderr": 0.01341751914471642, + "acc_norm": 0.3242320819112628, + "acc_norm_stderr": 0.013678810399518819 + }, + "sciq": { + "acc": 0.891, + "acc_stderr": 0.009859828407037183, + "acc_norm": 0.882, + "acc_norm_stderr": 0.01020686926438179 + }, + "piqa": { + "acc": 0.7426550598476604, + "acc_stderr": 0.01019992106479251, + "acc_norm": 0.7464635473340587, + "acc_norm_stderr": 0.010150090834551786 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity50/evaluation/rankeval/perplexity50_5.csv b/perplexity50/evaluation/rankeval/perplexity50_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..cf4e0d34412ab2908444058f1cbc7e0130ad0b53 --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.01500870618212173,0 +anli_r2,acc,0.341,0.014998131348402693,0 +anli_r3,acc,0.3258333333333333,0.013535422043417455,0 +arc_challenge,acc,0.3046075085324232,0.01344952210993249,0 +arc_challenge,acc_norm,0.318259385665529,0.013611993916971451,0 +arc_easy,acc,0.6313131313131313,0.009899640855681043,0 +arc_easy,acc_norm,0.6077441077441077,0.010018744689650043,0 +boolq,acc,0.5712538226299694,0.008655800332760227,1 +cb,acc,0.44642857142857145,0.06703189227942398,1 +cb,f1,0.31446540880503143,,1 +copa,acc,0.83,0.037752516806863715,0 +hellaswag,acc,0.46285600477992433,0.004975993795562032,0 +hellaswag,acc_norm,0.6171081457876917,0.004850988215167544,0 +piqa,acc,0.7399347116430903,0.010234893249061303,0 +piqa,acc_norm,0.7426550598476604,0.01019992106479251,0 +rte,acc,0.555956678700361,0.029907396333795987,0 +sciq,acc,0.885,0.010093407594904628,0 +sciq,acc_norm,0.875,0.010463483381956722,0 +storycloze_2016,acc,0.7129877071084981,0.010460934115933265,0 +winogrande,acc,0.5990528808208366,0.013773974554948028,0 diff --git a/perplexity50/evaluation/rankeval/perplexity50_5.json b/perplexity50/evaluation/rankeval/perplexity50_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6ef9c791c42abf8f797c3143afbdb4d8f449e15b --- /dev/null +++ b/perplexity50/evaluation/rankeval/perplexity50_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402693 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417455 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.31446540880503143 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.037752516806863715 + }, + "hellaswag": { + "acc": 0.46285600477992433, + "acc_stderr": 0.004975993795562032, + "acc_norm": 0.6171081457876917, + "acc_norm_stderr": 0.004850988215167544 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795987 + }, + "winogrande": { + "acc": 0.5990528808208366, + "acc_stderr": 0.013773974554948028 + }, + "storycloze_2016": { + "acc": 0.7129877071084981, + "acc_stderr": 0.010460934115933265 + }, + "boolq": { + "acc": 0.5712538226299694, + "acc_stderr": 0.008655800332760227 + }, + "arc_easy": { + "acc": 0.6313131313131313, + "acc_stderr": 0.009899640855681043, + "acc_norm": 0.6077441077441077, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.3046075085324232, + "acc_stderr": 0.01344952210993249, + "acc_norm": 0.318259385665529, + "acc_norm_stderr": 0.013611993916971451 + }, + "sciq": { + "acc": 0.885, + "acc_stderr": 0.010093407594904628, + "acc_norm": 0.875, + "acc_norm_stderr": 0.010463483381956722 + }, + "piqa": { + "acc": 0.7399347116430903, + "acc_stderr": 0.010234893249061303, + "acc_norm": 0.7426550598476604, + "acc_norm_stderr": 0.01019992106479251 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9a66a30f21e9579979e94d8462b8548cdd72093 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa21661aa78a6e13fb555bba62d9059b41afbd9011192d2bb015c608c21a162d +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aec05e05f0ab6ae77f799a36fafcbb289c8acde --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7bbf149071bbf41c2ff91a60149ea43de80751c5792972b99072f1c23d756c9 +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3a79080a4c7f7572c13876808dcc7457f4e0528 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c4c67df43d6a9aa3459b156bef1f8cad32c48879318b138f51417508a1f6a3f +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..659f6f6e9500ea79457421619f2fbf054e89abde --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b231c22a8edcf8ae4cfafb73f7339e3a98ee296ef7884aaab0ee7a4a970b1c5 +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e37f8882e761674e06ae22aa404e813b3ca30c8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8391af8d35d12d2ceecc9d653a531be0a9709cf3621cdebbf8986a07c2d7b3 +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c9457e4c393717a8a762af1cba3effc9bd03844 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a5e88b0bcbdf71f1a244edd485b6afa4ca664f5c8d9691b012bc90c21fa7b58 +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..358282da50e31718a2d5a9f6dbf2cea756294ef9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24b4ae393e2951484dd96340aeeff7d4090f6ed01da9475e6df6b676d54db62 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d177e935e4055930eb9f798153d367c041c6f81 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59998e0942355e12f57d1ad57becd7ebe53a6a324bd307e48134fa294c737785 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6e7044696ad682ee328c9c6f9e26b50cd7e1689 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb4e23197d5666b328bb4640438308e27160e7b889b46f2207c5ab0a0f1e61ed +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11612b33bbd7dec1734e40ed5fb4b44f682c4831 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f468e1045f6efe8b5a5f1e35c2b9f88aab451f94655b65c49d7f76a56fb22d2d +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6b30cc82bef3ac3c7cad58b92cd945d75caf21d --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50e857346759cda74b15ddda65f91a078b68fa53fb0995f39557fe733aa4075 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5284e449de0e81d433d3898460b80f5db8c96384 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f17f9b05463fced4dc129d20636bbab3dbb7e0588ac94c63b1659826c9c22b3d +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..085cdfd06eeb931a8fb840cf0ef9dd0c43ddc6bc --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edeaade011e49e8f50c8557ba7c882ec778219e26fbf061176fb40b63af8d575 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66634295dbea30c2a8c8efaeddc236803e9f7283 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a2d245859f1b4a938d26c068569a0202986e2e836bca782aca255fcc703c03a +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eacf412af29ba2ff8cde0381a3150c887d3619b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b8316588b519aeeb94fb3950c96a1fbf7a757ec95a3ea77d70d81863435ab3 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f25c583af0851ba17321d211951e1b5cc76bf9bc --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154adb8466fa8bd6e982e8e86e984a55bc7c42822f3478c45f7c3560cd1d7932 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24798ccc496913ceea21c631fa9a8c50e827d137 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a26da654e2d5dc7896b30120394d5df8398880f49033db1354645846eae2beb +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82242bb92a8c5119b3c07287ca277f8f8395ea8c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e4a64c057f6a802d6737436e495c5d957489f6e71a8c6174ac8c14c5412a7f +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..354381db75a1eb2146226533e321ce6ace4eff0d --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:017b8d3e6659f2008e77fbd9328a0fc6ebbfa236c3cc4b3eb1c958e85748139e +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2bc62b46d07c32fa2e969e516eb301bf50847fd --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f05033e445105aefe2d50cf98ff160a378c582fd59b183ae36271fe34c760bac +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d85b069591b52fb08702ac1f72ba1422c80747 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f688c00572fc90d245937495f193e74de9471a0a382cf2cc2d51638b9b0d6b7a +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b978eb18fc4c1150cfb524ceeb17d55f20ddfb9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4368aaaa713c3124d9d112b4df8838d53a92de6889c9a5f95e77b7c037593f74 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f704759f2ed27cc58a78860db3ca413d6aac47 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de0f1e8b313e62a75b9067e75e61d08c1856d28fa81194cf7d1ff9ceb2bf171 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d3d40487a6c4b7ffbb2002679c98eeddb71b6b7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0389f05778852f9521671e9f8c4afa1e9e4d01deb511c4f610fae6d75feb08b5 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35b070651903ae8a4903267ec75222a2f3bcf78 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f1b1541877125879a38f86739693a785cc8c97a80ff271ca4261923d77ce605 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a84eb9eda3dcea094563e0d82d9c4e9e79dd9ba9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:764dde6ea974d793235b1385c740edf8039e7eec44e1243989fcd34917942c29 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fef3fd31e9f543b90474224f11c4a5869b571007 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb06e077c7fdf4296d7bf9e3435689719039fbf22189959865080d6cb6ff19c3 +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc2f1be7d11e4873621514b7cd014894cef56643 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bdc947ea0d6fc216657f0dbaadbf14a45bd3699f12bb8582446e3d2dbeec22b +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14ed7cca241e1cd30da53e7996a13dc859e1c388 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51c7e6d47e1dd4bdb9aa965898c761d69dc563dd3d19939d0531fb88ad53408 +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..180483aab1b43b811f6d300991d69432391e19b9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f856167923166cf5382383490bb64cd69ebeefaf735c2c19f9c6b73e85940b +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba86d0e88833c14f27d8d2ba778b8321f55b057 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1237fefff0dfeecb0d74689433c2c36a9a84260e203a764dc2a8a25bc1d9c11c +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06896817ffca4badd93f73ea2ad06b1a1ad1b0b9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7d4a64bc901b662c45f5aeee498ea68da8d3715be59065ff8f2c47150c8b05a +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5a689cbd3f83a6b223ae29b8d31b31d2e520777 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:452525b62408cc47b342a5fa54424bed58e548c8a725c6e3cb2c5d216a185662 +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8193c0c145f5a650d3e0089da148f68c09fdebab --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a359273334af3b572224a850aebcb7cb8d7aa3cbd100707083da7a8c2be3b955 +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8321674042e0216398af61469d1591d01ae119 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca3f98a059e74700f36ba60e080906b12ab3f54eea360a2e56a3379cdf8d85bd +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a2352f817d115285ce8ce3b4345e75b9cc07b3 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8880eb4d6bae230b54e39b9113126d516a57fcb0935d61007df7f438b32dd60d +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db926ca16b5b78321035ced1401c5e1b9e286b24 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59271c7a9447b4dbfb8afbed6c82cd9c855c1f173380745b70fa389ffe6c7685 +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8128a91e37591b55af7baedf513826ef98d95812 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0355d9bf87324593a7e37b425b53ee25d5b544d24285711b7859d04430583bb +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead27018b4c97af36d1c77e18726aac082021225 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:662e446882d0bbb81328f3cdc41c9520bd318bb08ecabd7b115eaf976ea30e0b +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..205afc6548c7a8dbcd1c713c402447337dcc06a1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:516ec3902fa4e934519bcbcf52db4a057a45fea0c3b76ef8b1bb2d0407c38c52 +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..697a3d86b662e91b7843eb272b14a1b3e31b548f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fedbdea23ca9979a0fc35e0f78c1828b607963bd88a4db1590364c68bd21f7b2 +size 131963693 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..813b5feca5a4bd0cbbefd0c32d1bc5b54ddfcd3b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7f85830ee12ecb9e646f15b9e33a0ed85bc4f696f3dd608c98a81eca10b938 +size 131963693 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d043b0201b1b16139151d9639d39de74314b1eab --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35978d68e04ddd388cc3e8b0d2a0575533a28555a4019c2e50551e401b0b23b0 +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65a70083e31a785344b486ed2139647edeede03b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11a7a062400828964b556f0e2945966d21d9b33af87eefcbab078334b750c4fd +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58de71571aa33ba2b6d87ab1f58eb2ca456e4efc --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4981fb59c65f34a8318ef1c9efe04c109c1cc4cba5fa053a5b07489d393b6464 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b2610e7beec088d3090e29a6e1bcb1bce95c3a8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e510066f0fe6a5ff8a280b82ccd2fb0125135e2b60a323fe4b98e67826a6bd +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bba67ab2a21cb03c43d0f4f82ba099e319d33908 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a859c5ac319fbcd31e8a84573e49adb8d2f50f54f9ded99814339a4d4b3c4bbf +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d36cb4997f85ca8fa03425faf0bd03f3b7e8d8bd --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6952bfe25bc9c0084c171287be871e77401cfe44c71abd70caac5938bec0d67e +size 131963565 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48d9afb259bfc2b01f58f0d85438022e33858303 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c89d8bb1ea95b0baf65e7210a41fef30de2c29205c48523fc35d05f914e54447 +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d230ec74f81754e8fff701f7f31a0c3cec1415dd --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da8277b692f740320f20e056630e228ac24427748915cf61b961ff525b37fb0 +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27458f85e0f2969741cbc2cc89d0b4a9eccc5e83 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:193e9755529fab782d5aa8b815fa5031258ffa5fdeffde271dfa19caf4282991 +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..550f38915aab9d4706d226e421d2932c9e038220 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68fe42f57ad0ba8995f154f1359c07b0fb6aee81c8b2355237446857872987e1 +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c67d84b98b69be3ccb9c36d2e97640fc9f095455 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0508a3da44cbf79b4adf4dacd5df776fbe779a1ed5524ebcd128ac1ea278758a +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18e20b8c717c237fc08a18255eda56db89f89a8e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e6cd28756f5ce1d12ae98f87b3f9fa21b4a762269787747f4f06ac7be4b0e53 +size 131963629 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe0844e09338821cec74419175ca878a12b60a31 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0853eec4f1c6a18bcf55105a611e9ccffe089253e7b4e51459c2f7c4b11df4cb +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e98602f67cbb60bc924bc0800855c7277a2015 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb718199f113ac9f5643f3161e2e5a8d0dc5d98decc9f914c17ce00101e3721 +size 131963501 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0ce38ce98f9347543b49529fe11a7b2c1352a3e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f732dcbb7fcd7ac5aabbc2123b2c3b7282358d50d8de040c2e592e3ef0e841 +size 131963693 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8fc08d9f9864955ac5f942b160577e034c3be24 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790cc8b4b6f835eddd385ea9e74bc07a992a3e64b1887332480bb64a81edb0a4 +size 131963693 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a7533dc72b374a37f6087840e73c844b411272f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9416908a75eda13eb9f7d280cb7261bfb5e30d41edc5dfea5ad6a0aa7c841ed +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b34f1d1441543ba5c96fa921c617e1779abf7be --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b723e063409164ba0e1ca69183a1c5004d555ca482cb84fd52df9731fca4f705 +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a878b9790d1fcce43add23b32d1ceca6303242f4 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09ff0404027efcd130f6ee9df5b2b49c6f3dbf57677efcb256cb77d9d56f9c32 +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a06e8411c15feba34ca04ea004affc60b6b3341c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64e7fd4a1887c2b9b36ca034e57eb3174cc0fceed899021ede745896c04599d +size 131963437 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0649b99633ebeb8e071c9788f10fb5e5683f47ac --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62a61e8a42883bf2d8cb70f61b4808884f8facfacceb91f7a42de87c598e90d +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..862fd8df6a11ab2f6a5383cc2c56076bf61efac3 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15a9643cd088ca278f982132e5b39845fb14551faf9888ca977d07941912d2c +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c0640d7703364c7e71b634e2a424fb1c9446718 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9577fc36eb622d87af425efd766cbffc510f93333a9efa79868e531e0559e8b +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cb523a5e70b57cb1390634a80abe85f8f0ad45a --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dca31b94798c7d2daba0e6ba7d6d64c8600208e2a06f7e3a6482455f2fc7410 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bec7dd89ab9347322bbbcf6e3edb5f4355df0d0c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e9f435a50b33f2c789f117c679bc8571e1325210b1d42a819b264d8fc1e5d9c +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daa28d4cd5783ca24bd8c531eb7786ee379c1596 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f762352144b22f22e84c5f2202094b202fbd17e82d98010292b63f4c11a8d415 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a99b4e83f429da730143583603f774e85e6cd1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12fb5576609b22cffdc2b9a0b9f82ee61b47f038c52c2fd09dc5b93548c2104a +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a2057dc3e8a913bb3f4949b6008255ac4c7f8a4 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ede71c20243cf5eeae63559684938e4cef047af9cd60c584f8c0f5d23bf071 +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b94bc8f13baf845de6f2be6309e44f409175ca2 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff6618a890690976a7c0343f8551d497a69cc0520c7bc748b79929872a5c86b +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..440fe9e69a72d7db58d26c243895390a89bbd6ec --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1a7889cc81a33ed15160951089efa44aa12ca6fe74793491f44e900889911b +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7597b74c32324beb3c70490fca06b3e6d20313d --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0752fee313db040a76dc9940dba2bf4464a0d2db73ac87db93c981d925f6faef +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5049bf34ee9e21bd54b65c61d93d36a783792248 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c853a463a8f1bc8e53c5d1ff7199f52fd8458b9a5f7921379d633c588971c303 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9d959df49df9c92cd9523181c1b692884544a8c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c51778eaf97bd366967406088cd9835cff78ae20a48e84cd52b5935415cda8 +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a5f390188176d9739f00d920dbbafe5549b6d3a --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1044328c394442d7829c2821abb30ec60ba683780e2edf93bdf683548cd651e0 +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c4e8d0544cd4c8ab33e28a63a4b7efe7447bc2c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46a8e3c3059a671bc520b437c6dc9dd2dfeeafb27eb39d2ffc1aa23d39f63569 +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a52167d365fc1f93caae6e7a626642f00b4b9bb6 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c06ca8990a969a832c6aee6fdaef25684189cf579a63399f746b943ae27e9aa +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80fb4da141298f7bf00b1b941b5c5008f0bcd4da --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08f0db8986349c009dca542ab44fd57faf398be4e08e4d01baef99c0abe3144 +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef6602a78ece5cc14d92e8d83afed40d96d2486e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa36f3a881c81fa2d3574e62b74e7d89304651d0a26b1a2ab212d9f5ea4528be +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..830cfae450a0048dac658bf3c297a94ee31d32bc --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f55c6dbc4efb0a7090feffb4b2a7f51d72147c45b8923375f4a44abf1fc4be3 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf5da6d2cd74eecb044ee60c56b870a778fc9d2 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:649220b2ea50127ca17bccfe4d0df1255207b8505289331f592c771085e01a7c +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad0a43d6a78ad0e91f2c7caf1a882f51bf57b1f6 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddaf650654cdc2c0e9118d0e5bdb7d9e4eb360e7c9558d85cdc180b31c00df14 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a0f6b5cbcf3c9066d58fe735540ab2dae02f27 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4842bf86e57e8107b51fc68a9589e670d6819f17d4639bc05b4c1cf9b484add2 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e1a8cfa7ea78c5e210e00ec5fd2b76229be27a --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f327946a3123a8a690766e09c6302ca8511cfea41480313da848bac3f495251 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4c5725398a0ce32df61a0a073022687b1fb70e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1390780d8c2327ed45609012f13788d24137679aa282be5b62709cbadacee412 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84c10ea785b08d7bc48812ba91e8c1e752885c44 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67c70abbd4db02efab6169b53da00af6c26da67f88085b0f506db82bf41c8852 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..279bb83451910a79c4169091217da54c183a0d16 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67254bb642acfb838dfc72e911c41494ca89c8c751858e875fb2686ff05d3408 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e103a29505fa41e2e399328c4d9fd837035b75b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5213a203eff4a611c1a909499d658727772a91f5bab4acb5a6e0f3c532cbdb +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aee4d41fe5efefe3d628432221f5c389dd98945c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:081a96e00b16c7c8dd4bd841d66ad29508677502328aa6d72108891d7710dd0f +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..758b04edcdb11bbd8bf13f25fd3463c48e404e38 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b0efe89b810c307cda9346e5b1577ed5285e26e7201c43c26b1c06ab1037583 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c7a4eeff6e6ca8176dcd7ff7216396a59776698 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a146e3d8593143912cfd3e71814255cc770327cfa44513f4371bfdaee533bc5 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfbfac52abb1dd8303c630b6310918a411080f98 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d710564fa35f768ee7b5b4ad95697cf483a461302b974ff3d167055c8a83c33 +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de181f0cf1cf78c6674a97651f6b19b857370571 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90d27242c28a5e65e6dfe5fd3ae8007bc85a8d252b01090ddf433832d53b5063 +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f860a2a7bef6ec45aa552a3c4d7673a028dbcca --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f83e247aaebcde1c30a22fd0838af940587eb7ddfcf12e6984e0c202ba618c7 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..572d8e26f67166e30a94e4125cedec422be784e8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1246c62d034923005a8cb86f795cb23ee36abb8cc6eebf62e14279f79f3cb425 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0c6e9b1fe8f7fa69ab68d088261dbce626aa2a9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8d68f8b90abbfa88fdcb606876b234c5bb0791dcb226973fdbe0348e417abf0 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be13b0d6ecdf7998651291093bd4d58b1805672 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20bf96da905781c2dece00fd6911541f42323a106fa98ac337104e4857fbe776 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a3395d8772f686e35dffdfd2d0d941f86bb76b1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bebb6026010360fd19e02c404463cbd8c229917894257a62c39249d6b5722789 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d474c4d8c0f33821cea64b204da6edaaf4a22f84 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e246956fcd48b1033cfe2c260abc2270258d115023e548bd0052465a4d99203 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4eb117ede3c4d3a0f476ea9cb32aea434313156 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f01f4b38cf2dbadd22237949bc0041c62a5b581645adea0853bf893c7b93d5a +size 131963543 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..424fc0de58401b3c0b4219806fc43c00b2b2f1c1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba2cf062d63a2173e517e4a521d094a3b5229c579c79f332d831a430ee37310 +size 131963543 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..391d59b9c101e7e1f42845722e3624bed1683598 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59ecd9d1fca4c119f8ae3543384ec3cadf4dd5a066d289c319e94bdc8baf1809 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8328ce005a2d1b7618e0f60c7ae7f25711c15639 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:918ca07ce33c7aaf8976cf5c051ea00cb6fac139f58020751d359c43d0877903 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea06bb492af1670c9e9179837260f9864bab1ec8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b340018bcd3b72eea9d34a6febaacbad7fd637710cb6b82054f5958e876f5aca +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fdf42bb3102c1e09f80527d324b3f17ce331fb5 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3551cc2587ff70269d822009a37bb4b253cd265bbdf7470b938302fab84e701 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f474493aae1ee0139758cad953b214cb026bb464 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f07db0dc3f544651bc17bcc170b7472a12f0717b986a4dbf00a14cea6ab898 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..670cb389e3f0e84473839dea33fe4c47916391e8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c89cc41a359e93104008338bb5fa4f901d2d5ccc9aa91a0f5a9599f65c851c66 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..326057fb1426c2a6ec9a1710dcc1012b568c9fe6 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48505bcecf8a4939f1107312f632e6b8efedc3803f39dca3bcbdaa3ab377577a +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..567c7641ae9e3f8179e4a87b818ff3978d2ab8f0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16dd817aeae61a2cfd0a1b32fa20b2ae7ffeadfd0b4bd77fcf0dcacb9098776c +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7954cb840fcc0477397b4762785f12acf5fd736 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1da35f53202e5ecc4860bd398256337fac68f23645d10ce84fa25255f5b2cddf +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..702dd26bc10f50d1214b219c27ecced787ff3c73 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feff72d0be291f2ddd3305d1861b3619e0bd2bf2bba288c7ad365f757b7cbb99 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a65ea1569d864d11e0812f154777a39c2573c0ff --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a134bb563b4cd22f1d330d8912da0770a4f77686005da3f2a03ff5d521ce3c0 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0a007ccc9e1bb6b197765506970b89f61fabdde --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cbda168aceaa4c8b348b003ed4ed19e48ff4419b228da7fcf7a73eb8dd4af56 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1032f213e5fcf51f106eb53d960fc3867d07541 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c21724a2c99d1703b27100c566882d1ae169ac7a6c6e9a04b8ddc97166398a6 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdaa74e3c1f846abe0f190805e97c7029399eab6 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dede9d8a9049d6a08d5abb90d2024f4bdcdb2918a66faef0a61147413d2a1864 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..175ebf172a342f01192066317bb445ce90a391b7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc248836c0896d43cc042f6127500972350705915a197dbd010a9e6e870615b6 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fb20309065e36ac7f7e4c042462822b26043233 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72263af3e25e7f0b01c3d40cc2804337d0b8890f040a9dbf4906fa61c7bcf16c +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1de361b1466def7572150b16b99ba03fedaa0f07 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7aadda69bb528cb2f4d4ee6a94aab87eb7420c447fa409caa90fafcb68558ab +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00c1204eaec73ca0f50fb54732de23ff38045eac --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:318f567765a7c7066429eff0e62028226b86d1b628d27ce2a6f324ff3a95b9a7 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5cb7f72ab43787d6a5630ae296057a118fcfcd --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90febff50930b966197692bddef27ccf4eac7470f64c3a5dd2ea6d785745194b +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c52aa06d9645fd0007429d3b5ab57bacb2b0dc7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734c8517c9866ed87faa2578be41fec640d5e35bec2bc72687b65260c3ca08e6 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43dfab3a9cd556e99b3a93e05ca77ac6f8c5ecd0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3797e4d2ba735b2973b66b1a67a15e5b3c82eec06d33fdaac365c1be2cf5a3b3 +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..628495ea73f1f5ec0cb1bfdeb3ce79ac8d188d6e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ade962a98ae4d41afbf1d14552781165bcaae8ba15fb84624585fafab803dcc +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7888f98556aa1204f539924a1aabeb55edc77438 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc55f776ba521cb4baed1e1a4a30025a8510dbcdf30daab226ede3eca1f85e38 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8485dd106b85faa4d91d2e9ab97b434898d9f36f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe87438dfffb71893e5e2f32db6111d74a9266579ccd75ff42573103c612dfd +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18b7f66eb04381474471ddb50b59637e52b9fea --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32304fb09e9f424dfd235538469ad2b7070e9fa1f36d6a398b00a50d6bfe7b2b +size 131963746 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b2761a2978e21a5ec2641919539d1adefa2956 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6425bc4608c9d2a96380a6fc59d24de5706a9c3b5ab13a87ac3753ac1638f2 +size 131963746 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b64ce939e70afe1e6accbb9780a5368562d8793c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992f8ef6c04811ea07703fb8ca60d172825818aa522a5706af13eb28a3db1dec +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..945166334e098e631aea316da1f24f5cccc52f25 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acfec904a13b3807b068f8d81233150d3ed64054fe252d1b4137852de752d403 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c800555adc24d2b7f5a99de573e0bb1483362749 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edfd316a781811ee89fb64fdfb0e1467a2bdfb6616f44cf1029bfa567a1305ae +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d15e8ac18305849a56e9e33b7890aafd4ff9aa --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10ad11b90fee0def4942e903a8c18969be0ca864bde5eff470244976eebe57b0 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f95fdc116f1efcefcb8a6b3c5e80cefdc23284e0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae41febcc9317d71a1f9ee108ebbbac53170485fd2450c3eaf746b7bdbd1098d +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78cad7c49db29adaa04f55023027f85fc7f78e91 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05ea73374f623f983a63ee476b7525d14f9678e791fba3a68961a35537d13240 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd33bb18fc218a24a2c1b8df786d2090687d524 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:664402430c4388223072d4a3b0857cf628c4ba7a2d85419dfa5c84e843bd914b +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4db123d0d8284ddf989845915fde0e396a54c24 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8222ef22835a2b4c33dc05aa22f1bc125e56d770fd8c2b3b5c2b8bb930a8c163 +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ae5a3e2a924cb6ce1cf47e154ed4174e964dac --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90c8cadf1fba66134ce47f700cd5c3e1cff912cbe32c173cc99a95cccb988f2 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4309450056b0cd32548c0b60a49c9180267f7746 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbc614ab8e4699741a7b063202f466371704351e19d948906066202176b15c17 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82d677dff22296cc5e887a453506864a0591301b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe5bfbe723718109a8f20632d47cff94e09745c869c8cf83ee596372ab0c48a7 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5c22e22575e8a9dd303c6850ca295e1d52e2ff --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a4494f7a81796895b2812bb3377469369b32b630781a5b307306051fc89018 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..828ecaef4913c27959b72f4f15b15338c755bbfe --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7bf8cefa3ff572469c632c76d023befeba3440fe9fa82eeef0803e15c0d2310 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc588466170c58c645df8cad1d488b9285162a0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389f21de5170a75f644989bdfa646311f7c2239c9a199b608f04ddae1b28a7a1 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6c7111849a809dbc0a328db2ca68d6efde53ec8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e77d5404b7265dc92f4afd97d2cd4eadb08daa60c4b0f735e012ace3bccc28 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de48f4959aeac95916b87326cb81eb05cadc5f00 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dcc798352092e27112e458da1d8c01f56ad5ee5af6645c916dc9eb811372cd5 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b511b5a1d4d5fac24e29acb56d99b43775a19bb7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80e86684732f8fcb521d197bffcbe724588d9238d80e7141a14bd6211eb59e10 +size 131963607 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6baba7b907d9328911170cfee97d91f6d7d3946f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833f0e32f94375ea998356d426ec63ccddb4445f152356c4638e97337df8a77b +size 131963607 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..789a97c5277eff74cb4b02683e3b5ad390640b0a --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4800a26b12a81c2bae8c6c7ff4f3366db085a8456d5ccf244cd637635803b1a2 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afc0a7d5bbb382e5a64758e902df837c9d42b344 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153616d73cd2085eca5f01c1f1914a68ee0ffff56ba0598f7c415260855faa4a +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e64fe4931e0e58a97d71f2c26d2b2a55039c96bc --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780ec554cac5ccef880dda2bd064241a7ffe279c0e74972bbc893b13d673bcce +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f39ffb6ddc9174f998a141e470e232174726076b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ba0c4e4db0fd11de30fc7ad5f2ce734d55fc68091115701a69e8be62df03de +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..712e88506036ad7b0ec3c2b9f9aff0efe7946cc0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ad1bce182897bae33c174a8739be90aa008f505eaa109175c980aa3d198ccf +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e03096255fc1dd4d2fdc1f3d44ffc83d9171c3 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c005a57f9d1057225c77f2661a9899b459a5f00a350c5bed082ba24c2d4b54 +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3df7a38b0101fbfab6d966dc58b8402a609d06c1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36267f63841a8f5c9d6fd49a616104d95e257c5ec331bcc049b8d23b91cdc3e6 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfbc61ac28c713623287e22edeeec3c6b7819f3e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d0ec1a824da24f3f6f836bda343ea1580a8560fbb6ad289fe26685d6cd5bb8 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa2b1a8db8976c0a3b409fb4ff4f07d6b18342b7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033b2aa02fe6c233c2704f1b6b8ff57ddc1748f2f3c3f3e48ad51acd05210f17 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83443a8beb2e5f1b0f4c4adeeffc436fb56fb434 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec172d588423b0e7cc6487bc3b1074cc75ba6abe2eedae0159095da4744e9a7 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea1038655fb2861b52b1ccfd39261f0ae018ea4f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d3309ca7b1ed6372224f9a36b47e7ca7f1897b017a942be6e994f2a5ee648b +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a94cef3179b72d425924cd3b59a4b4d1885181ed --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7e40e7e4c0de6ccb40611ec5b3d29e98ea24f099961a53b9c393215a4b6c2e +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df4b07f94ee745fccf25551304a18e15795fbeed --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d935944189bc42da6abb2eef516ac338b3bb6e36cca7663687595eca4214bd0 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a26eb359325839bca181e9662179052ff2434856 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da21d20f12225087fa08f26a8ffd283806319e8c20cdd04fc5ff8362d596d45 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2a6853a5d60a4ba5755856c7992257656fcea9b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ddd9ca24481b92e8a18aa29bb635be3ac9b7008f10281d975ce4b15e8986a4 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbee2a22b14dad890b04f3c755f3a6c13d0c883 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54874dfad49e108e3456c38afa61db3cc6ef173734e5e60dd53d0d12e3c81d82 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8711dd5e8c8b0722bc7209c5b72248ca9e76886e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a14ce7ad38c1bf8c4b6eb86ebbd0721a170b6adf6e0c87ccc4921d01d68f11b6 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2505c10f6a531a427d057b6a786e8135d1318e82 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dce9a6b8f6bbe9f9334aafb57ea8ff04a8e97a0901b9786f6847dedb9b58de +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6a804c93969096fdf5c9f8bc797fa5dddffedf4 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac18a32b4ee50e449580498f00e3cf2f82b3fffb682f2580ec10712b41abd9e +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55285b323d3cb808ad3d88269c7de932bf043c10 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad31bf3d819c5d584552290234030909ef529d6aa95f7232b24812136010d9d +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ec85f80ea6e0ac7216c12474887bfa9c13c5990 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c196c3f3eb2ebd36171ec9bf2c3b5c6017d7421ee594e8321871b9e23cc7c9b +size 131963543 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8383928fb1cf6ecd6238a56a5e20e0410bca142 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de72948506548db5ad06e27e95e9995bacb928126f66e98b11ff6fa0b099556 +size 131963543 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1448321980d5337a60046e1e6e9a59d4a4079a --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3554e04f35f5184dfdee1907db4dbf5650be30e43b6a0770bc5ba67571a2719f +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13f6ba73ed6fe0232dbeb4a982a3b107b690891f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:001bf9e2ac4fb57225f2cd0abe89f7054ad8a1bb2a301ee0b030f0358b2f131f +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dbdb5d4eda173e9feffdd9f447b9ec612230279 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4027480bec369098b37765e844d60cf2fb6dcc7a128c79f21ef9eeb347d0addc +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b5acd9b26d7cf56d85a0c3f12107d414b5a6ad --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968adc778d3b8d334642f75c6e15208567f36316e4bd4b36110c53952443cb22 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be8cc070c120e5874b1c7102895528eaffda8346 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1623e898d4e7b05d506350a2c33024a461e346364b12f91fb514b40ebeb458 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..628e5de9b86bbc0b73c8c065b7f67ef0b3bb5134 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc29991ac0d55a7fe615bd73b973a1bc662f1a6b4cafa4c8962494c9d096726 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75ad8914b96cb045dd1de0535d2229e9cd2e3aa8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7318628dcd3f6d72fc2cfca679b4d0812fe3f95cf3e1a4215dbb84909a7d75c3 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3ddf3d9ca51889fd6d6e774d2b110d91e6c3a2f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c6c4be75e0989da008a3b202f106ed00add76f079e6f8c0986da4f944c342e +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9939e592d185fc0961356ab7c3a5b6581cf6d289 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:397a19653965f00411b03c69689dafa7a8ca897e1454b8dcd6e3193d654c1467 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf0088fa373c7cd537bef7d5f166ad5706484d8b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df65db65277d3016ffbd9af8f5bee9c316663b2a970378579af7c869b3ca55b3 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d371e35687a7d8fa9a0838230f9fb9abf701f18c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe591610b98a6dc4ac2ea074cfe2026e5c523cf9d9d128262d3d8003d8fc519b +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6dc2ba8741b1f6b0f9847c843d0b214844cb9fd --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f593ecde1acecf3d8b3ba6282592d4369325068aa8f97d5ad062aa38c00c83 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2e2afc2df37bfebb9841066873e2486651b0be1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1afee1d7098a585890af3f13dbf4a4b1f3c559781eeccf9159337c2ea89944fa +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e209ef8cb01d9be942e556061e3ed8dc0252bb7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:580e3429f450390e9b2b0d508c2277b4f9911cbdc62a6df8813d2b9bc7b6b840 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f748b3300d0b0ed026c74b7a9d60a3e4f02f1cdf --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d8d8775691c9faa52bb0894130ec83eb7c66379cb40093dfe68c1b56ad3e41 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..289466a3216ea3614c9f46e068e978a35c8b97bb --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff5feb0bd92b9bb37ae1bc9b83a94cef73610f7e642b9732bc497add1c9a52ff +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61cd5b66523c65b65de66f8358bc83f0802c7153 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d87b505677bf6d81275ec9e9594ccbdae00e2bdec34a27d57f534c9b46fae99f +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a42ac40ef462d808a06d25609295675c117e5265 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:318ed8c1a41cad3da32a0b2ad7cf3233f71f147251334b1361a43f74bcf00c78 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a723cebd73996dfa1fd1b15536a6c6fada5483a1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2214958ce9054dbb8af0b80ab9d0dd40f624c98629d5b4f8a32ab5a67c12b95d +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a81101c417b09e958ab81827900549915170abe --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb13a169e09ddd9bbad0c37636adc91d8b62f3ab87fce1c0b44076428c44d1c0 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae32c96eb9bdba933a0de9ae04d2b98ae9d5442a --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cda13c4596ff09f6446a600b99ba2fd6f3ff3d368001e901c36e75b8b1ec544 +size 131963415 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88c3d3bd7386af05b77795e78d0015b02ed61e62 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:841e4e9b695ca1320ebc3b45b43fd98bf1a9bc580a38b14e603e78d36d504055 +size 131963415 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5670c60b956835e7c7629eefd376dfbf149a2c7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c42514261adefb304a410c83cd686cf12531be1a98401b2bfb6a3bc34a455d03 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68f59ceba0f1ec856607a2e84c0e5b26971b7309 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092282bf90ffaa3baf81a2f4c2445d02905e414814ccb427a15b1db414bbd06c +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb49c7664a4801ba2f99ba437e2f31029f69b4ce --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc8b8ca6ce369bfab0815b2512cbba84778526ca595b9e956c40d9ccd86d3ce +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..067dc1f820f89ca22194fec6dc2d656449c99104 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3086e452b2e76046518843b6730ab33d3a2c6565e9b7059cfddc976a978c5371 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b77049030fa9cf126519832b99298458092f521 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01dd87d3d65b02cdca467e99862aadd9786742d6a76ee33940afd8d1cefee1b3 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d143cde9d4dc02a948e8e7d070f759b04cd6620b --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a7efe121c567443c5c4c19332e26dfaf483d85c81d20fe68c6d79f69e59710 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ec86df09355b79ef3c7cee14cdf8d7b6538aa0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d55b8cf4d1539fa211cc6a50f9115e16957d27397cac42e63df2dfc4fe68c39 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b92fdfb5d77ce72b90021d436513c64b9278933 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb15d9c00af6783764045806fbf0ad5e662c12662a804e1799f9d61bfc70a4d +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..127bb68716bc774cae28ae2305a0d580dd782a1c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:838fe88473d71bfa44416899a9ed252394b1f31328f8eb7cf04572ddc87901ce +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67372fdfc63312c11ad120b7dbd6980938c4dff8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015cb8f0d7929afeef31d4448638d15bd7c947205d65ad74096048f5f2d0e169 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99e032b65dec14b9e64482ba7ec8a356caf68a7d --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4d2c34ca1e1124473300b752d047af6015a52d533a448adad916a3695b60ba +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72c97615c1dc89d017795daf574fe520e585ab95 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe8f6a1d9023f130e826e86d39add71bcebad5b24e88a76ade2d11a1fc47bbe +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..966b55098812e09e6297ad25168527c74fa018b3 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f995b1ef66776bc170d0ab1738d2f48f69134a09d7d40a165ff4fa3187d2868d +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c28c74e4f03a641a10c04aaa2f8284528dee8ed9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908952c730ab8319c8e1b1d7bf2afbe1d33cdbb972bd16d61057ec43982d31b6 +size 131963682 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e212a8da11a98f2e85fc722bcd59631d42c336e7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4080698e0783ba7141e5f595b8949b58324667fc8aabf9d46b82bce701360f0e +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a6bd5c5c8ab314d881e0719b2663c61eb1d7c2d --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e6c77c37516fc30cd225595cb9a2e43aeb9f87d535ef9d2f54b3fb32729b983 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff3680891dbabc3b300030fb47056bc0b1d610f2 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423b06465bc878ad96a79e738fe349640afdbbbdd50ea4904a4b9a09c18e8a50 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14efac4cc6feb122a77634ebdd5f0cd406a29ae2 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4fb945778af9560df4b6f7c1ad25bcdc9f2daa21109e5855ff5645a0ec9768b +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae0dbd7514ba921eba4aa13d3307daf3a76ae335 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0839177ed6c6802fb459415252e49c212cc9e5df750e72a41356091394004c33 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5205a66736108d7e78cc0d647f0f41f98c1f9055 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a87302e61dda83b158a74574adfc61b022781a543a6d0b8c0a68a419d36ed6 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1bf79e68dfc6a115534c497f0a811dac5f899e0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb4565fd201426e312683b77e4e3d6c4f51e195f1dcdefa015a65643ccc66d7 +size 131963543 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3f70b33ec32ad0ac3aff88afa52703290ca2ea1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c555175a14f8bf94a840239ab527f301b06856349ee408eabc3f95fe675834 +size 131963543 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b76ec08df861ca2f0b93baaf8663d25a08ab6702 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:563f75ba5a6b387a1cd4b03abd1ad240b3e897445029569b5fe515987b5d8658 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffc94d42e5a72a7ae50a0235a13ad4cd7a0e4bc2 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c5325c116737dec52a37f5581e71f0c304050be221c7642cb5ed786641aaf5 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2a8abdcea24798205d6166dadf439297f2bbfe8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d746a5bc7ef5f2b1f29493461c89685327f7fea2e25081f55017db4ac483cf2 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bfa0d2fd7541d82e4f1605c6686498c37fe0121 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:243ca9c1a060d3fe77b1624ce9e4d85a33e2ac38eba82539b66839c6dd81773b +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bb8f40587e405268ca1a8784a1973332f39354 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0749c51298d99f3426826a65cd1574fbcab5c0490749b03d4e8acb90900545cc +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ce74d4f40cd6fe94b069c9aea6250d3bbead6fa --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:026e8833b7b254064b3fba177ae1926c59226f31f68ecac87d9d12756dc6d7d8 +size 131963426 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40391f1b4499b2818510d521c0151487ad0a2660 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0a1419eb81260a1205aac0d4d477d2744532a0f7e0bc72aeecc93a93e4d087 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..903c23c171b4ffcc4ef56bd81fa19c19ed1cd290 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eefc92734e2169063c0d8e2cdf4ac7b36b2950c36ea6c5d8b4d86792905e383 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..585b4610f6c6d09d4a387a39787e464497baa2c5 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b5196799eb413c605dc41fc4f3c8976618250e76aa8259277b96fb64047049 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..541b5881f050a650533e70d30a253557f280b8e9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b47556d884fc349f65060d00adcf1cdac4b534ffa66b8a7a8a0cc204099b0c +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56b1c2733a8e126e15581dad6d09c4aaf4cf3e00 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1163ef8322a8f50e905436312875f70619b14b5464af80745a94fb2676df25d7 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c8f488d677a700387fa8d79537f1698f47bf077 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81749520af69bdb3898f0fe070340e3c1b22c2458c209989a1453a1830534143 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c23735e3542c81c745e979fa3cf36f9771fb31fb --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ef3d48aae220aa9e6e65e258a784a3b5b6b005f63a4b09f9d2c6c29c101d23 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a43221c77f62fc253f4a7c1845e8fc55b5170ae6 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31df48e10807edc22430ca2a84d4898a46e90d7fadc3d45fea8d4e04ff83f32d +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..364fcda77b97f9a27fbd3e801b4d73b7679d85a7 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8a560c8ae0004c4bc34d3cbb84c02023e580211bf5dbb51f10c7ee9c2c291a2 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7333ec92ae9c1be15e97b4039c06e9395576ec76 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe9f2634b688344488cdd85222d648aae11bc4b44678d577e72289cf8ca8af1 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2276b6f6973b4c1aba6ee8f5933398115e7e933c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:562e1e39cab7644c71de3317e68ff88cec16798be24badfdb06e0ed0437e9c35 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ae5bdfa54d993776ffaf5fa26388a3367cd3410 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c6f157bea65cd011a2cd8013a5a8f3bb36aea379d8780c788de70ff62d47f58 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e4ba0cb55974b2750e31465fc105ff91070a4c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6df503aebb3f3846e98807fe0813d00b7e91c4eb442f3ff00a4cd2da2159e2 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff010e3541c1e8499cb2158cc5359313c37e24e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498ae87a60bb37a80d678434891d6b972bad9f25e0fec89abd126d8cd3e8f4ae +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dd3db24a63a5769f88857fa4c48023fab5ed6e3 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a350bcfcccf41d9faa83918618125376107ec4c7a8bb4641e5c10e6fa8c56ce7 +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eab61042c49110ab217646d0e8dbc958310eb7f9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb0a75f4e929aa4fde2818d4805f29a926dd2280a2a60aed637b7905d681ed7 +size 131963479 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72b17f58e0bdb4db16a02cb4537814a47b38491f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06f5091a02d3ec09476d8b0ce2c20ada5fd43ae93d59435786b3af0c8e5d4569 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6394d2e9bcfcd9f7d8f675c70d8a5901cd4dce9 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50aa4bc2bc6368288aa05df0e12c760265631d4579dc5c97745a44a30fd35417 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..943e3241617cc4fbae4feb5df066de19caaa6dca --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:895aed5081d66e4b77832a75594c30b97330887ec9fdc080a3b7ebebf037946b +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1576081c51964c5044b95e513c7356511090ac3e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e4be91cad907af3e32eef3a422affd1e18abf5564d07e66406848a16e3a7ba +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74150ff37ae7a3ff0131a2a8d29abc4fb8023f35 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b242b7b37d70c9ab8cba33f7fa16dbc5d4e673d5edcafab9464f0d02b323efc8 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..983249d3c207a7737448c7d2eb558e456b6e9379 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44a0e7e1fbe79690eef9bca03b33d54187d2e69f63969b7c0acd17f82e11d6f +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b39d3011d98fd967b641f093c32a0bbe8af8c73c --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b3789e708e699d90e9c92c19d1db0fafe313968022ea6d6bc2930494cca3b20 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da789d4d502ccc2e9f316e7b5e09c659fd961b0e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d4396f6b22c38f9bc6f92b7de9cc2bb857e2a2a5edda8c014535c6cce480349 +size 131963618 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cb61f436d9ef42f67865a0b017902b4ebaf4296 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f7548d20b561b8e09ea4d737b070b786d6b751eaba2fb27bc0daa8b1bb12c51 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d282f260d0310928dca16a4f04bd8046bc067d27 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d61217e3ff1f5f6323b0fca0fb17915cb29bcf1976812f8ec980f2c3076e612 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac75cf8df5fb897d1d66c9f2a5f4fc9b4648b5e8 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bc84888594b7a1b97a84881950d03debf03496bb42c44cb09561569fbb57b5f +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e9d2099787f838a09270289f3ddff3bf7a1d60e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59950ecfd484e53acebd2446eb9783c640278a75b9e53ab29a443a8710534c2 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b805145c88f7ff5d4f569c9e201c568bb70c95e --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2682e3bb91966a3b226a7e0a2b29293171aeb5453987b80a2485014c701774 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de33b4a969c2dc6d54fdf3cab8b90aa1d704328f --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:055fee6bcb672c192f176e5e4316f023aceae2a210b9cc0927de8ba7bdf70360 +size 131963490 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df7e5a341dd5ff0a8f423cf9240cc0c6f8b9870 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6876b8dcd9ec2302113a073034d3eaa13a9e28b01b991e9159a1656ad64b4170 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39aa9b8a84ad2832284a23f2c409d5ae667f4f14 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f634b4dd5f7b6f8624c1749c332ca91e2cfbf68e0ec80eeaf149155b450c749 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da184e35572c9f21b4ada8a6a8fcf47bb79f7e1 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f9e93ff215856f22f0bb717d9cfd579a65497b23d9a8149a28db3de024fe648 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72b372b54be3b87684ab3090371b7306ff17b0f3 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6b6748fe1f81de4dbcba488873b073dbd6288aa5312cd1bed9f1ee8604a9d38 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f12913c93e698997be7595a069fdb08ea2d2ce0 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07e6a8deb886447c45983002b7f08b4b2dc02387b90437182ce2abedc7dff63b +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a107057f399aa495433ad1cae6aedd56d4442e83 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215c88f0c48593245cbb141dba5b4b356a2f86db71631606abf215ef7d2c74e1 +size 131963554 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9344b88c98b47e7b735201b37f5b6a8cb1903c02 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f40aa987d3069514a771cb59ef0fdbf45bfd278d88bc3ae284c186b4c7d601c7 +size 131963543 diff --git a/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82713cbeaa0327a9a3fb042928ccd44c476186e2 --- /dev/null +++ b/perplexity50/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5bd42f2b84ba25052436d54d747bc310d883499bad268dd762720cef6c34e2 +size 131963543 diff --git a/perplexity50/global_step80108/layer_01-model_00-model_states.pt b/perplexity50/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5efb24810df098a668b130e5246e2325f72b49da --- /dev/null +++ b/perplexity50/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c675c1a9ab5955b7728e0a9a3bdaacdca9604cf4867dbefdfdf5a7b838910103 +size 139592963 diff --git a/perplexity50/global_step80108/layer_01-model_01-model_states.pt b/perplexity50/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f47df4c9a8b09bcd04408f7f3e1f241de6329cb7 --- /dev/null +++ b/perplexity50/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf5d227e3b5eef6f6f6536f1ccb73bd349f8c43d3b7a7067c2836623a16e3e70 +size 139592963 diff --git a/perplexity50/global_step80108/layer_03-model_00-model_states.pt b/perplexity50/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fddcf934d5ad24928c511424c4f64f1f1cc06c18 --- /dev/null +++ b/perplexity50/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2daf557ca1afd1007a44ffaa2041eebcd8e4d3a544e1960a489919e0f36b23 +size 78696195 diff --git a/perplexity50/global_step80108/layer_03-model_01-model_states.pt b/perplexity50/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4801d9db7e477c29ce6481392d60f996d23c9ceb --- /dev/null +++ b/perplexity50/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fc977566ef533ec6f6615568a87fcc35897f8a02f8c989cfb09d5cb12841cfa +size 78696195 diff --git a/perplexity50/global_step80108/layer_04-model_00-model_states.pt b/perplexity50/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e5d9bbf6a6c7efeb5768241e09d95b6a6effe4d --- /dev/null +++ b/perplexity50/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d7fccab46df04986d389c2e9df47b7afc624e33c4f7e73f49c989192c47c87 +size 78696195 diff --git a/perplexity50/global_step80108/layer_04-model_01-model_states.pt b/perplexity50/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ed791138b6744250d91b2ea29b0b0fa4eb7df70 --- /dev/null +++ b/perplexity50/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ec005a39f138174e370a427658488a3c03100cbc64890901614ff95212fed0 +size 78696195 diff --git a/perplexity50/global_step80108/layer_05-model_00-model_states.pt b/perplexity50/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6340766f1a7b50c2ce2da0acca37177317438c1c --- /dev/null +++ b/perplexity50/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95804b73c9c96cc106df4134194b1a3b3cd6c2857a900f6c477795842ecc6dac +size 78696195 diff --git a/perplexity50/global_step80108/layer_05-model_01-model_states.pt b/perplexity50/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..925bca71b23d1e2dae1de06c3ee88362a00c881d --- /dev/null +++ b/perplexity50/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfea46b2a9d72aa207ec0aaa3bf06f6e819fb2d69f6e0fa904e6cda608a0a23e +size 78696195 diff --git a/perplexity50/global_step80108/layer_06-model_00-model_states.pt b/perplexity50/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eddcb31515dfda801329982ba267582745ea56e --- /dev/null +++ b/perplexity50/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56ae5d9c9115beb47486ef54a5c7783099c6b9c2374d522d22759faa451aa942 +size 78696195 diff --git a/perplexity50/global_step80108/layer_06-model_01-model_states.pt b/perplexity50/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31f83dda13fe1ffee3b5222033b1f5f0050beec3 --- /dev/null +++ b/perplexity50/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca430e9b51d4c3a9f4430db3194fd97a1a515b7c2fa5fad04731d5e925634af +size 78696195 diff --git a/perplexity50/global_step80108/layer_07-model_00-model_states.pt b/perplexity50/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e7cfb95f22d973d0a48ba785380be74e6ed87d7 --- /dev/null +++ b/perplexity50/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b467b904019626dc1221ef0b4e097f673601e6cdf39f307c8fbd73a83244ab88 +size 78696195 diff --git a/perplexity50/global_step80108/layer_07-model_01-model_states.pt b/perplexity50/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1fa78dc4f9d0a7e0ce642d503632f01f672bee3 --- /dev/null +++ b/perplexity50/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3180aedfcbaabde8ae01d9111cd6d0613e52dac176eec49562ebb3f83e359bf6 +size 78696195 diff --git a/perplexity50/global_step80108/layer_08-model_00-model_states.pt b/perplexity50/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92e640da5728836b98a2025cbf13d9f0cd08734d --- /dev/null +++ b/perplexity50/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58d7d05bc74b1964f1d926dd4630052d1d3fe17aff1e101f37389e7171fbe23 +size 78696195 diff --git a/perplexity50/global_step80108/layer_08-model_01-model_states.pt b/perplexity50/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..806e09e4147e51b0367f926a1c85232dbdd3ba5e --- /dev/null +++ b/perplexity50/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b5c948b045ed3537061ade25ce9f0b24211945f5c690de439fd50df21610ec +size 78696195 diff --git a/perplexity50/global_step80108/layer_09-model_00-model_states.pt b/perplexity50/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b1b2945199b45f2ec19eee74942bf23c0fa8bbd --- /dev/null +++ b/perplexity50/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2564647e320f5565008ff1d95052b70dc2b372a7908c8fc71f536047de86f15 +size 78696195 diff --git a/perplexity50/global_step80108/layer_09-model_01-model_states.pt b/perplexity50/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..303efe5c7f194d5fe345076005a2af34cc05ec99 --- /dev/null +++ b/perplexity50/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b82ff396ef577c2404b8aec77a5ce8c963fac41af744a3225c2acb2e8b5f50b +size 78696195 diff --git a/perplexity50/global_step80108/layer_10-model_00-model_states.pt b/perplexity50/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a16d397bf02fa0fbc6726703e38ffe1c2a10fc43 --- /dev/null +++ b/perplexity50/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57989539ed33a3d5036a5a0b41524192a5f81b7eac38aeb7d66b7a58988ac526 +size 78696195 diff --git a/perplexity50/global_step80108/layer_10-model_01-model_states.pt b/perplexity50/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a29c0ce01ced893a30c58115b787875b94888af0 --- /dev/null +++ b/perplexity50/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d984a2f95df7844dde90f411ba7ceac1a26ca53d79b9e30a4292c2adac70f2f2 +size 78696195 diff --git a/perplexity50/global_step80108/layer_11-model_00-model_states.pt b/perplexity50/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d09bdf19e012783c82118fa4afbad8f8c9f21ffa --- /dev/null +++ b/perplexity50/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f90c87d4305bd3c6f6eea4cf413c8b5180207145a76c478e6daa12f5bace37 +size 78696195 diff --git a/perplexity50/global_step80108/layer_11-model_01-model_states.pt b/perplexity50/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38171b70178261043c0dd440a566bd604c249d03 --- /dev/null +++ b/perplexity50/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00906b2d0eeb351684bafd19f46d7ef1515421479b742bf26efacec500cbae9c +size 78696195 diff --git a/perplexity50/global_step80108/layer_12-model_00-model_states.pt b/perplexity50/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d507d052fe5f133f93a127f4ba38cf13dc771a --- /dev/null +++ b/perplexity50/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcea5433860fd860c3b4f453dd23c803468f499e02f4c19bb910d1d8f26d50eb +size 78696195 diff --git a/perplexity50/global_step80108/layer_12-model_01-model_states.pt b/perplexity50/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a0447f2685421f042898a987c080fe7a9546435 --- /dev/null +++ b/perplexity50/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a50dd9fabedcde5b5b6f83025c790c0d4adc974fb97e84c784c8e6b19b47a03 +size 78696195 diff --git a/perplexity50/global_step80108/layer_13-model_00-model_states.pt b/perplexity50/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea9b218ffdf3b3c71098f6ce5581656f4fdf7f49 --- /dev/null +++ b/perplexity50/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632de0e774c3d959fcc4c45d58ea1caad3b0784d363328752e977fc93d2a7370 +size 78696195 diff --git a/perplexity50/global_step80108/layer_13-model_01-model_states.pt b/perplexity50/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..150a1532fda6f4809871c91561759d169c752ed3 --- /dev/null +++ b/perplexity50/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26448c74a677d710ad9058bbd72885d3a452b4e993339a0f722f3053d30ac7bd +size 78696195 diff --git a/perplexity50/global_step80108/layer_14-model_00-model_states.pt b/perplexity50/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c66e7d3c429df917f2f7c44db056fb21409190db --- /dev/null +++ b/perplexity50/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:877cbf59155b0f97762fbcac6b13d71df0c6d0b986f8f67d00b6ba615785dd3b +size 78696195 diff --git a/perplexity50/global_step80108/layer_14-model_01-model_states.pt b/perplexity50/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e604925b1bb4e86d6434a4392b7f4d8b49514c54 --- /dev/null +++ b/perplexity50/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a61444dd2a76c47ba9f7526b9a5c38d58a5c67b04d1533486c54b702019175 +size 78696195 diff --git a/perplexity50/global_step80108/layer_15-model_00-model_states.pt b/perplexity50/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a4f88a6690f1b34b598e6f720b93e5af1818519 --- /dev/null +++ b/perplexity50/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1efb1cb83bd4e73bcc1984da0d35a09efcd1df259b3b806e1abad09b17cbe50 +size 78696195 diff --git a/perplexity50/global_step80108/layer_15-model_01-model_states.pt b/perplexity50/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b199b62f92f0f3cf0a8e93f871a7e806b2ffdf51 --- /dev/null +++ b/perplexity50/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a476dcc1e562dbf483d672a9b098eb01ce63289c6b1dcbbc9903ffd2ad0ebcef +size 78696195 diff --git a/perplexity50/global_step80108/layer_16-model_00-model_states.pt b/perplexity50/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6f25dce80a227aa096b82f70f699e08b17ddb0 --- /dev/null +++ b/perplexity50/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d29d72607de91421d6b30894fbb9522e872d245fd87ca0d3f1a434efc8a9fee1 +size 78696195 diff --git a/perplexity50/global_step80108/layer_16-model_01-model_states.pt b/perplexity50/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7101628e995e17f73ac74ddcdcb166629bbabb9b --- /dev/null +++ b/perplexity50/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80aa9e3d0f4cd2fa36cd1a25be979f6eb3a9375611267bbb6fccdb4ca461bfbc +size 78696195 diff --git a/perplexity50/global_step80108/layer_17-model_00-model_states.pt b/perplexity50/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4afdce43524c83a8d9c5f1fcdbf78d7041fefdb --- /dev/null +++ b/perplexity50/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7cec4fa15978cbdb87acaae433e80fa25cbd834607b34c003874f6e34df210 +size 78696195 diff --git a/perplexity50/global_step80108/layer_17-model_01-model_states.pt b/perplexity50/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccd2e374037a98b3e5182bb93c1707941347b6f3 --- /dev/null +++ b/perplexity50/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:336d2da5c26059d67d5f2b162c514f50a17838ea55978ab204c43dbb08b75afe +size 78696195 diff --git a/perplexity50/global_step80108/layer_18-model_00-model_states.pt b/perplexity50/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b4967a341fec3fff5c149dbe48197353593a474 --- /dev/null +++ b/perplexity50/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb9ce08b73152af34ef4291212858d7e7c3e6238f28e53c438f2b1a7dc58616c +size 78696195 diff --git a/perplexity50/global_step80108/layer_18-model_01-model_states.pt b/perplexity50/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d54cc960191c51fd733f608e2da6e70432123760 --- /dev/null +++ b/perplexity50/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164b9b6b4bfe69e6a28686c94df7ef49d5c29974055d3b35861346ba2c76e303 +size 78696195 diff --git a/perplexity50/global_step80108/layer_19-model_00-model_states.pt b/perplexity50/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1d08998e765af6d75dda2d36d418b82a4540c8b --- /dev/null +++ b/perplexity50/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b87c5865d2f750408e0a54bc6d9dfaf84ce192c34a3eaeb725b97a5bb571fd1e +size 78696195 diff --git a/perplexity50/global_step80108/layer_19-model_01-model_states.pt b/perplexity50/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7d1e1277defef97c8068008c5b5bbad49bf912d --- /dev/null +++ b/perplexity50/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:761203f08e01a99573a733759932028d8dc1e2ef2407fc15d969a8cb1b23a4dc +size 78696195 diff --git a/perplexity50/global_step80108/layer_20-model_00-model_states.pt b/perplexity50/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa83d63b8bb9f33c5c096b7b16ce910b93dc1864 --- /dev/null +++ b/perplexity50/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7457f7f5e4cc34e50b66666c5b3e2647e5ccabfd738f6b92103f3796ae287061 +size 78696195 diff --git a/perplexity50/global_step80108/layer_20-model_01-model_states.pt b/perplexity50/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8c1e94a0e0d87946f8e82e338f10ac2b763ce64 --- /dev/null +++ b/perplexity50/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00338cb0f15ec8e75f59f2b1b13d04ed80f74f00035963fa9ffc314468bf168d +size 78696195 diff --git a/perplexity50/global_step80108/layer_21-model_00-model_states.pt b/perplexity50/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e908a14cb21a85b76b8cf6e7f6eef19553fab1f --- /dev/null +++ b/perplexity50/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da1b6c43cbdef250e7fb006ab31e48a76b9ce2dafabffeb7cd3384dd216a16e2 +size 78696195 diff --git a/perplexity50/global_step80108/layer_21-model_01-model_states.pt b/perplexity50/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af7b481f176b969b4a8512ab56cf841f3b6dce41 --- /dev/null +++ b/perplexity50/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e5ec1cb48ea99b7f614c6378a71905609eda2ca183f601c51522e4c79055668 +size 78696195 diff --git a/perplexity50/global_step80108/layer_22-model_00-model_states.pt b/perplexity50/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c715df80d71dd53f1564363b576893340e32bd17 --- /dev/null +++ b/perplexity50/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c090028d6434bf6dc3e4467099e439e5a6266e6b66e3a4c544ce9c9535990caf +size 78696195 diff --git a/perplexity50/global_step80108/layer_22-model_01-model_states.pt b/perplexity50/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef664e58b2f8a1e589a7159d04b28e1b68524669 --- /dev/null +++ b/perplexity50/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b70c76e278a69d7251f56a4814b9f3e53d1b944d32d8c6732118fc4bbf1343a +size 78696195 diff --git a/perplexity50/global_step80108/layer_23-model_00-model_states.pt b/perplexity50/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57714145de90c2901d1ae4715881b3e4c10ac6c1 --- /dev/null +++ b/perplexity50/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70aac4dd917d698b06f99e9acd12f7251ab137f8f24e1d5449a91830ec27f991 +size 78696195 diff --git a/perplexity50/global_step80108/layer_23-model_01-model_states.pt b/perplexity50/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..120b35285807b2287e488c4bdeefb5a0bd4b9146 --- /dev/null +++ b/perplexity50/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9358f0077b96dad44ca8de80fd65c6b3e50511208600f10130f3b0096c911d9 +size 78696195 diff --git a/perplexity50/global_step80108/layer_24-model_00-model_states.pt b/perplexity50/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e968ce316eb91fff0ec51d241ef1bc62676ed4a --- /dev/null +++ b/perplexity50/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f11e0c12c96cfa1787f74575c8c050836700f1e1e7ada4bd121da01030459e +size 78696195 diff --git a/perplexity50/global_step80108/layer_24-model_01-model_states.pt b/perplexity50/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de87988478a96eee1ff77cd683ac8c4c594cdc33 --- /dev/null +++ b/perplexity50/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4ab0ac753f6d0956b6d134bdf07b3ddba926eb690e05f6dc2be0631f882d91 +size 78696195 diff --git a/perplexity50/global_step80108/layer_25-model_00-model_states.pt b/perplexity50/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..534a39a84cbb37ed805d09b276c6e8b92068c61d --- /dev/null +++ b/perplexity50/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8837dda5a0119cd44bb85181260864d7359cac02897bcaad4e16bb821496c07b +size 78696195 diff --git a/perplexity50/global_step80108/layer_25-model_01-model_states.pt b/perplexity50/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21282fa27e2e992b35a55245e0040fc1c7f694c2 --- /dev/null +++ b/perplexity50/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468ecd163b2df8670b8070ff579d4f1eca2cf7de32ed00fedbb8e3d4dcd08cb5 +size 78696195 diff --git a/perplexity50/global_step80108/layer_26-model_00-model_states.pt b/perplexity50/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1947bed5378e6f1f6bfa6397d7a026705f021f4a --- /dev/null +++ b/perplexity50/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e711969da3855f7f23dce76a09aa95115416f6cc209ac27f5ee31dab6021aa41 +size 78696195 diff --git a/perplexity50/global_step80108/layer_26-model_01-model_states.pt b/perplexity50/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1290a9c63a7390d9c666f65c438f80e60ea5dd81 --- /dev/null +++ b/perplexity50/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11689374061c802e48594c801354d36ab614fe80d3f50103498af8cb2d7c9c73 +size 78696195 diff --git a/perplexity50/global_step80108/layer_27-model_00-model_states.pt b/perplexity50/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b84e098f7f7480e89ba0154aa293a0da8a20ada3 --- /dev/null +++ b/perplexity50/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582bb6f19fb90746dea32c3abb07c3503cd8517ae60022e0127f6a4919600cce +size 78696195 diff --git a/perplexity50/global_step80108/layer_27-model_01-model_states.pt b/perplexity50/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..091ab92352fbebaf1cdc3d38a2541ee38447659d --- /dev/null +++ b/perplexity50/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72de2fc715c59a1e02858e59cc1d8308d34ff33dc1b63f8fac8e3a743b991f2a +size 78696195 diff --git a/perplexity50/global_step80108/layer_28-model_00-model_states.pt b/perplexity50/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e3852ef7c06aaa8baf872362c3db7697dc6474 --- /dev/null +++ b/perplexity50/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed8573a9d12d9b2e2cb4e85e563a0c1c43716d50d4a3b01cc282afcbc5a4f1c +size 78696195 diff --git a/perplexity50/global_step80108/layer_28-model_01-model_states.pt b/perplexity50/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c76b23891cd1d064060c570e9f8afb7e52c6a921 --- /dev/null +++ b/perplexity50/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d628abe8afd096c5dc84c04747a4468a4304e34c05c09e7f88203ed5c78b080 +size 78696195 diff --git a/perplexity50/global_step80108/layer_29-model_00-model_states.pt b/perplexity50/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eac4a4435025c270ffafd7aced03567a3f14955 --- /dev/null +++ b/perplexity50/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:340e8169dd90602dce8bbf9c25a37370d228ce7bde7318a012df2f061660655e +size 78696195 diff --git a/perplexity50/global_step80108/layer_29-model_01-model_states.pt b/perplexity50/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8524aae1db342f3f5343e4d305e367d540d534 --- /dev/null +++ b/perplexity50/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:372f6db3853221e3d5ad4be9fc9ac036d14699b5488548fd7e7849335ddabd3d +size 78696195 diff --git a/perplexity50/global_step80108/layer_30-model_00-model_states.pt b/perplexity50/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27ba24702992904714dad3c27a8bafff7bf6669c --- /dev/null +++ b/perplexity50/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe294559e4a6bf9a18311a4a32f707906939731539572a1bf5a587d5cafcf12 +size 78696195 diff --git a/perplexity50/global_step80108/layer_30-model_01-model_states.pt b/perplexity50/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4c62cff6bf178948f9f6b8674381d1ea80ab42 --- /dev/null +++ b/perplexity50/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d7be583d07debc5cdea29c1bd36c438cb58001c829d79255c4138e1132c6dc2 +size 78696195 diff --git a/perplexity50/global_step80108/layer_31-model_00-model_states.pt b/perplexity50/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db8a15041dde84deeed2026a5efc139567e9446a --- /dev/null +++ b/perplexity50/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb6c6b89117d06652cf9c523b3920faffa3bccfe59bbbfc64d7c5cd3db0ebdc6 +size 78696195 diff --git a/perplexity50/global_step80108/layer_31-model_01-model_states.pt b/perplexity50/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3197e18a93f20fcc173c44b1a2fdc442d6a4301d --- /dev/null +++ b/perplexity50/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74da9dec760d6d0b6cc7101afae3c40d89293382a43871ce9d8a25e828167567 +size 78696195 diff --git a/perplexity50/global_step80108/layer_32-model_00-model_states.pt b/perplexity50/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c05d95f12319a1f5f21dcd95cba639ffce163a38 --- /dev/null +++ b/perplexity50/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc0d2607b87fcd2a8e1b4b00704939209449b41647ac25dacd3ea51b0939ccf +size 78696195 diff --git a/perplexity50/global_step80108/layer_32-model_01-model_states.pt b/perplexity50/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58da72348b04579bf0ad2880459e6dd8eece661a --- /dev/null +++ b/perplexity50/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854c294ecb50e7d530c5f2f8ac1f939f05c662319a7cdcaf019d017b61d94c6d +size 78696195 diff --git a/perplexity50/global_step80108/layer_33-model_00-model_states.pt b/perplexity50/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fa204292e1f8914da0b3b1642dae14103c5b5e7 --- /dev/null +++ b/perplexity50/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0d9fcf1a12c013c88acaeb6b8e890eed1383fafcded1b4133f2b7abbafef6a +size 78696195 diff --git a/perplexity50/global_step80108/layer_33-model_01-model_states.pt b/perplexity50/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa6eecfc3dbece4c65086e47f386b046136fd250 --- /dev/null +++ b/perplexity50/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73d5561f3323143cbc42c6dcc65237d88be1f135d7e664ff5442697735232a82 +size 78696195 diff --git a/perplexity50/global_step80108/layer_34-model_00-model_states.pt b/perplexity50/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a98e1bf739660e8535321a1bd2d50719d1cd9c8 --- /dev/null +++ b/perplexity50/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423a0f619c5b486590a1dcd6d003e274cc10378e8dd06b6881fadf4ac52e0f77 +size 78696195 diff --git a/perplexity50/global_step80108/layer_34-model_01-model_states.pt b/perplexity50/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9cac84301c36deae9a0f3fd4a1d4a87fe8da56c --- /dev/null +++ b/perplexity50/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bf6006b232673f130197c7b22bf8db13e622d88b9c7becc37bec78747fccd98 +size 78696195 diff --git a/perplexity50/global_step80108/layer_35-model_00-model_states.pt b/perplexity50/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d357d7e8dcf8555b6b411e6df208c44d8eae3878 --- /dev/null +++ b/perplexity50/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecfc48e446f6cb6ce8610428f73e82a4693c879df5a0ff7b4149afa632f507e +size 78696195 diff --git a/perplexity50/global_step80108/layer_35-model_01-model_states.pt b/perplexity50/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4364fc3679c6f0519199ef049371cc539cdf1a6 --- /dev/null +++ b/perplexity50/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6327d94128f79230807320d3f7e7736886beceb40f175e8ad54d7f7075610f41 +size 78696195 diff --git a/perplexity50/global_step80108/layer_36-model_00-model_states.pt b/perplexity50/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53b40c88163fb52c83d03b526a81b862d20ba4ab --- /dev/null +++ b/perplexity50/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a5deeff33df9f457c7f0ad167f5ed13ef68965955f58f409aae247052eb05c +size 78696195 diff --git a/perplexity50/global_step80108/layer_36-model_01-model_states.pt b/perplexity50/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd881d83111849761655c31fe6caf612ffa9691e --- /dev/null +++ b/perplexity50/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45866c61acd8092eb5083d17c1cd6e209c2369633825ff0ff34b8e1a670e902 +size 78696195 diff --git a/perplexity50/global_step80108/layer_38-model_00-model_states.pt b/perplexity50/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dadc9221fb0e8a0db9ed8ad1f4bc51f037ab5a4b --- /dev/null +++ b/perplexity50/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb414222015430688af417aaaf424dbda9dd4151d44d4536ccda2d20cdbaad4 +size 11459 diff --git a/perplexity50/global_step80108/layer_38-model_01-model_states.pt b/perplexity50/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f20d5f46495a336eafc2a37ef337e23b83f65ca --- /dev/null +++ b/perplexity50/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1cbc1cc6be9fefa1e10791319dba3a1f79ec72d72f1c2cf7e4873f7f13a3a66 +size 11459 diff --git a/perplexity50/global_step80108/mp_rank_00_model_states.pt b/perplexity50/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d7ab7e76f9f0c848e7ead60a67a6de4446ab74 --- /dev/null +++ b/perplexity50/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2baf6d113c70244394479e7489091d85443249fd56ef968487c2f1515008291 +size 49971 diff --git a/perplexity50/global_step80108/mp_rank_01_model_states.pt b/perplexity50/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..958b27432d4f1212726e06b1dd8e782911cf30a2 --- /dev/null +++ b/perplexity50/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2973374c5f20cda6fdf8e539bf799dea9fe745edebc28d904a04caefb5065292 +size 49971 diff --git a/perplexity50/transformers/config.json b/perplexity50/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c8d973cca6c303d39373fc10106af26358b0ef51 --- /dev/null +++ b/perplexity50/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 2560, "n_layer": 34, "n_head": 20, "n_inner": 10240, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/perplexity50/transformers/pytorch_model.bin b/perplexity50/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..296a30e3c9887b1dcecfc072d7f7a2499c47279d --- /dev/null +++ b/perplexity50/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6533883b93203bac514bf26ba623fc312ffe3d67134ab4aabbf4c74d69e9dc1 +size 5904072781