diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..04d34249d603485b77e7e7dc676228d79d39f4c2 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,27 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..159bc6b6a5a532cd3e7b39365aae435eb095118a --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.39867475560543253, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.040710617580952874}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07159145875770288, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002283808001727691}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.33011129846709864, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005549061845378151}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10122826174069728, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002030855444856264}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.031026301819685173, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014049201598679499}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.141245281048318, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003480506067615889}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04403608291299997, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012192330846573284}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06766144263497025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002200382676285986}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3140572523976384, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005291909825302324}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09551945698986261, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018848555816109573}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06725304160135988, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022287248715200532}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.30648495757927524, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0051352153658538804}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09445387353772787, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019087634807937826}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..29ec13fb67e68ab423f09d7df4ec3651144a8cdf --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5977516671543485, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03455978435410294}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.15329732392184445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004761968102469258}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.33370364652423734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005246547259909354}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1711963022842594, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0038816812182382796}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.07679311519695951, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0031236928525937855}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.16882814193332238, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003640171016562461}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0857526213458049, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002597828881141045}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.13595872134603265, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00415929123413415}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3095423761616577, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004810670635852979}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1534319102614937, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0033050845225794535}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.13980848021437933, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004295380685702628}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.31383788958058917, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00486300699089206}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1570680694188298, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003409305514835227}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..35a60ff438a6528fe1fc9d0d5f342a7da722830e --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8503915955853156, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05968548918805337}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1917742263420682, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005385679944541483}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3738096503830145, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005103325336420911}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2091458628301747, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004368376241819497}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10356295618475722, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003683856363979968}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19885995393306385, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003903858113021774}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11135315365861329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003118659844197972}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16851904595769937, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004611458862978508}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34493506529791307, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004681893250444328}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18644863944216591, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003718060906678577}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.17381481236849558, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004812357218174625}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.34931922765393125, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004727442594540538}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.19076821047822043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0038409906523227373}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..91f437063ec87ccd382d7a8c513f728345011398 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.0608115765539845, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05486212986821941}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.2109031935726629, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005657574041201383}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38579341297680214, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005263285665966895}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.22576763475110825, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004567332560152851}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.11718228855429308, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0039778102828192516}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20867650284917746, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004090722696838276}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.1222000218776608, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0032692358141888987}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.18502061308156897, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00494101709613097}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3541127463117956, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0048313529786746376}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.19994721976859944, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003893228020122849}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.19117483049363265, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005112752281414307}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35990671696452886, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004900147798514321}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.2055386770672947, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004032516312771944}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..31f5238d0d899e7a1021ce9770a41563f4bfeb6c --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.158092237390548, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07452530667512201}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.2295067379234449, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0059287703100318265}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40298988844952865, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00497792321884406}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2406471321436084, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004596728562288805}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.12859268415342448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004204050255493124}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21890193742839065, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003990051975819316}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.13098409219865875, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003365830035361665}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.19954826063286818, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005140545573172722}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36706220250566124, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004574558237043198}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.21211741223916908, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003973821558556186}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.20786819450493935, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005347471613133442}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.37558574187088717, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0046496158518284265}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.21938170732231038, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0041053949186676784}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..442f249057cf78f4f1d4e8b66c0439fbd5412999 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.3912791138065583, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07547788285778162}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.24790045979902117, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.006118840902841762}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4151553294689575, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005017236192009034}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.25846836171966886, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004870562806193873}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.14286641755431828, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004399109330777923}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2303936349020371, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004075946874373824}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.1440780447118915, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003537122239634605}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.21538085312440458, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00527177793605653}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3783352287326247, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004644197217937787}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.22741941196495352, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.004181213734611599}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.22513353909188877, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005531377737909901}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3875077488648253, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047015995940884545}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.23598364900790592, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0043592478927788475}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..08a3f668d5c1c84c32b9c821437cd45b2785a962 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.0983375818863275, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029053806058016835}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.12947888309750052, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0031473479280467198}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.09571267819389127, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022899105765691293}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.019660602529021045, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009095314106449951}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.02987435711226961, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012172920898615256}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.021249378039416924, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008023915053086402}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.07993490033371602, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025495157441145547}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.10403034397768768, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002524536215776094}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.07569979604312303, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017489838355855545}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.09140255938348718, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0027879956998521685}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.11935909833374875, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002924586364247349}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.08804228557786513, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021147247236710737}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.3716396460310256, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.053237921475075736}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2cab56134801c9bfece443fe6986e2d40e82110d --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2744539537425681, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004094328235431946}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20170838774611544, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002762665652290496}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.19520859102820864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023238276963889674}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.07934207376791574, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002463348090483984}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05161000248015028, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001498911556068985}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05109974611655904, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013693724913750134}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.21534515919762, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0033577432477576922}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.15642273279178595, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021832373243515003}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15103480090963925, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018026481462705155}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.25936704726034565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003901950893364067}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19051893854427063, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002613048263614744}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18411759086730042, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021842348386272325}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.1039054275536215, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10890100851738928}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2c50899b5a9189c14a61839d1d9d20d0998f8c00 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.3460381570015358, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004003344331842124}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23464288041344536, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027534125642066803}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.24085996898585788, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002327696120886891}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.11151199462195266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026567771627046344}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06934611067556229, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001590260268305198}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.07281302072231448, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015331223512556303}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.2720546258349463, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003358764729317707}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18272653217328982, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002227548532418399}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.18727237241373534, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001864663335169569}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.3279410319312666, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003860840910318087}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22156477723365048, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002619713558025792}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.22759593452074767, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022262933288697143}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 4.021085183806486, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10816463413951247}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7ee3c43af2a48f37dc12d06e192324af374b2dcd --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.29806862880783386, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004379212298416797}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.19523732178409814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030541305702034035}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2013812252122371, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026442870837295527}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0944687677366076, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002549028495799297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05859589734154174, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015957713051932727}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.060392462467898575, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014617335431351905}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.23529644412419154, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0035766830650948893}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.15306469354602847, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024463484798115413}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1575651913948673, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020868868630608897}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.28262725801972627, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004215517896622171}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.18413938272093217, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029006585330709185}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1901383608530664, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025143987155999636}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.8492374969628904, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08750896589246163}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..3b91c147b22fb6c6b056c07d24b1fd43f5d39592 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.09744191367423756, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0036149483966249}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.06351396221418004, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024571906285560316}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.06426126220521501, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022879021970431588}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030295987904196204, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017243942607559877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.018491602504902276, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001060705507474276}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.018863111807267564, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009913845983569886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.07836036552522192, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029649730324953685}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.050259543495048555, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019585266496901644}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.05089928957613344, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018155956397895659}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.09237908655494775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034638908963912757}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.05946970338742905, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002300251520662075}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.060406863253473476, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002154837434813025}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.04222973749038275, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.008257164616079426}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..2680f4b327777794e25543742033e60e5a8b6aa3 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.015305807829806464, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016276583452807518}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.009349321645652907, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0010109706029017072}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.00953238699480448, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009587457771524576}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.004958444950717817, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00078608095281603}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0026826988588868894, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0003968858121931347}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0028143315500782783, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00039639159831938314}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.01243346272156789, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013729751550239605}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.0073466093897751935, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0007905623261997666}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007529872183034152, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0007598887929454067}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.014878898488927081, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015914308498318637}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.008983079259713787, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0009667267066960596}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.009188390133961012, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0009205800070516369}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.846919172678707e-16, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.0413111014482104e-15}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..cda6ca0bb2e1e5cac73bffb50238dd539d2a16c1 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 8.198586697938474, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.054371247913430655}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4231953254379122, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0056811184198751995}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41981351300313063, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004043734085642848}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3022704849875045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020893712232562985}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3051389569292783, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.006594915459228414}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20265608384266906, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002503934686098032}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14423544971256652, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014159696060948752}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3836380762491933, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005946261746966947}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3484722408438825, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033554610252052412}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2534973577384106, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001628749077015259}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3962431609974829, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005875394355670361}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3703437525515446, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003620950376631745}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.26893260867745544, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018533435510961985}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..895b7de48fedc735d44d0cbe4f355b8367652cd6 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.954988812929066, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14638391482320653}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5311859863746525, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031772485874862837}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43624994053743726, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030327438873743837}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4537564177673297, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023632144199618754}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24897172805854162, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002559248595927766}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20337318700614485, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022235996604563096}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21085921681195505, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020229136192088815}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.38733665631563075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002821853296737016}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.315877576992612, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024697936355976423}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.32899874690483255, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002049880594632269}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4347157576529157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030856903887374197}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35598940596786033, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002795354387124902}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.37054424699208366, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002335750021395727}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ca09eb239cb059b9cea781f0f0f5b7dbc25d55d6 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.73609934719948, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1706582991235465}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5680092384554517, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031495723548982087}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4759328537809361, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029386091005988964}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.49441630977548484, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022862001339864647}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.28544083962132866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026946059983280406}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23719216451336508, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023245662185703573}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24603831528858075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021292376417195715}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.42134005366112265, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002909446351508468}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3512428781930749, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002532983060440299}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3653029314145531, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002146107896814678}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.475872210666167, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031333580177863346}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3981455953816073, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002824532725234551}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.41379888832533746, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00237786243846331}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b56eb73d9282c9ae74a2722afd87f0bb34c7ecb3 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.048354827099848, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13173575451352945}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5658695177334656, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031270966615477226}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4772433101176052, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002917359278396573}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4953189142141289, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002271954969288382}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2857562961388842, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002592704630991091}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2406640346417443, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023517367710014212}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24880756415774488, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021197041292271416}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.420758211599137, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002882465972530548}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.353211891202741, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025199808294822496}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3670423199742575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021430589574260245}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4741438305573669, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003065753471768471}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3999905903170581, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028010787672272464}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.41508607573173817, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023504639188504377}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ebbeaf9e5639afa4c223c4a2cbabf1f450053f56 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.659789068321356, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09790592578075817}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5629082237331698, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031003560888099003}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48698263732189806, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00287742331110304}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5009803259010409, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022733438320721978}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2853458371364896, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026072609808903465}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24654716022968468, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023658238343093408}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.25262951809146383, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002143658780301566}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.41748637464334715, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028245699760167772}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.360690044589161, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002543868919808212}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3707998453692219, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002141988029007844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.47279540233959655, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030412213049662708}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4099044454840407, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028278158640341732}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42113638543719284, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023735545802868797}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1c3b126998077a544d5a46c9f4eb37b28bf8c871 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.823188838317058, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1368685740129237}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5616100796950558, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031091108469005055}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4850202390045189, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028303944848881626}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5006752815479694, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002293153386217313}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2862382834902288, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026324353670205162}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24621876290655678, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023348256981223997}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.253549804289564, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002160468600623493}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.42006777923537075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002838373199736789}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36307186033383765, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025521298014791567}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3742926890886437, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002195861570391623}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4750750508873225, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003062574123520972}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4112165114016575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002792171967020979}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42403643962685617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024063554475022685}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c048f7755a514b03ce98e2e0359ddf9c39f176ef --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.119120787601094, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023903339190153865}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2461239647280435, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004464088909716045}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15265221672321955, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026395478481095695}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.021414744477178442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009940965797788914}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.049032580222604115, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023171129192253166}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.02898750523181668, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013247193132835207}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09592721076197161, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019579324417703724}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.1978355142295738, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035176799456197697}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12235254548597051, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002020584245155245}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09716298214503066, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002022535774203556}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20129878308057195, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037572922765230963}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12420575571774427, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021512334045276564}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.171269553073038, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08153430802540716}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fcf763c7486bce04d2856ae341f227cdfd28a0c4 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10224744795994899, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019764379774743278}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.23590822077779397, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004177064380964356}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.13902284366105663, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024556497954162514}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.016207513348042157, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008615781781451241}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03905160442337228, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020375288076235304}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.02231228910998861, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011471564552570346}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08236658742598567, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015445410531161362}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19134487295792035, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003380183880201007}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11213145719440366, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019182613072779942}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08052607097380447, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015434958084231858}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.18734245397230653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003385262789984471}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.10976827761223337, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019415142922813897}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.9048271934902518, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06835860071628046}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a3696611a9d07bf0d84fd5ad807948fc10381911 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.22173311440321666, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004109442469093336}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.24407066905873215, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0039449863279907875}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2179588836123356, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0033902392785234987}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0489853613709537, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024629201330116494}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05128610907736208, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002273587180471874}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04679084112223886, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021370388355844076}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.16718537084915933, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003201387426185195}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.183772543674527, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0030394228586101703}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16402350220086148, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0026122531049125497}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.16900869672693924, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031978995143340755}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.18767663761745132, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031822595104393585}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1663715483433569, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0026310551428506287}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.314221689423562, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17638598922785836}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f7846200265bd82140b54cd754eeab4d5d01e8ca --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2337627371131494, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004249737953653732}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.22725208941553016, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004010986661230982}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2197892591864117, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003666804932828543}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.05339111111134872, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024509143835275216}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.049825868827123865, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022675300569590423}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04903344742670968, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021800365971211236}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.17463575759203218, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003402527377508609}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.1692107411887922, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031370692854018833}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16380342910756276, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002909510596814998}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.17650859372044322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003403724174446378}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.17225092039068918, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032378857630900775}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16595773590679566, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002927988954487852}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.754436883607044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.168222551241106}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..80033998395ee6a15e2465f28161f3ba19c67522 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0672089280846886, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004365308186585058}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.052674217830646665, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003299030898118782}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.053733463265401994, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003263549332918562}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.014382600033410985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014988508353396943}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.011774586389019105, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012243332638704686}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.012165431481051413, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012546534160519155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.052955195940592614, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003709170208574461}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.03946016910084321, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002530795032801481}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.04075928712930905, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002550780700931808}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.05345610024362179, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0037197148122439573}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04019695133532339, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025782928954495906}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.04131811744935463, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025725346112910707}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.08668412486361368, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.021081432536932964}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.json b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..07548a27a40389464c5fb8fe2c0725c7e2d9d167 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/agg.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5d05146f28a0dc3de8b37245aced17442c9e9659 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d86f8eb5a84aed1346681376a0a7e650d6660f7b673b974fdceb1b92bd927e00 +size 4207700 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..21333b34a97b03f755dda7c34fdb91a15146976d --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50f056458ed913962d90a870cb93a028b6b5703b6d91966485626b39475e06bd +size 4698295 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fc671829251b9893a1bfe40afcc2e67bb2cb024b --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145d96246e5e215e968ca7d4aa19e9e86c1f65129b2712ab9cdd89882417c7ff +size 5526385 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..69984a09e8b95d526b67f7d4ef26888efd66706e --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51cc1f3a5063a91591be3ae326483f12b5b3aeaff9b282e4ad323ab31e70f784 +size 6383679 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..eacebf041704910f437c483316dce1d0b888a404 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f8fae03f1a9fee8c03aa80e35ecf2766562612ce89ab3aa836f61c0a48954f1 +size 7265182 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1a29abaad73edd019f33c7952980ecfc5597ca66 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea5ed6c3c9f36d04ac7ab367749ca82bcd647a8bee90413244911539e393ba9 +size 8134668 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..92165caf67be0260d7459e1fb7e67e56a593784f --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adb3d2cf755985515814b016926a4fca84137689f9c161adc86615e9193f4f11 +size 7300984 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b13a17acd90841a25e6d33686294809dd55c2ede --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfaa135e3b814d2f7f70a3aad6275465750cc48d59ff2e475175fdd0c5f16f5d +size 12963259 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a40a6c78e7de80be42aa3401a365962d713d0195 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fe8323f30ca241d66367bdf16d28319671ea0e3041242fa46a606b43dba073e +size 18501610 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b18c24be74f080613113eeb9c7b9af1ce0320940 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387e65e34b46a50c228fad6d3e1cedeb938040b525df8e4b4f7ed5aa48e4c117 +size 23985147 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2115ed6f46270c2a5c484b824a3036dde5479692 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5c532f85b25d29b6f91cacaf81669f277f552ff08e24815ee09fa962cc4e77b +size 29356269 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..da7f969eee39cd866cb184641702807c5a1bf72c --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4691019a0a3c6d6becb467ca0ea88644dfc977295db8ff446b89362a7d4064ba +size 34781524 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..aa6c6992ca1c38c541aa7d9324c99a9dea44b040 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd56323ee596f31bc046b35593af7e22847677d6d3c187a7b885b54c1190f96 +size 4252036 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f4a980f94df5999b5cba9c623f5b72515c7fcf33 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160c9cb661770b63d919c19aae62dcaae67488ea98b9ebc5dc4f318b3a9f1cad +size 5025554 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ecee4d3b356a6352ebc7e82e11f3583ffcdf0483 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4325671fcbd547ea3ad4c1a2bd23430a57ee391001826c8aaf848bd33cbe7f37 +size 6110041 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..94e4c2d78130c6188d9ee1aad0310b3b0a2f8391 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c002bee39212cdc5bf8ca17a64d88e1c3f5c33bf66be59ff072d44cd843ae5bd +size 7193008 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..09ad241a85097212000e6fd96577a65e6a61ee41 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b291bd2331e3dd1016c6fa50f016b7a83b3336b11ec2c717f699e23bf2b631c7 +size 8278206 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ef7493e73aad240e1404cd75aa2aa4655787d256 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b35a35d056ee72d18c3f4e806797f564ad599d71370506cb87a8706b42733e2 +size 9362431 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..29754429b18ff5930be391f6de557b4d450682af --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:165c8101a7aee6c9dfc73ca595f83fc6401972d7cd20eb4f8f0b9802a8018ac2 +size 2788560 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..75b69cb85bf1982d496e5d008762355ecc2f1fd6 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d13074feec7626bdec7e8e9f65e8549e7b79e5a20a07f8573262c313634880 +size 5085802 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e054895e4138098e1155e2f285d76af7d8be1cb8 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7604b5514a1e78e21dcc95fde971bb4fbc85ae058b913e6a3cd9289255cb050f +size 7210010 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..364b72155eabfbefe60b66adf9bbef17514c318e --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef4f217ff4941b54244c3800fad1689944ed07b360a35595a6920b826be0313 +size 9462224 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..09ff6d9f09f3daf49089a3739120096a16754cdd --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92190a4a5bcc39f3014114e46175596412a4b648d2280322049589038d048eca +size 11626723 diff --git a/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.jsonl b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0aaee5fe029787cee5ee904b4410f5c9a2883942 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/examples.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65d4d0227bd4d26f3e9a99d734f3d030328c20d626c6f922920b3dc155977f38 +size 13896009 diff --git a/4b284boscarperplexity25/evaluation/generation/merged.csv b/4b284boscarperplexity25/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..f87d5ec1d98a3c45e986d2a749da8b4d812b02bd --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.14423544971256652 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.14423544971256652 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.21085921681195505 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.21085921681195505 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.24603831528858075 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.24603831528858075 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.24880756415774488 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.24880756415774488 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.25262951809146383 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.25262951809146383 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.253549804289564 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.253549804289564 +e2e_nlg_cleaned,5,average,multiple,0.22601997805864582 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.02898750523181668 +gem_xsum,0,median,rouge2_fmeasure,0.02898750523181668 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.02231228910998861 +gem_xsum,1,median,rouge2_fmeasure,0.02231228910998861 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.04679084112223886 +gem_xsum,2,median,rouge2_fmeasure,0.04679084112223886 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.04903344742670968 +gem_xsum,3,median,rouge2_fmeasure,0.04903344742670968 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.012165431481051413 +gem_xsum,4,median,rouge2_fmeasure,0.012165431481051413 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0 +gem_xsum,5,median,rouge2_fmeasure,0.0 +gem_xsum,5,average,multiple,0.026548252395300873 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04403608291299997 +web_nlg_en,0,median,rouge2_fmeasure,0.04403608291299997 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.0857526213458049 +web_nlg_en,1,median,rouge2_fmeasure,0.0857526213458049 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.11135315365861329 +web_nlg_en,2,median,rouge2_fmeasure,0.11135315365861329 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.1222000218776608 +web_nlg_en,3,median,rouge2_fmeasure,0.1222000218776608 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.13098409219865875 +web_nlg_en,4,median,rouge2_fmeasure,0.13098409219865875 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.1440780447118915 +web_nlg_en,5,median,rouge2_fmeasure,0.1440780447118915 +web_nlg_en,5,average,multiple,0.1064006694509382 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.021249378039416924 +wiki_lingua_en,0,median,rouge2_fmeasure,0.021249378039416924 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.05109974611655904 +wiki_lingua_en,1,median,rouge2_fmeasure,0.05109974611655904 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.07281302072231448 +wiki_lingua_en,2,median,rouge2_fmeasure,0.07281302072231448 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.060392462467898575 +wiki_lingua_en,3,median,rouge2_fmeasure,0.060392462467898575 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.018863111807267564 +wiki_lingua_en,4,median,rouge2_fmeasure,0.018863111807267564 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0028143315500782783 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0028143315500782783 +wiki_lingua_en,5,average,multiple,0.03787200845058914 diff --git a/4b284boscarperplexity25/evaluation/generation/merged.json b/4b284boscarperplexity25/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..3807f381a4e122405488ae7b31a62243affd6a61 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.39867475560543253, "bleu_stderr": 0.040710617580952874, "rouge1_fmeasure": 0.10122826174069728, "rouge1_fmeasure_stderr": 0.002030855444856264, "rouge1_precision": 0.07159145875770288, "rouge1_precision_stderr": 0.002283808001727691, "rouge1_recall": 0.33011129846709864, "rouge1_recall_stderr": 0.005549061845378151, "rouge2_fmeasure": 0.04403608291299997, "rouge2_fmeasure_stderr": 0.0012192330846573284, "rouge2_precision": 0.031026301819685173, "rouge2_precision_stderr": 0.0014049201598679499, "rouge2_recall": 0.141245281048318, "rouge2_recall_stderr": 0.003480506067615889, "rougeL_fmeasure": 0.09551945698986261, "rougeL_fmeasure_stderr": 0.0018848555816109573, "rougeL_precision": 0.06766144263497025, "rougeL_precision_stderr": 0.002200382676285986, "rougeL_recall": 0.3140572523976384, "rougeL_recall_stderr": 0.005291909825302324, "rougeLsum_fmeasure": 0.09445387353772787, "rougeLsum_fmeasure_stderr": 0.0019087634807937826, "rougeLsum_precision": 0.06725304160135988, "rougeLsum_precision_stderr": 0.0022287248715200532, "rougeLsum_recall": 0.30648495757927524, "rougeLsum_recall_stderr": 0.0051352153658538804}}, "1": {"PALM_prompt": {"bleu": 0.5977516671543485, "bleu_stderr": 0.03455978435410294, "rouge1_fmeasure": 0.1711963022842594, "rouge1_fmeasure_stderr": 0.0038816812182382796, "rouge1_precision": 0.15329732392184445, "rouge1_precision_stderr": 0.004761968102469258, "rouge1_recall": 0.33370364652423734, "rouge1_recall_stderr": 0.005246547259909354, "rouge2_fmeasure": 0.0857526213458049, "rouge2_fmeasure_stderr": 0.002597828881141045, "rouge2_precision": 0.07679311519695951, "rouge2_precision_stderr": 0.0031236928525937855, "rouge2_recall": 0.16882814193332238, "rouge2_recall_stderr": 0.003640171016562461, "rougeL_fmeasure": 0.1534319102614937, "rougeL_fmeasure_stderr": 0.0033050845225794535, "rougeL_precision": 0.13595872134603265, "rougeL_precision_stderr": 0.00415929123413415, "rougeL_recall": 0.3095423761616577, "rougeL_recall_stderr": 0.004810670635852979, "rougeLsum_fmeasure": 0.1570680694188298, "rougeLsum_fmeasure_stderr": 0.003409305514835227, "rougeLsum_precision": 0.13980848021437933, "rougeLsum_precision_stderr": 0.004295380685702628, "rougeLsum_recall": 0.31383788958058917, "rougeLsum_recall_stderr": 0.00486300699089206}}, "2": {"PALM_prompt": {"bleu": 0.8503915955853156, "bleu_stderr": 0.05968548918805337, "rouge1_fmeasure": 0.2091458628301747, "rouge1_fmeasure_stderr": 0.004368376241819497, "rouge1_precision": 0.1917742263420682, "rouge1_precision_stderr": 0.005385679944541483, "rouge1_recall": 0.3738096503830145, "rouge1_recall_stderr": 0.005103325336420911, "rouge2_fmeasure": 0.11135315365861329, "rouge2_fmeasure_stderr": 0.003118659844197972, "rouge2_precision": 0.10356295618475722, "rouge2_precision_stderr": 0.003683856363979968, "rouge2_recall": 0.19885995393306385, "rouge2_recall_stderr": 0.003903858113021774, "rougeL_fmeasure": 0.18644863944216591, "rougeL_fmeasure_stderr": 0.003718060906678577, "rougeL_precision": 0.16851904595769937, "rougeL_precision_stderr": 0.004611458862978508, "rougeL_recall": 0.34493506529791307, "rougeL_recall_stderr": 0.004681893250444328, "rougeLsum_fmeasure": 0.19076821047822043, "rougeLsum_fmeasure_stderr": 0.0038409906523227373, "rougeLsum_precision": 0.17381481236849558, "rougeLsum_precision_stderr": 0.004812357218174625, "rougeLsum_recall": 0.34931922765393125, "rougeLsum_recall_stderr": 0.004727442594540538}}, "3": {"PALM_prompt": {"bleu": 1.0608115765539845, "bleu_stderr": 0.05486212986821941, "rouge1_fmeasure": 0.22576763475110825, "rouge1_fmeasure_stderr": 0.004567332560152851, "rouge1_precision": 0.2109031935726629, "rouge1_precision_stderr": 0.005657574041201383, "rouge1_recall": 0.38579341297680214, "rouge1_recall_stderr": 0.005263285665966895, "rouge2_fmeasure": 0.1222000218776608, "rouge2_fmeasure_stderr": 0.0032692358141888987, "rouge2_precision": 0.11718228855429308, "rouge2_precision_stderr": 0.0039778102828192516, "rouge2_recall": 0.20867650284917746, "rouge2_recall_stderr": 0.004090722696838276, "rougeL_fmeasure": 0.19994721976859944, "rougeL_fmeasure_stderr": 0.003893228020122849, "rougeL_precision": 0.18502061308156897, "rougeL_precision_stderr": 0.00494101709613097, "rougeL_recall": 0.3541127463117956, "rougeL_recall_stderr": 0.0048313529786746376, "rougeLsum_fmeasure": 0.2055386770672947, "rougeLsum_fmeasure_stderr": 0.004032516312771944, "rougeLsum_precision": 0.19117483049363265, "rougeLsum_precision_stderr": 0.005112752281414307, "rougeLsum_recall": 0.35990671696452886, "rougeLsum_recall_stderr": 0.004900147798514321}}, "4": {"PALM_prompt": {"bleu": 1.158092237390548, "bleu_stderr": 0.07452530667512201, "rouge1_fmeasure": 0.2406471321436084, "rouge1_fmeasure_stderr": 0.004596728562288805, "rouge1_precision": 0.2295067379234449, "rouge1_precision_stderr": 0.0059287703100318265, "rouge1_recall": 0.40298988844952865, "rouge1_recall_stderr": 0.00497792321884406, "rouge2_fmeasure": 0.13098409219865875, "rouge2_fmeasure_stderr": 0.003365830035361665, "rouge2_precision": 0.12859268415342448, "rouge2_precision_stderr": 0.004204050255493124, "rouge2_recall": 0.21890193742839065, "rouge2_recall_stderr": 0.003990051975819316, "rougeL_fmeasure": 0.21211741223916908, "rougeL_fmeasure_stderr": 0.003973821558556186, "rougeL_precision": 0.19954826063286818, "rougeL_precision_stderr": 0.005140545573172722, "rougeL_recall": 0.36706220250566124, "rougeL_recall_stderr": 0.004574558237043198, "rougeLsum_fmeasure": 0.21938170732231038, "rougeLsum_fmeasure_stderr": 0.0041053949186676784, "rougeLsum_precision": 0.20786819450493935, "rougeLsum_precision_stderr": 0.005347471613133442, "rougeLsum_recall": 0.37558574187088717, "rougeLsum_recall_stderr": 0.0046496158518284265}}, "5": {"PALM_prompt": {"bleu": 1.3912791138065583, "bleu_stderr": 0.07547788285778162, "rouge1_fmeasure": 0.25846836171966886, "rouge1_fmeasure_stderr": 0.004870562806193873, "rouge1_precision": 0.24790045979902117, "rouge1_precision_stderr": 0.006118840902841762, "rouge1_recall": 0.4151553294689575, "rouge1_recall_stderr": 0.005017236192009034, "rouge2_fmeasure": 0.1440780447118915, "rouge2_fmeasure_stderr": 0.003537122239634605, "rouge2_precision": 0.14286641755431828, "rouge2_precision_stderr": 0.004399109330777923, "rouge2_recall": 0.2303936349020371, "rouge2_recall_stderr": 0.004075946874373824, "rougeL_fmeasure": 0.22741941196495352, "rougeL_fmeasure_stderr": 0.004181213734611599, "rougeL_precision": 0.21538085312440458, "rougeL_precision_stderr": 0.00527177793605653, "rougeL_recall": 0.3783352287326247, "rougeL_recall_stderr": 0.004644197217937787, "rougeLsum_fmeasure": 0.23598364900790592, "rougeLsum_fmeasure_stderr": 0.0043592478927788475, "rougeLsum_precision": 0.22513353909188877, "rougeLsum_precision_stderr": 0.005531377737909901, "rougeLsum_recall": 0.3875077488648253, "rougeLsum_recall_stderr": 0.0047015995940884545}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.3716396460310256, "bleu_stderr": 0.053237921475075736, "rouge1_fmeasure": 0.09571267819389127, "rouge1_fmeasure_stderr": 0.0022899105765691293, "rouge1_precision": 0.0983375818863275, "rouge1_precision_stderr": 0.0029053806058016835, "rouge1_recall": 0.12947888309750052, "rouge1_recall_stderr": 0.0031473479280467198, "rouge2_fmeasure": 0.021249378039416924, "rouge2_fmeasure_stderr": 0.0008023915053086402, "rouge2_precision": 0.019660602529021045, "rouge2_precision_stderr": 0.0009095314106449951, "rouge2_recall": 0.02987435711226961, "rouge2_recall_stderr": 0.0012172920898615256, "rougeL_fmeasure": 0.07569979604312303, "rougeL_fmeasure_stderr": 0.0017489838355855545, "rougeL_precision": 0.07993490033371602, "rougeL_precision_stderr": 0.0025495157441145547, "rougeL_recall": 0.10403034397768768, "rougeL_recall_stderr": 0.002524536215776094, "rougeLsum_fmeasure": 0.08804228557786513, "rougeLsum_fmeasure_stderr": 0.0021147247236710737, "rougeLsum_precision": 0.09140255938348718, "rougeLsum_precision_stderr": 0.0027879956998521685, "rougeLsum_recall": 0.11935909833374875, "rougeLsum_recall_stderr": 0.002924586364247349}}, "1": {"tldr_en": {"bleu": 3.1039054275536215, "bleu_stderr": 0.10890100851738928, "rouge1_fmeasure": 0.19520859102820864, "rouge1_fmeasure_stderr": 0.0023238276963889674, "rouge1_precision": 0.2744539537425681, "rouge1_precision_stderr": 0.004094328235431946, "rouge1_recall": 0.20170838774611544, "rouge1_recall_stderr": 0.002762665652290496, "rouge2_fmeasure": 0.05109974611655904, "rouge2_fmeasure_stderr": 0.0013693724913750134, "rouge2_precision": 0.07934207376791574, "rouge2_precision_stderr": 0.002463348090483984, "rouge2_recall": 0.05161000248015028, "rouge2_recall_stderr": 0.001498911556068985, "rougeL_fmeasure": 0.15103480090963925, "rougeL_fmeasure_stderr": 0.0018026481462705155, "rougeL_precision": 0.21534515919762, "rougeL_precision_stderr": 0.0033577432477576922, "rougeL_recall": 0.15642273279178595, "rougeL_recall_stderr": 0.0021832373243515003, "rougeLsum_fmeasure": 0.18411759086730042, "rougeLsum_fmeasure_stderr": 0.0021842348386272325, "rougeLsum_precision": 0.25936704726034565, "rougeLsum_precision_stderr": 0.003901950893364067, "rougeLsum_recall": 0.19051893854427063, "rougeLsum_recall_stderr": 0.002613048263614744}}, "2": {"tldr_en": {"bleu": 4.021085183806486, "bleu_stderr": 0.10816463413951247, "rouge1_fmeasure": 0.24085996898585788, "rouge1_fmeasure_stderr": 0.002327696120886891, "rouge1_precision": 0.3460381570015358, "rouge1_precision_stderr": 0.004003344331842124, "rouge1_recall": 0.23464288041344536, "rouge1_recall_stderr": 0.0027534125642066803, "rouge2_fmeasure": 0.07281302072231448, "rouge2_fmeasure_stderr": 0.0015331223512556303, "rouge2_precision": 0.11151199462195266, "rouge2_precision_stderr": 0.0026567771627046344, "rouge2_recall": 0.06934611067556229, "rouge2_recall_stderr": 0.001590260268305198, "rougeL_fmeasure": 0.18727237241373534, "rougeL_fmeasure_stderr": 0.001864663335169569, "rougeL_precision": 0.2720546258349463, "rougeL_precision_stderr": 0.003358764729317707, "rougeL_recall": 0.18272653217328982, "rougeL_recall_stderr": 0.002227548532418399, "rougeLsum_fmeasure": 0.22759593452074767, "rougeLsum_fmeasure_stderr": 0.0022262933288697143, "rougeLsum_precision": 0.3279410319312666, "rougeLsum_precision_stderr": 0.003860840910318087, "rougeLsum_recall": 0.22156477723365048, "rougeLsum_recall_stderr": 0.002619713558025792}}, "3": {"tldr_en": {"bleu": 2.8492374969628904, "bleu_stderr": 0.08750896589246163, "rouge1_fmeasure": 0.2013812252122371, "rouge1_fmeasure_stderr": 0.0026442870837295527, "rouge1_precision": 0.29806862880783386, "rouge1_precision_stderr": 0.004379212298416797, "rouge1_recall": 0.19523732178409814, "rouge1_recall_stderr": 0.0030541305702034035, "rouge2_fmeasure": 0.060392462467898575, "rouge2_fmeasure_stderr": 0.0014617335431351905, "rouge2_precision": 0.0944687677366076, "rouge2_precision_stderr": 0.002549028495799297, "rouge2_recall": 0.05859589734154174, "rouge2_recall_stderr": 0.0015957713051932727, "rougeL_fmeasure": 0.1575651913948673, "rougeL_fmeasure_stderr": 0.0020868868630608897, "rougeL_precision": 0.23529644412419154, "rougeL_precision_stderr": 0.0035766830650948893, "rougeL_recall": 0.15306469354602847, "rougeL_recall_stderr": 0.0024463484798115413, "rougeLsum_fmeasure": 0.1901383608530664, "rougeLsum_fmeasure_stderr": 0.0025143987155999636, "rougeLsum_precision": 0.28262725801972627, "rougeLsum_precision_stderr": 0.004215517896622171, "rougeLsum_recall": 0.18413938272093217, "rougeLsum_recall_stderr": 0.0029006585330709185}}, "4": {"tldr_en": {"bleu": 0.04222973749038275, "bleu_stderr": 0.008257164616079426, "rouge1_fmeasure": 0.06426126220521501, "rouge1_fmeasure_stderr": 0.0022879021970431588, "rouge1_precision": 0.09744191367423756, "rouge1_precision_stderr": 0.0036149483966249, "rouge1_recall": 0.06351396221418004, "rouge1_recall_stderr": 0.0024571906285560316, "rouge2_fmeasure": 0.018863111807267564, "rouge2_fmeasure_stderr": 0.0009913845983569886, "rouge2_precision": 0.030295987904196204, "rouge2_precision_stderr": 0.0017243942607559877, "rouge2_recall": 0.018491602504902276, "rouge2_recall_stderr": 0.001060705507474276, "rougeL_fmeasure": 0.05089928957613344, "rougeL_fmeasure_stderr": 0.0018155956397895659, "rougeL_precision": 0.07836036552522192, "rougeL_precision_stderr": 0.0029649730324953685, "rougeL_recall": 0.050259543495048555, "rougeL_recall_stderr": 0.0019585266496901644, "rougeLsum_fmeasure": 0.060406863253473476, "rougeLsum_fmeasure_stderr": 0.002154837434813025, "rougeLsum_precision": 0.09237908655494775, "rougeLsum_precision_stderr": 0.0034638908963912757, "rougeLsum_recall": 0.05946970338742905, "rougeLsum_recall_stderr": 0.002300251520662075}}, "5": {"tldr_en": {"bleu": 1.846919172678707e-16, "bleu_stderr": 2.0413111014482104e-15, "rouge1_fmeasure": 0.00953238699480448, "rouge1_fmeasure_stderr": 0.0009587457771524576, "rouge1_precision": 0.015305807829806464, "rouge1_precision_stderr": 0.0016276583452807518, "rouge1_recall": 0.009349321645652907, "rouge1_recall_stderr": 0.0010109706029017072, "rouge2_fmeasure": 0.0028143315500782783, "rouge2_fmeasure_stderr": 0.00039639159831938314, "rouge2_precision": 0.004958444950717817, "rouge2_precision_stderr": 0.00078608095281603, "rouge2_recall": 0.0026826988588868894, "rouge2_recall_stderr": 0.0003968858121931347, "rougeL_fmeasure": 0.007529872183034152, "rougeL_fmeasure_stderr": 0.0007598887929454067, "rougeL_precision": 0.01243346272156789, "rougeL_precision_stderr": 0.0013729751550239605, "rougeL_recall": 0.0073466093897751935, "rougeL_recall_stderr": 0.0007905623261997666, "rougeLsum_fmeasure": 0.009188390133961012, "rougeLsum_fmeasure_stderr": 0.0009205800070516369, "rougeLsum_precision": 0.014878898488927081, "rougeLsum_precision_stderr": 0.0015914308498318637, "rougeLsum_recall": 0.008983079259713787, "rougeLsum_recall_stderr": 0.0009667267066960596}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 8.198586697938474, "bleu_stderr": 0.054371247913430655, "rouge1_fmeasure": 0.3022704849875045, "rouge1_fmeasure_stderr": 0.0020893712232562985, "rouge1_precision": 0.4231953254379122, "rouge1_precision_stderr": 0.0056811184198751995, "rouge1_recall": 0.41981351300313063, "rouge1_recall_stderr": 0.004043734085642848, "rouge2_fmeasure": 0.14423544971256652, "rouge2_fmeasure_stderr": 0.0014159696060948752, "rouge2_precision": 0.3051389569292783, "rouge2_precision_stderr": 0.006594915459228414, "rouge2_recall": 0.20265608384266906, "rouge2_recall_stderr": 0.002503934686098032, "rougeL_fmeasure": 0.2534973577384106, "rougeL_fmeasure_stderr": 0.001628749077015259, "rougeL_precision": 0.3836380762491933, "rougeL_precision_stderr": 0.005946261746966947, "rougeL_recall": 0.3484722408438825, "rougeL_recall_stderr": 0.0033554610252052412, "rougeLsum_fmeasure": 0.26893260867745544, "rougeLsum_fmeasure_stderr": 0.0018533435510961985, "rougeLsum_precision": 0.3962431609974829, "rougeLsum_precision_stderr": 0.005875394355670361, "rougeLsum_recall": 0.3703437525515446, "rougeLsum_recall_stderr": 0.003620950376631745}}, "1": {"generate_text_restaurant": {"bleu": 11.954988812929066, "bleu_stderr": 0.14638391482320653, "rouge1_fmeasure": 0.4537564177673297, "rouge1_fmeasure_stderr": 0.0023632144199618754, "rouge1_precision": 0.5311859863746525, "rouge1_precision_stderr": 0.0031772485874862837, "rouge1_recall": 0.43624994053743726, "rouge1_recall_stderr": 0.0030327438873743837, "rouge2_fmeasure": 0.21085921681195505, "rouge2_fmeasure_stderr": 0.0020229136192088815, "rouge2_precision": 0.24897172805854162, "rouge2_precision_stderr": 0.002559248595927766, "rouge2_recall": 0.20337318700614485, "rouge2_recall_stderr": 0.0022235996604563096, "rougeL_fmeasure": 0.32899874690483255, "rougeL_fmeasure_stderr": 0.002049880594632269, "rougeL_precision": 0.38733665631563075, "rougeL_precision_stderr": 0.002821853296737016, "rougeL_recall": 0.315877576992612, "rougeL_recall_stderr": 0.0024697936355976423, "rougeLsum_fmeasure": 0.37054424699208366, "rougeLsum_fmeasure_stderr": 0.002335750021395727, "rougeLsum_precision": 0.4347157576529157, "rougeLsum_precision_stderr": 0.0030856903887374197, "rougeLsum_recall": 0.35598940596786033, "rougeLsum_recall_stderr": 0.002795354387124902}}, "2": {"generate_text_restaurant": {"bleu": 14.73609934719948, "bleu_stderr": 0.1706582991235465, "rouge1_fmeasure": 0.49441630977548484, "rouge1_fmeasure_stderr": 0.0022862001339864647, "rouge1_precision": 0.5680092384554517, "rouge1_precision_stderr": 0.0031495723548982087, "rouge1_recall": 0.4759328537809361, "rouge1_recall_stderr": 0.0029386091005988964, "rouge2_fmeasure": 0.24603831528858075, "rouge2_fmeasure_stderr": 0.0021292376417195715, "rouge2_precision": 0.28544083962132866, "rouge2_precision_stderr": 0.0026946059983280406, "rouge2_recall": 0.23719216451336508, "rouge2_recall_stderr": 0.0023245662185703573, "rougeL_fmeasure": 0.3653029314145531, "rougeL_fmeasure_stderr": 0.002146107896814678, "rougeL_precision": 0.42134005366112265, "rougeL_precision_stderr": 0.002909446351508468, "rougeL_recall": 0.3512428781930749, "rougeL_recall_stderr": 0.002532983060440299, "rougeLsum_fmeasure": 0.41379888832533746, "rougeLsum_fmeasure_stderr": 0.00237786243846331, "rougeLsum_precision": 0.475872210666167, "rougeLsum_precision_stderr": 0.0031333580177863346, "rougeLsum_recall": 0.3981455953816073, "rougeLsum_recall_stderr": 0.002824532725234551}}, "3": {"generate_text_restaurant": {"bleu": 15.048354827099848, "bleu_stderr": 0.13173575451352945, "rouge1_fmeasure": 0.4953189142141289, "rouge1_fmeasure_stderr": 0.002271954969288382, "rouge1_precision": 0.5658695177334656, "rouge1_precision_stderr": 0.0031270966615477226, "rouge1_recall": 0.4772433101176052, "rouge1_recall_stderr": 0.002917359278396573, "rouge2_fmeasure": 0.24880756415774488, "rouge2_fmeasure_stderr": 0.0021197041292271416, "rouge2_precision": 0.2857562961388842, "rouge2_precision_stderr": 0.002592704630991091, "rouge2_recall": 0.2406640346417443, "rouge2_recall_stderr": 0.0023517367710014212, "rougeL_fmeasure": 0.3670423199742575, "rougeL_fmeasure_stderr": 0.0021430589574260245, "rougeL_precision": 0.420758211599137, "rougeL_precision_stderr": 0.002882465972530548, "rougeL_recall": 0.353211891202741, "rougeL_recall_stderr": 0.0025199808294822496, "rougeLsum_fmeasure": 0.41508607573173817, "rougeLsum_fmeasure_stderr": 0.0023504639188504377, "rougeLsum_precision": 0.4741438305573669, "rougeLsum_precision_stderr": 0.003065753471768471, "rougeLsum_recall": 0.3999905903170581, "rougeLsum_recall_stderr": 0.0028010787672272464}}, "4": {"generate_text_restaurant": {"bleu": 15.659789068321356, "bleu_stderr": 0.09790592578075817, "rouge1_fmeasure": 0.5009803259010409, "rouge1_fmeasure_stderr": 0.0022733438320721978, "rouge1_precision": 0.5629082237331698, "rouge1_precision_stderr": 0.0031003560888099003, "rouge1_recall": 0.48698263732189806, "rouge1_recall_stderr": 0.00287742331110304, "rouge2_fmeasure": 0.25262951809146383, "rouge2_fmeasure_stderr": 0.002143658780301566, "rouge2_precision": 0.2853458371364896, "rouge2_precision_stderr": 0.0026072609808903465, "rouge2_recall": 0.24654716022968468, "rouge2_recall_stderr": 0.0023658238343093408, "rougeL_fmeasure": 0.3707998453692219, "rougeL_fmeasure_stderr": 0.002141988029007844, "rougeL_precision": 0.41748637464334715, "rougeL_precision_stderr": 0.0028245699760167772, "rougeL_recall": 0.360690044589161, "rougeL_recall_stderr": 0.002543868919808212, "rougeLsum_fmeasure": 0.42113638543719284, "rougeLsum_fmeasure_stderr": 0.0023735545802868797, "rougeLsum_precision": 0.47279540233959655, "rougeLsum_precision_stderr": 0.0030412213049662708, "rougeLsum_recall": 0.4099044454840407, "rougeLsum_recall_stderr": 0.0028278158640341732}}, "5": {"generate_text_restaurant": {"bleu": 15.823188838317058, "bleu_stderr": 0.1368685740129237, "rouge1_fmeasure": 0.5006752815479694, "rouge1_fmeasure_stderr": 0.002293153386217313, "rouge1_precision": 0.5616100796950558, "rouge1_precision_stderr": 0.0031091108469005055, "rouge1_recall": 0.4850202390045189, "rouge1_recall_stderr": 0.0028303944848881626, "rouge2_fmeasure": 0.253549804289564, "rouge2_fmeasure_stderr": 0.002160468600623493, "rouge2_precision": 0.2862382834902288, "rouge2_precision_stderr": 0.0026324353670205162, "rouge2_recall": 0.24621876290655678, "rouge2_recall_stderr": 0.0023348256981223997, "rougeL_fmeasure": 0.3742926890886437, "rougeL_fmeasure_stderr": 0.002195861570391623, "rougeL_precision": 0.42006777923537075, "rougeL_precision_stderr": 0.002838373199736789, "rougeL_recall": 0.36307186033383765, "rougeL_recall_stderr": 0.0025521298014791567, "rougeLsum_fmeasure": 0.42403643962685617, "rougeLsum_fmeasure_stderr": 0.0024063554475022685, "rougeLsum_precision": 0.4750750508873225, "rougeLsum_precision_stderr": 0.003062574123520972, "rougeLsum_recall": 0.4112165114016575, "rougeLsum_recall_stderr": 0.002792171967020979}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.171269553073038, "bleu_stderr": 0.08153430802540716, "rouge1_fmeasure": 0.15265221672321955, "rouge1_fmeasure_stderr": 0.0026395478481095695, "rouge1_precision": 0.119120787601094, "rouge1_precision_stderr": 0.0023903339190153865, "rouge1_recall": 0.2461239647280435, "rouge1_recall_stderr": 0.004464088909716045, "rouge2_fmeasure": 0.02898750523181668, "rouge2_fmeasure_stderr": 0.0013247193132835207, "rouge2_precision": 0.021414744477178442, "rouge2_precision_stderr": 0.0009940965797788914, "rouge2_recall": 0.049032580222604115, "rouge2_recall_stderr": 0.0023171129192253166, "rougeL_fmeasure": 0.12235254548597051, "rougeL_fmeasure_stderr": 0.002020584245155245, "rougeL_precision": 0.09592721076197161, "rougeL_precision_stderr": 0.0019579324417703724, "rougeL_recall": 0.1978355142295738, "rougeL_recall_stderr": 0.0035176799456197697, "rougeLsum_fmeasure": 0.12420575571774427, "rougeLsum_fmeasure_stderr": 0.0021512334045276564, "rougeLsum_precision": 0.09716298214503066, "rougeLsum_precision_stderr": 0.002022535774203556, "rougeLsum_recall": 0.20129878308057195, "rougeLsum_recall_stderr": 0.0037572922765230963}}, "1": {"article_DOC_summary": {"bleu": 0.9048271934902518, "bleu_stderr": 0.06835860071628046, "rouge1_fmeasure": 0.13902284366105663, "rouge1_fmeasure_stderr": 0.0024556497954162514, "rouge1_precision": 0.10224744795994899, "rouge1_precision_stderr": 0.0019764379774743278, "rouge1_recall": 0.23590822077779397, "rouge1_recall_stderr": 0.004177064380964356, "rouge2_fmeasure": 0.02231228910998861, "rouge2_fmeasure_stderr": 0.0011471564552570346, "rouge2_precision": 0.016207513348042157, "rouge2_precision_stderr": 0.0008615781781451241, "rouge2_recall": 0.03905160442337228, "rouge2_recall_stderr": 0.0020375288076235304, "rougeL_fmeasure": 0.11213145719440366, "rougeL_fmeasure_stderr": 0.0019182613072779942, "rougeL_precision": 0.08236658742598567, "rougeL_precision_stderr": 0.0015445410531161362, "rougeL_recall": 0.19134487295792035, "rougeL_recall_stderr": 0.003380183880201007, "rougeLsum_fmeasure": 0.10976827761223337, "rougeLsum_fmeasure_stderr": 0.0019415142922813897, "rougeLsum_precision": 0.08052607097380447, "rougeLsum_precision_stderr": 0.0015434958084231858, "rougeLsum_recall": 0.18734245397230653, "rougeLsum_recall_stderr": 0.003385262789984471}}, "2": {"article_DOC_summary": {"bleu": 2.314221689423562, "bleu_stderr": 0.17638598922785836, "rouge1_fmeasure": 0.2179588836123356, "rouge1_fmeasure_stderr": 0.0033902392785234987, "rouge1_precision": 0.22173311440321666, "rouge1_precision_stderr": 0.004109442469093336, "rouge1_recall": 0.24407066905873215, "rouge1_recall_stderr": 0.0039449863279907875, "rouge2_fmeasure": 0.04679084112223886, "rouge2_fmeasure_stderr": 0.0021370388355844076, "rouge2_precision": 0.0489853613709537, "rouge2_precision_stderr": 0.0024629201330116494, "rouge2_recall": 0.05128610907736208, "rouge2_recall_stderr": 0.002273587180471874, "rougeL_fmeasure": 0.16402350220086148, "rougeL_fmeasure_stderr": 0.0026122531049125497, "rougeL_precision": 0.16718537084915933, "rougeL_precision_stderr": 0.003201387426185195, "rougeL_recall": 0.183772543674527, "rougeL_recall_stderr": 0.0030394228586101703, "rougeLsum_fmeasure": 0.1663715483433569, "rougeLsum_fmeasure_stderr": 0.0026310551428506287, "rougeLsum_precision": 0.16900869672693924, "rougeLsum_precision_stderr": 0.0031978995143340755, "rougeLsum_recall": 0.18767663761745132, "rougeLsum_recall_stderr": 0.0031822595104393585}}, "3": {"article_DOC_summary": {"bleu": 2.754436883607044, "bleu_stderr": 0.168222551241106, "rouge1_fmeasure": 0.2197892591864117, "rouge1_fmeasure_stderr": 0.003666804932828543, "rouge1_precision": 0.2337627371131494, "rouge1_precision_stderr": 0.004249737953653732, "rouge1_recall": 0.22725208941553016, "rouge1_recall_stderr": 0.004010986661230982, "rouge2_fmeasure": 0.04903344742670968, "rouge2_fmeasure_stderr": 0.0021800365971211236, "rouge2_precision": 0.05339111111134872, "rouge2_precision_stderr": 0.0024509143835275216, "rouge2_recall": 0.049825868827123865, "rouge2_recall_stderr": 0.0022675300569590423, "rougeL_fmeasure": 0.16380342910756276, "rougeL_fmeasure_stderr": 0.002909510596814998, "rougeL_precision": 0.17463575759203218, "rougeL_precision_stderr": 0.003402527377508609, "rougeL_recall": 0.1692107411887922, "rougeL_recall_stderr": 0.0031370692854018833, "rougeLsum_fmeasure": 0.16595773590679566, "rougeLsum_fmeasure_stderr": 0.002927988954487852, "rougeLsum_precision": 0.17650859372044322, "rougeLsum_precision_stderr": 0.003403724174446378, "rougeLsum_recall": 0.17225092039068918, "rougeLsum_recall_stderr": 0.0032378857630900775}}, "4": {"article_DOC_summary": {"bleu": 0.08668412486361368, "bleu_stderr": 0.021081432536932964, "rouge1_fmeasure": 0.053733463265401994, "rouge1_fmeasure_stderr": 0.003263549332918562, "rouge1_precision": 0.0672089280846886, "rouge1_precision_stderr": 0.004365308186585058, "rouge1_recall": 0.052674217830646665, "rouge1_recall_stderr": 0.003299030898118782, "rouge2_fmeasure": 0.012165431481051413, "rouge2_fmeasure_stderr": 0.0012546534160519155, "rouge2_precision": 0.014382600033410985, "rouge2_precision_stderr": 0.0014988508353396943, "rouge2_recall": 0.011774586389019105, "rouge2_recall_stderr": 0.0012243332638704686, "rougeL_fmeasure": 0.04075928712930905, "rougeL_fmeasure_stderr": 0.002550780700931808, "rougeL_precision": 0.052955195940592614, "rougeL_precision_stderr": 0.003709170208574461, "rougeL_recall": 0.03946016910084321, "rougeL_recall_stderr": 0.002530795032801481, "rougeLsum_fmeasure": 0.04131811744935463, "rougeLsum_fmeasure_stderr": 0.0025725346112910707, "rougeLsum_precision": 0.05345610024362179, "rougeLsum_precision_stderr": 0.0037197148122439573, "rougeLsum_recall": 0.04019695133532339, "rougeLsum_recall_stderr": 0.0025782928954495906}}, "5": {"article_DOC_summary": {"bleu": 0.0, "bleu_stderr": 0.0, "rouge1_fmeasure": 0.0, "rouge1_fmeasure_stderr": 0.0, "rouge1_precision": 0.0, "rouge1_precision_stderr": 0.0, "rouge1_recall": 0.0, "rouge1_recall_stderr": 0.0, "rouge2_fmeasure": 0.0, "rouge2_fmeasure_stderr": 0.0, "rouge2_precision": 0.0, "rouge2_precision_stderr": 0.0, "rouge2_recall": 0.0, "rouge2_recall_stderr": 0.0, "rougeL_fmeasure": 0.0, "rougeL_fmeasure_stderr": 0.0, "rougeL_precision": 0.0, "rougeL_precision_stderr": 0.0, "rougeL_recall": 0.0, "rougeL_recall_stderr": 0.0, "rougeLsum_fmeasure": 0.0, "rougeLsum_fmeasure_stderr": 0.0, "rougeLsum_precision": 0.0, "rougeLsum_precision_stderr": 0.0, "rougeLsum_recall": 0.0, "rougeLsum_recall_stderr": 0.0}}}} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..215006cd2f0bf89f69d4e280da42d3c182a303b9 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.39867475560543253, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.040710617580952874 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07159145875770288, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002283808001727691 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.33011129846709864, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005549061845378151 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10122826174069728, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002030855444856264 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.031026301819685173, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0014049201598679499 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.141245281048318, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003480506067615889 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04403608291299997, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012192330846573284 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06766144263497025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002200382676285986 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3140572523976384, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005291909825302324 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09551945698986261, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018848555816109573 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06725304160135988, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0022287248715200532 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.30648495757927524, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0051352153658538804 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09445387353772787, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019087634807937826 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4c79da83eff3962c3e9a827ec74089338c696fc6 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5977516671543485, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03455978435410294 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.15329732392184445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004761968102469258 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.33370364652423734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005246547259909354 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1711963022842594, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0038816812182382796 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.07679311519695951, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0031236928525937855 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.16882814193332238, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003640171016562461 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0857526213458049, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002597828881141045 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.13595872134603265, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00415929123413415 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3095423761616577, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004810670635852979 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1534319102614937, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0033050845225794535 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.13980848021437933, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004295380685702628 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.31383788958058917, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00486300699089206 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1570680694188298, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003409305514835227 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ca403ad7495c5a0c9124867196e520cf22a52abc --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8503915955853156, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05968548918805337 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1917742263420682, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005385679944541483 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3738096503830145, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005103325336420911 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2091458628301747, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004368376241819497 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10356295618475722, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003683856363979968 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19885995393306385, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003903858113021774 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11135315365861329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003118659844197972 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16851904595769937, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004611458862978508 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34493506529791307, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004681893250444328 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18644863944216591, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003718060906678577 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.17381481236849558, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004812357218174625 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.34931922765393125, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004727442594540538 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.19076821047822043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0038409906523227373 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0a447f57857c6a1538774c75fdede5a74eab7f46 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.0608115765539845, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05486212986821941 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.2109031935726629, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005657574041201383 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38579341297680214, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005263285665966895 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.22576763475110825, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004567332560152851 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.11718228855429308, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0039778102828192516 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20867650284917746, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004090722696838276 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.1222000218776608, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0032692358141888987 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.18502061308156897, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00494101709613097 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3541127463117956, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0048313529786746376 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.19994721976859944, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003893228020122849 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.19117483049363265, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005112752281414307 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35990671696452886, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004900147798514321 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.2055386770672947, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004032516312771944 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f135c077fa2f4ba5cd87f8a07e57fcea6b1c0a7e --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.158092237390548, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07452530667512201 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.2295067379234449, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0059287703100318265 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40298988844952865, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00497792321884406 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2406471321436084, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004596728562288805 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.12859268415342448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004204050255493124 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21890193742839065, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003990051975819316 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.13098409219865875, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003365830035361665 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.19954826063286818, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.005140545573172722 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36706220250566124, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004574558237043198 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.21211741223916908, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003973821558556186 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.20786819450493935, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005347471613133442 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.37558574187088717, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0046496158518284265 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.21938170732231038, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0041053949186676784 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..05603d7ed534010bf3e337e2e55f3e0a9063af63 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.3912791138065583, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07547788285778162 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.24790045979902117, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.006118840902841762 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4151553294689575, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005017236192009034 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.25846836171966886, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004870562806193873 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.14286641755431828, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004399109330777923 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2303936349020371, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004075946874373824 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.1440780447118915, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003537122239634605 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.21538085312440458, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00527177793605653 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3783352287326247, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004644197217937787 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.22741941196495352, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.004181213734611599 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.22513353909188877, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005531377737909901 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3875077488648253, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047015995940884545 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.23598364900790592, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0043592478927788475 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..50fff51d8589d104f8ced1dc134ceaa256c1d89c --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.0983375818863275, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0029053806058016835 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.12947888309750052, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0031473479280467198 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.09571267819389127, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022899105765691293 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.019660602529021045, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009095314106449951 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.02987435711226961, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012172920898615256 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.021249378039416924, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008023915053086402 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.07993490033371602, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0025495157441145547 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.10403034397768768, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002524536215776094 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.07569979604312303, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017489838355855545 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.09140255938348718, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0027879956998521685 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.11935909833374875, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002924586364247349 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.08804228557786513, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021147247236710737 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.3716396460310256, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.053237921475075736 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..71cb5007e8704ae6b4658a8e356e81e3b7d91bc4 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2744539537425681, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004094328235431946 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20170838774611544, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002762665652290496 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.19520859102820864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0023238276963889674 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.07934207376791574, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002463348090483984 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05161000248015028, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001498911556068985 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05109974611655904, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013693724913750134 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.21534515919762, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0033577432477576922 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.15642273279178595, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021832373243515003 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15103480090963925, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018026481462705155 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.25936704726034565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003901950893364067 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19051893854427063, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002613048263614744 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18411759086730042, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021842348386272325 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.1039054275536215, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10890100851738928 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..bad04f58590772badcc1b202f19ee8ad4385f0e5 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.3460381570015358, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004003344331842124 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23464288041344536, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027534125642066803 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.24085996898585788, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002327696120886891 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.11151199462195266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0026567771627046344 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06934611067556229, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001590260268305198 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.07281302072231448, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0015331223512556303 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.2720546258349463, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003358764729317707 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18272653217328982, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002227548532418399 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.18727237241373534, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001864663335169569 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.3279410319312666, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003860840910318087 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22156477723365048, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002619713558025792 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.22759593452074767, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022262933288697143 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 4.021085183806486, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10816463413951247 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..dffba1f8f8506734680cc639f4925bb031637ee4 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.29806862880783386, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004379212298416797 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.19523732178409814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0030541305702034035 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2013812252122371, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0026442870837295527 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0944687677366076, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002549028495799297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05859589734154174, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015957713051932727 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.060392462467898575, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0014617335431351905 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.23529644412419154, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0035766830650948893 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.15306469354602847, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0024463484798115413 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1575651913948673, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0020868868630608897 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.28262725801972627, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004215517896622171 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.18413938272093217, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0029006585330709185 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1901383608530664, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0025143987155999636 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.8492374969628904, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08750896589246163 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1f43052290bcb35626fd86c014b71faada4622af --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.09744191367423756, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0036149483966249 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.06351396221418004, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024571906285560316 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.06426126220521501, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022879021970431588 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030295987904196204, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0017243942607559877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.018491602504902276, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001060705507474276 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.018863111807267564, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009913845983569886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.07836036552522192, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0029649730324953685 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.050259543495048555, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019585266496901644 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.05089928957613344, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018155956397895659 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.09237908655494775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0034638908963912757 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.05946970338742905, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002300251520662075 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.060406863253473476, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002154837434813025 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.04222973749038275, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.008257164616079426 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b73441909af8c75b7bf4413b6e48b94041badb06 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.015305807829806464, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0016276583452807518 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.009349321645652907, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0010109706029017072 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.00953238699480448, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0009587457771524576 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.004958444950717817, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00078608095281603 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0026826988588868894, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0003968858121931347 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0028143315500782783, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00039639159831938314 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.01243346272156789, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013729751550239605 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.0073466093897751935, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0007905623261997666 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007529872183034152, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0007598887929454067 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.014878898488927081, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0015914308498318637 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.008983079259713787, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0009667267066960596 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.009188390133961012, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0009205800070516369 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.846919172678707e-16, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.0413111014482104e-15 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ed654007fa372058becb54da4e0b50a65337f160 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 8.198586697938474, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.054371247913430655 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4231953254379122, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0056811184198751995 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41981351300313063, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.004043734085642848 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3022704849875045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020893712232562985 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3051389569292783, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.006594915459228414 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20265608384266906, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002503934686098032 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14423544971256652, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014159696060948752 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3836380762491933, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.005946261746966947 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3484722408438825, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0033554610252052412 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2534973577384106, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001628749077015259 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3962431609974829, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.005875394355670361 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3703437525515446, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.003620950376631745 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.26893260867745544, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018533435510961985 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..57a6e607e8f9c3ee25d022beb7638a667f046911 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.954988812929066, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14638391482320653 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5311859863746525, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031772485874862837 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43624994053743726, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030327438873743837 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4537564177673297, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023632144199618754 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24897172805854162, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002559248595927766 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20337318700614485, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022235996604563096 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21085921681195505, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020229136192088815 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.38733665631563075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002821853296737016 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.315877576992612, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024697936355976423 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.32899874690483255, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002049880594632269 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4347157576529157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030856903887374197 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35598940596786033, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002795354387124902 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.37054424699208366, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002335750021395727 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a620f4805a727e6c15c5003b60981c34a98ff0cc --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.73609934719948, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1706582991235465 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5680092384554517, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031495723548982087 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4759328537809361, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029386091005988964 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.49441630977548484, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022862001339864647 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.28544083962132866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026946059983280406 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23719216451336508, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023245662185703573 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24603831528858075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021292376417195715 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.42134005366112265, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002909446351508468 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3512428781930749, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002532983060440299 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3653029314145531, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002146107896814678 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.475872210666167, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031333580177863346 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3981455953816073, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002824532725234551 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.41379888832533746, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00237786243846331 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c9e126da73f77b277f643966453e6eb83b66d8f4 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.048354827099848, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13173575451352945 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5658695177334656, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031270966615477226 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4772433101176052, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002917359278396573 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4953189142141289, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002271954969288382 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2857562961388842, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002592704630991091 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2406640346417443, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023517367710014212 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24880756415774488, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021197041292271416 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.420758211599137, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002882465972530548 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.353211891202741, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025199808294822496 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3670423199742575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021430589574260245 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4741438305573669, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003065753471768471 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3999905903170581, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028010787672272464 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.41508607573173817, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023504639188504377 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..19ce921a7dc11f4c1ab57a19adced0ab1af8f80d --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.659789068321356, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09790592578075817 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5629082237331698, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031003560888099003 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48698263732189806, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.00287742331110304 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5009803259010409, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022733438320721978 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2853458371364896, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026072609808903465 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24654716022968468, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023658238343093408 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.25262951809146383, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002143658780301566 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.41748637464334715, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028245699760167772 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.360690044589161, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002543868919808212 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3707998453692219, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002141988029007844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.47279540233959655, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030412213049662708 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4099044454840407, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028278158640341732 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42113638543719284, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023735545802868797 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c712894227d546d6ff22ebbbe4fd3d57581e2d7d --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.823188838317058, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1368685740129237 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5616100796950558, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031091108469005055 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4850202390045189, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028303944848881626 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5006752815479694, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002293153386217313 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2862382834902288, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026324353670205162 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24621876290655678, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023348256981223997 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.253549804289564, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002160468600623493 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.42006777923537075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002838373199736789 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36307186033383765, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025521298014791567 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3742926890886437, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002195861570391623 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4750750508873225, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003062574123520972 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4112165114016575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002792171967020979 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42403643962685617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024063554475022685 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d92d7c697fc8afdaccb9dae70a5637741bf276f8 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.119120787601094, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0023903339190153865 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2461239647280435, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004464088909716045 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15265221672321955, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026395478481095695 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.021414744477178442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009940965797788914 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.049032580222604115, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0023171129192253166 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.02898750523181668, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013247193132835207 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09592721076197161, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0019579324417703724 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.1978355142295738, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035176799456197697 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12235254548597051, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002020584245155245 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09716298214503066, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002022535774203556 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20129878308057195, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037572922765230963 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12420575571774427, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021512334045276564 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.171269553073038, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08153430802540716 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..57423c712746ecbebb5dd8ec6a72e36ac07f6aa0 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10224744795994899, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0019764379774743278 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.23590822077779397, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004177064380964356 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.13902284366105663, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024556497954162514 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.016207513348042157, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008615781781451241 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03905160442337228, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0020375288076235304 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.02231228910998861, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011471564552570346 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08236658742598567, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015445410531161362 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19134487295792035, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003380183880201007 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11213145719440366, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019182613072779942 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08052607097380447, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015434958084231858 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.18734245397230653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003385262789984471 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.10976827761223337, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019415142922813897 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.9048271934902518, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06835860071628046 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6d4636906f2ed4fcd9dca829c53446525c459982 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.22173311440321666, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004109442469093336 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.24407066905873215, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0039449863279907875 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2179588836123356, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0033902392785234987 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0489853613709537, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0024629201330116494 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05128610907736208, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002273587180471874 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04679084112223886, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0021370388355844076 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.16718537084915933, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003201387426185195 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.183772543674527, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0030394228586101703 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16402350220086148, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0026122531049125497 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.16900869672693924, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0031978995143340755 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.18767663761745132, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031822595104393585 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1663715483433569, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0026310551428506287 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.314221689423562, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.17638598922785836 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9dd7ef8182d1213945713545db52af58daefb437 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2337627371131494, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004249737953653732 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.22725208941553016, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004010986661230982 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2197892591864117, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003666804932828543 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.05339111111134872, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0024509143835275216 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.049825868827123865, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0022675300569590423 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04903344742670968, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0021800365971211236 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.17463575759203218, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003402527377508609 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.1692107411887922, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031370692854018833 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16380342910756276, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002909510596814998 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.17650859372044322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003403724174446378 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.17225092039068918, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032378857630900775 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16595773590679566, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002927988954487852 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.754436883607044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.168222551241106 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..63df56be4867e2fbcb07a27bc9d6a32d2138bbd9 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0672089280846886, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004365308186585058 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.052674217830646665, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003299030898118782 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.053733463265401994, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003263549332918562 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.014382600033410985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0014988508353396943 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.011774586389019105, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0012243332638704686 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.012165431481051413, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012546534160519155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.052955195940592614, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003709170208574461 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.03946016910084321, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002530795032801481 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.04075928712930905, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002550780700931808 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.05345610024362179, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0037197148122439573 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04019695133532339, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0025782928954495906 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.04131811744935463, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0025725346112910707 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.08668412486361368, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.021081432536932964 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.json b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5fbaa1e704ca4ddcd46cefed088e64d5d67edea6 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/generation/slim.4b284boscarperplexity25_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-perplexity/4b284boscarperplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_0.csv b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..a272584546a42bbd8dc22f15b0e7c6062aed9c22 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.322,0.014782913600996676,0 +anli_r2,acc,0.331,0.014888272588203936,0 +anli_r3,acc,0.35583333333333333,0.01382651874849331,0 +arc_challenge,acc,0.27303754266211605,0.013019332762635748,0 +arc_challenge,acc_norm,0.29692832764505117,0.013352025976725222,0 +arc_easy,acc,0.6300505050505051,0.009906656266021156,0 +arc_easy,acc_norm,0.5631313131313131,0.0101776729281577,0 +boolq,acc,0.6241590214067279,0.008471147248160114,1 +cb,acc,0.30357142857142855,0.06199938655510754,1 +cb,f1,0.18214654282765738,,1 +copa,acc,0.74,0.044084400227680794,0 +hellaswag,acc,0.42471619199362676,0.004932896472460568,0 +hellaswag,acc_norm,0.5381398127862975,0.004975243508752003,0 +piqa,acc,0.720892274211099,0.010465657948498228,0 +piqa,acc_norm,0.7170837867247007,0.010508949177489676,0 +rte,acc,0.5379061371841155,0.030009848912529117,0 +sciq,acc,0.844,0.01148023500612235,0 +sciq,acc_norm,0.775,0.013211720158614751,0 +storycloze_2016,acc,0.6953500801710315,0.010643426988646796,0 +winogrande,acc,0.5706393054459353,0.013911537499969165,0 diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_0.json b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_0.json new file mode 100644 index 0000000000000000000000000000000000000000..452406116f499a563b116cfe4e7c1f1564b12819 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.322, + "acc_stderr": 0.014782913600996676 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.014888272588203936 + }, + "anli_r3": { + "acc": 0.35583333333333333, + "acc_stderr": 0.01382651874849331 + }, + "cb": { + "acc": 0.30357142857142855, + "acc_stderr": 0.06199938655510754, + "f1": 0.18214654282765738 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.42471619199362676, + "acc_stderr": 0.004932896472460568, + "acc_norm": 0.5381398127862975, + "acc_norm_stderr": 0.004975243508752003 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529117 + }, + "winogrande": { + "acc": 0.5706393054459353, + "acc_stderr": 0.013911537499969165 + }, + "storycloze_2016": { + "acc": 0.6953500801710315, + "acc_stderr": 0.010643426988646796 + }, + "boolq": { + "acc": 0.6241590214067279, + "acc_stderr": 0.008471147248160114 + }, + "arc_easy": { + "acc": 0.6300505050505051, + "acc_stderr": 0.009906656266021156, + "acc_norm": 0.5631313131313131, + "acc_norm_stderr": 0.0101776729281577 + }, + "arc_challenge": { + "acc": 0.27303754266211605, + "acc_stderr": 0.013019332762635748, + "acc_norm": 0.29692832764505117, + "acc_norm_stderr": 0.013352025976725222 + }, + "sciq": { + "acc": 0.844, + "acc_stderr": 0.01148023500612235, + "acc_norm": 0.775, + "acc_norm_stderr": 0.013211720158614751 + }, + "piqa": { + "acc": 0.720892274211099, + "acc_stderr": 0.010465657948498228, + "acc_norm": 0.7170837867247007, + "acc_norm_stderr": 0.010508949177489676 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_1.csv b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..1bcefe33ee1aa8fc49432e0022ee0c69cd415a52 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.305,0.014566646394664378,0 +anli_r2,acc,0.327,0.01484221315341124,0 +anli_r3,acc,0.36916666666666664,0.013936668349285275,0 +arc_challenge,acc,0.29266211604095566,0.013295916103619411,0 +arc_challenge,acc_norm,0.3199658703071672,0.013631345807016195,0 +arc_easy,acc,0.6321548821548821,0.00989492346445519,0 +arc_easy,acc_norm,0.6140572390572391,0.009989277329503953,0 +boolq,acc,0.6137614678899083,0.008515695986533813,1 +cb,acc,0.4107142857142857,0.06633634150359541,1 +cb,f1,0.2858641489640703,,1 +copa,acc,0.74,0.04408440022768077,0 +hellaswag,acc,0.4231228838876718,0.004930448527146667,0 +hellaswag,acc_norm,0.5464050985859391,0.004968244611429394,0 +piqa,acc,0.7257889009793254,0.01040861866493338,0 +piqa,acc_norm,0.7181719260065288,0.01049667523125815,0 +rte,acc,0.5379061371841155,0.030009848912529113,0 +sciq,acc,0.9,0.009491579957525061,0 +sciq,acc_norm,0.891,0.009859828407037186,0 +storycloze_2016,acc,0.6932121859967931,0.01066427519047363,0 +winogrande,acc,0.5730071033938438,0.013901878072575055,0 diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_1.json b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fdc0e1aca58800c96e0a54205b8658de26e56fcc --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.305, + "acc_stderr": 0.014566646394664378 + }, + "anli_r2": { + "acc": 0.327, + "acc_stderr": 0.01484221315341124 + }, + "anli_r3": { + "acc": 0.36916666666666664, + "acc_stderr": 0.013936668349285275 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.2858641489640703 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768077 + }, + "hellaswag": { + "acc": 0.4231228838876718, + "acc_stderr": 0.004930448527146667, + "acc_norm": 0.5464050985859391, + "acc_norm_stderr": 0.004968244611429394 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529113 + }, + "winogrande": { + "acc": 0.5730071033938438, + "acc_stderr": 0.013901878072575055 + }, + "storycloze_2016": { + "acc": 0.6932121859967931, + "acc_stderr": 0.01066427519047363 + }, + "boolq": { + "acc": 0.6137614678899083, + "acc_stderr": 0.008515695986533813 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.00989492346445519, + "acc_norm": 0.6140572390572391, + "acc_norm_stderr": 0.009989277329503953 + }, + "arc_challenge": { + "acc": 0.29266211604095566, + "acc_stderr": 0.013295916103619411, + "acc_norm": 0.3199658703071672, + "acc_norm_stderr": 0.013631345807016195 + }, + "sciq": { + "acc": 0.9, + "acc_stderr": 0.009491579957525061, + "acc_norm": 0.891, + "acc_norm_stderr": 0.009859828407037186 + }, + "piqa": { + "acc": 0.7257889009793254, + "acc_stderr": 0.01040861866493338, + "acc_norm": 0.7181719260065288, + "acc_norm_stderr": 0.01049667523125815 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_2.csv b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..ceb96ce42b8a48ff6717ffbfda010927d1256539 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.335,0.01493311749093257,0 +anli_r2,acc,0.335,0.014933117490932573,0 +anli_r3,acc,0.32666666666666666,0.013544340907003663,0 +arc_challenge,acc,0.30631399317406144,0.013470584417276513,0 +arc_challenge,acc_norm,0.33276450511945393,0.013769863046192309,0 +arc_easy,acc,0.6401515151515151,0.009848484848484844,0 +arc_easy,acc_norm,0.627104377104377,0.009922743197129243,0 +boolq,acc,0.6110091743119266,0.008526800159503209,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.24071773636991026,,1 +copa,acc,0.73,0.044619604333847394,0 +hellaswag,acc,0.4237203744274049,0.0049313726571297975,0 +hellaswag,acc_norm,0.5493925512846046,0.004965375341643137,0 +piqa,acc,0.7187159956474428,0.010490509832327423,0 +piqa,acc_norm,0.720892274211099,0.010465657948498228,0 +rte,acc,0.5018050541516246,0.030096267148976626,0 +sciq,acc,0.91,0.009054390204866439,0 +sciq,acc_norm,0.907,0.009188875634996698,0 +storycloze_2016,acc,0.7012292891501871,0.010584692134739974,0 +winogrande,acc,0.580110497237569,0.013870943986310391,0 diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_2.json b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_2.json new file mode 100644 index 0000000000000000000000000000000000000000..bcfdd9af3491db5a2422558171b5e456e9375dc2 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.01493311749093257 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r3": { + "acc": 0.32666666666666666, + "acc_stderr": 0.013544340907003663 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.24071773636991026 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.4237203744274049, + "acc_stderr": 0.0049313726571297975, + "acc_norm": 0.5493925512846046, + "acc_norm_stderr": 0.004965375341643137 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.580110497237569, + "acc_stderr": 0.013870943986310391 + }, + "storycloze_2016": { + "acc": 0.7012292891501871, + "acc_stderr": 0.010584692134739974 + }, + "boolq": { + "acc": 0.6110091743119266, + "acc_stderr": 0.008526800159503209 + }, + "arc_easy": { + "acc": 0.6401515151515151, + "acc_stderr": 0.009848484848484844, + "acc_norm": 0.627104377104377, + "acc_norm_stderr": 0.009922743197129243 + }, + "arc_challenge": { + "acc": 0.30631399317406144, + "acc_stderr": 0.013470584417276513, + "acc_norm": 0.33276450511945393, + "acc_norm_stderr": 0.013769863046192309 + }, + "sciq": { + "acc": 0.91, + "acc_stderr": 0.009054390204866439, + "acc_norm": 0.907, + "acc_norm_stderr": 0.009188875634996698 + }, + "piqa": { + "acc": 0.7187159956474428, + "acc_stderr": 0.010490509832327423, + "acc_norm": 0.720892274211099, + "acc_norm_stderr": 0.010465657948498228 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_3.csv b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..b3c1a87b5403522261009a91ada3ff84955bd963 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.316,0.014709193056057128,0 +anli_r2,acc,0.357,0.015158521721486778,0 +anli_r3,acc,0.3416666666666667,0.013696658778002514,0 +arc_challenge,acc,0.3054607508532423,0.0134600804780025,0 +arc_challenge,acc_norm,0.3174061433447099,0.01360223908803817,0 +arc_easy,acc,0.6388888888888888,0.00985601342581124,0 +arc_easy,acc_norm,0.640993265993266,0.009843424713072176,0 +boolq,acc,0.5981651376146789,0.008574857171671129,1 +cb,acc,0.5714285714285714,0.06672848092813058,1 +cb,f1,0.3727155727155727,,1 +copa,acc,0.72,0.045126085985421276,0 +hellaswag,acc,0.42730531766580365,0.004936762568217079,0 +hellaswag,acc_norm,0.5487950607448715,0.004965963647210311,0 +piqa,acc,0.7241566920565833,0.010427805502729115,0 +piqa,acc_norm,0.7230685527747551,0.010440499969334558,0 +rte,acc,0.5595667870036101,0.02988212336311872,0 +sciq,acc,0.91,0.009054390204866442,0 +sciq,acc_norm,0.906,0.009233052000787738,0 +storycloze_2016,acc,0.7081774452164618,0.010512588616199638,0 +winogrande,acc,0.5627466456195738,0.013941393310695922,0 diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_3.json b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_3.json new file mode 100644 index 0000000000000000000000000000000000000000..028037da08067c2a615f378876df212e876d6f09 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.316, + "acc_stderr": 0.014709193056057128 + }, + "anli_r2": { + "acc": 0.357, + "acc_stderr": 0.015158521721486778 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002514 + }, + "cb": { + "acc": 0.5714285714285714, + "acc_stderr": 0.06672848092813058, + "f1": 0.3727155727155727 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.045126085985421276 + }, + "hellaswag": { + "acc": 0.42730531766580365, + "acc_stderr": 0.004936762568217079, + "acc_norm": 0.5487950607448715, + "acc_norm_stderr": 0.004965963647210311 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.02988212336311872 + }, + "winogrande": { + "acc": 0.5627466456195738, + "acc_stderr": 0.013941393310695922 + }, + "storycloze_2016": { + "acc": 0.7081774452164618, + "acc_stderr": 0.010512588616199638 + }, + "boolq": { + "acc": 0.5981651376146789, + "acc_stderr": 0.008574857171671129 + }, + "arc_easy": { + "acc": 0.6388888888888888, + "acc_stderr": 0.00985601342581124, + "acc_norm": 0.640993265993266, + "acc_norm_stderr": 0.009843424713072176 + }, + "arc_challenge": { + "acc": 0.3054607508532423, + "acc_stderr": 0.0134600804780025, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.91, + "acc_stderr": 0.009054390204866442, + "acc_norm": 0.906, + "acc_norm_stderr": 0.009233052000787738 + }, + "piqa": { + "acc": 0.7241566920565833, + "acc_stderr": 0.010427805502729115, + "acc_norm": 0.7230685527747551, + "acc_norm_stderr": 0.010440499969334558 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_4.csv b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..ee01ed251e25470171326cacb218bf90beeba66e --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.314,0.014683991951087967,0 +anli_r2,acc,0.334,0.014922019523732967,0 +anli_r3,acc,0.3458333333333333,0.013736245342311012,0 +arc_challenge,acc,0.30204778156996587,0.013417519144716426,0 +arc_challenge,acc_norm,0.3267918088737201,0.013706665975587333,0 +arc_easy,acc,0.6456228956228957,0.009815004030251743,0 +arc_easy,acc_norm,0.6473063973063973,0.009804420599378659,0 +boolq,acc,0.6131498470948012,0.008518188340844744,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.31417624521072796,,1 +copa,acc,0.79,0.040936018074033256,0 +hellaswag,acc,0.4235212109141605,0.004931065434173686,0 +hellaswag,acc_norm,0.5517825134435371,0.004962949784236048,0 +piqa,acc,0.719260065288357,0.010484325438311827,0 +piqa,acc_norm,0.7181719260065288,0.010496675231258152,0 +rte,acc,0.516245487364621,0.030080573208738064,0 +sciq,acc,0.913,0.00891686663074593,0 +sciq,acc_norm,0.903,0.00936368937324811,0 +storycloze_2016,acc,0.7113842864778194,0.01047831178564294,0 +winogrande,acc,0.5706393054459353,0.013911537499969163,0 diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_4.json b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_4.json new file mode 100644 index 0000000000000000000000000000000000000000..cb64774d68b51a8c5766129aff88509c376054c9 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087967 + }, + "anli_r2": { + "acc": 0.334, + "acc_stderr": 0.014922019523732967 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.31417624521072796 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4235212109141605, + "acc_stderr": 0.004931065434173686, + "acc_norm": 0.5517825134435371, + "acc_norm_stderr": 0.004962949784236048 + }, + "rte": { + "acc": 0.516245487364621, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5706393054459353, + "acc_stderr": 0.013911537499969163 + }, + "storycloze_2016": { + "acc": 0.7113842864778194, + "acc_stderr": 0.01047831178564294 + }, + "boolq": { + "acc": 0.6131498470948012, + "acc_stderr": 0.008518188340844744 + }, + "arc_easy": { + "acc": 0.6456228956228957, + "acc_stderr": 0.009815004030251743, + "acc_norm": 0.6473063973063973, + "acc_norm_stderr": 0.009804420599378659 + }, + "arc_challenge": { + "acc": 0.30204778156996587, + "acc_stderr": 0.013417519144716426, + "acc_norm": 0.3267918088737201, + "acc_norm_stderr": 0.013706665975587333 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.00891686663074593, + "acc_norm": 0.903, + "acc_norm_stderr": 0.00936368937324811 + }, + "piqa": { + "acc": 0.719260065288357, + "acc_stderr": 0.010484325438311827, + "acc_norm": 0.7181719260065288, + "acc_norm_stderr": 0.010496675231258152 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_5.csv b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..b527cd6dde9dbb218f61d96a535c7fc1a0a8b4d1 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.32,0.014758652303574874,0 +anli_r2,acc,0.343,0.015019206922356951,0 +anli_r3,acc,0.3433333333333333,0.01371263383046586,0 +arc_challenge,acc,0.3037542662116041,0.013438909184778748,0 +arc_challenge,acc_norm,0.3225255972696246,0.013659980894277373,0 +arc_easy,acc,0.6452020202020202,0.009817629113069696,0 +arc_easy,acc_norm,0.6414141414141414,0.009840882301225297,0 +boolq,acc,0.6064220183486239,0.008544672418486905,1 +cb,acc,0.5892857142857143,0.06633634150359538,1 +cb,f1,0.3851732473811442,,1 +copa,acc,0.76,0.04292346959909283,0 +hellaswag,acc,0.4277036446922924,0.004937345081868091,0 +hellaswag,acc_norm,0.5569607647878908,0.004957296691391567,0 +piqa,acc,0.7225244831338411,0.010446818281039947,0 +piqa,acc_norm,0.7143634385201306,0.010539303948661913,0 +rte,acc,0.555956678700361,0.029907396333795983,0 +sciq,acc,0.916,0.008776162089491118,0 +sciq,acc_norm,0.915,0.008823426366942312,0 +storycloze_2016,acc,0.7017637626937466,0.01057924979557881,0 +winogrande,acc,0.5864246250986582,0.013840971763195306,0 diff --git a/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_5.json b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_5.json new file mode 100644 index 0000000000000000000000000000000000000000..15aef2fe9d8b81c8eef31e94fc61debfa9bcd976 --- /dev/null +++ b/4b284boscarperplexity25/evaluation/rankeval/4b284boscarperplexity25_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574874 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.5892857142857143, + "acc_stderr": 0.06633634150359538, + "f1": 0.3851732473811442 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4277036446922924, + "acc_stderr": 0.004937345081868091, + "acc_norm": 0.5569607647878908, + "acc_norm_stderr": 0.004957296691391567 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795983 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195306 + }, + "storycloze_2016": { + "acc": 0.7017637626937466, + "acc_stderr": 0.01057924979557881 + }, + "boolq": { + "acc": 0.6064220183486239, + "acc_stderr": 0.008544672418486905 + }, + "arc_easy": { + "acc": 0.6452020202020202, + "acc_stderr": 0.009817629113069696, + "acc_norm": 0.6414141414141414, + "acc_norm_stderr": 0.009840882301225297 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.013438909184778748, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.013659980894277373 + }, + "sciq": { + "acc": 0.916, + "acc_stderr": 0.008776162089491118, + "acc_norm": 0.915, + "acc_norm_stderr": 0.008823426366942312 + }, + "piqa": { + "acc": 0.7225244831338411, + "acc_stderr": 0.010446818281039947, + "acc_norm": 0.7143634385201306, + "acc_norm_stderr": 0.010539303948661913 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2132dfd6660e39065f61037cfc062c82a362bfc7 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edcd545ff247cad19b0b15507f894582e0ae768418f6adbf73a58731f837af83 +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..471d39a1c85ce2951b9f37b5946d7b1d0023375d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbf2b381aa266fcf9a800f1f120efd831fb8fd65b4056408da0da394325f5b4 +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c19cb584b303c467a021a78338c9259ea545440 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30280bdb23493814716d831b5005951d98ea1ba387627eb9cf9562dec9ee61ba +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..911f49c4fdf4df20dc870d89866a1b8a25f04485 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cb64373b1634bd3548f336824c90c2a9b22a62114c64843fd3b1ea7219d772 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc6fd201657cb987afc74e8d8c970ed5dfa14af --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45f62376265e21a9dc7ff50a4f8c3138fcf083cabe2b10dc6643d656ada1c87c +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f7686a3af82b3f46a1af89aae0b5286b57a833 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f87f49b77b6a5c9f053b95f3e97a36db5b2974b1203d35f1ee8a20c32a7f6a +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a7cd989af059ed38a7c71aaed1b1943fcc9f9aa --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71478aa545b4877306096eb9372c644f77d1809e93e97359d83586edb1541b7 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e066ef79f7af7b233f0293995344e2560eeceead --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59551d4725ddbf76cf82e26642d76b0bcbccd4af40991258845f9c41401bf26c +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4480196a3bac6c62207e097560dcd4acf358546 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af59f70531804d25494d6a9024ec6151a36515cc72f734551be980900611d3bc +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54e9e9f24d891b7dac4d806418db8d215399bef9 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3560d12903c50bc8665b6c7d1c69fd7a00a1aac359cb47e769fc17c2598d4ac4 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28729452771a491726b1db618e2d4046b1239ea4 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6facab8cd62784356c2c9a5c5e3304360600f93453e54f7b38ced0109b6740 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ae32274ae5cc818f32ab513d572a28839576b95 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2612d5af54a44f45cccd440e485b3d9b3ccf2478525bf41a0f8e7813a4f13a2f +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c42a8c0969921ef2ccd753dd789d415c9f7875a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53340249eab87bce51960ed3e017d42a9a45f800852a05c05fff4a2ce9b4c98b +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b43cce3abe83d120b1437945d4fd7a0406567f8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d66bfac3caf4e9fe75a0961e075f739f52475e3c86c19bafe40fa83106df8dc7 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc899c9bb9ad383ffbc3939aeba216a95ac9268 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f603671918ce09750088b75376fa700ce5a37b55d4ef456523d65442704282e8 +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6307f42c52690811db65961abe0741f57707c01a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c1fd662e4fd4b4e06ed1094517019c7e66793d3ba763dcee6437c27d8340531 +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24ed3a6bcb699e5a547ad00b16771f2d89adebad --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d283be10ba7c1fa7871b398570ddd0c34520c777c8dd5d005706305c7138280 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b003bd288e06b95d167abc6c38968781d45b8da --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d96692333858758740b86bce6667df7271dc21f57fc0d0c26cc9bf60f4651c +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57f33f49397ca96820346ee164c339f7ee2784e4 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8863827012559a8c4a24dcbbc58f5e8337e8f54ce6be2c702ad0900e497dd1ed +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..138f04be118dd97104c0fa5001fdf8c092ca42f2 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cedb584fbb0870904c6fb61db5005724c5ca977b0b0dd8a2b100a3a47903cc4 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16da2c394a5531082d0a0894824e7aa0b7fc827c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00ab47f8cb714cc953e2f6c2ac3f890b20fbd62d28ec8f7fee4db3e68e5e56a4 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8886ce621ada18a6798c8c1a3aae32775816b6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:897846d8b29253e978d299d33e55b7cfa7aca492b5d4c31b27634f8254f1327e +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4dcaf854249fafeb21cb0ef749a270e7f98c4fa --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c5de90bf72c9977cb8a46923c972c350a920cffa5a3f373dd41d0c4942d22a +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0d01cabca6c57e3b10198cfca7e6fa886cd889c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86e06df5a403a05ea2eb92a5c643968f229b27d2d851a9269c984c979ec75ae7 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c3f92df3b969bd5a50740f70f4f5728679c9dd --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4441359837cd21e3117f0ac98f1ef2b58185f2f92d05e89685f6fb35d6bd2db +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecb7b03c18c2cc10f0aba37c0f8b3757c50f566c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43391c155c1029aaf5c3918317e4d0177ffa5315e9dc92eb20582a8ff30ce2e2 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6538acf065bf087220a26b662413086b9efe103 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f7bcb24883eecb8f23fbe59a735d7508cd0e7236f3816df900e5a5f72e31d2 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6bd218053a2d028273f3b586888967c4415c69b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d8b6c0f353a46ceff65c1bce34e9ecdbf70e6765297d6110062b8a0be19da8 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acc2eb62fa56cb705c1ed1aacb2fb69a1e28b65e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68bee5af484559384dbbb285831d77b7dd3ceeaa145bed5c49689a4218f30075 +size 199058605 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cbff7039b6c9ba8d5eaaa92e327762fb83baa78 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59f18970785fb1351451c6f11b3aecd87f94857cdd6239cfebd087314001009 +size 199058605 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03e801e4b578aad7841b2148883a4b69f672af12 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:699a1719bf36a10b7b90fb5813b927714dccf8fcecf744c1b9bf32a73d03a321 +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3f0c5a75d0bd1677f2742bc78c5907555f604b0 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358c84bf488ba827f0e0370491772a1723beb5654f1fa5b78df2941a90e1355b +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7025b3c5c16b5f5941a0642d36bb6935f95f7693 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b86deadb77897d2660f4b4d1a595f00235dc34f475fca9ed3fe23a130822f834 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fecb8e8a1a9073c62faa9937fabf3909614552d7 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0fe5f3b68928733411d88320775d820bd8127ba72daa731ff0323f69f958ad0 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f20b7e0592cecd33666a339984d0d2972b9e4fa --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78e7133828223167e8a1629869c03984000a79f0f9d1e6b93d6c71d2764ba72 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07be2f303349af0de11f7c54bbfa6ad34d9fc6a8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40dbc2225706db569ee98facffe00b7218fafac9f102f4fa7630bf13f4a9125 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbfbbe7d3de7b4a41f09ceeb8d5502f45d6ab7c7 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47820dcd00a0f1f1e3d8f1cd877fc59f614249f25ec481c68a40cc7027fc5e56 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb49ba09a82fba5d0122a29cc192bd0c49237715 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:407b61c771732fe2e25faa7674852377ef1dc295c7d67a46afd2a7406d0b6fc2 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da5ee34cd990ed169455136cc0c236c5d6d64e2f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85e8f9b98affda4ffb71ff56d57363864d2341f4e1ae9f9efe15a11bd9aa3ef9 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89798b57738c5bde4412d941b541ab9f5361db1e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da706c27eb5a820d7d9926af3f661f9d860b7f3fbd7c23bfd229c374c42209b2 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9eb28052cc6834cc249e9cb9762ef370a17b68e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525be26b912a35f105d109efeb4aa0da236f700d9bca398adca5c9d099a04198 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caa856d24c73158b9c9c06005fad054a1b955c86 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e6adbab7f1df692f07dfbcf3f7b67570af24fe62e34035087a650e668c646af +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9521283726694b2dd61988ca042b82afe1d8b6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efac47838b6f480b84addcad63ba92d1bf0d3ef28ec1fbf1355980907c06d87e +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bca2259ef75790926e9ed204e0e271184e75d97 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb6076f35f6c0624eb78321ca78caba3c3f49f00479feb6a2f158a8e36e29f57 +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82373eaf63b7c90b4d078a99ad9d5cda7972d675 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bab71bec5313c4a3e527e60225a3a4ca7202dd85dd694940e63c96d44fed7a3 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09704f08a931eb940239de2fdfb502be16b97672 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51229db8c59143355388dd24f908b2e7b9b76982e2363d85724c9c9546e0a6e9 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e64d44b33f42c0406d8a9c38c51865f060bc36c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d32a4f0ceeacba4539a854e6bdfc4597c0198f9de75b259b1d3a1283fb5c2f5 +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..651527fbd06dd4eb4a6cc409c61581fce3b8c88e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:184cb569b945cbdca32b924a17192047cec49e232f12f2a12c9d992e16b0a7ea +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3774355fb18d0ac5547d62726d5a19231aaf2c35 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c80042dcab1b3e323c51482ec135c8760f6b9f090e90d6952f5a959909922fee +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10bed328e48407c1e837b96651ba7aac3f896ad --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cc36490dabb816436b06c512d59f861997bf8fa0d6c75bf8183a97209c7cf69 +size 199058797 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ac63bbffda8ecce930cf866369ff6836cdf9acc --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dedf03d40f0b98ab6a038a28f460ac2ce97bfa961eca4e9c1be832c42cebb77 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..751e5927fae135582f4c1d219f6d0918750a2957 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2565e5e3d31b30a388774acb0b7b6cfe22df26cb659310753480f9717689b5de +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69159f3f868f35dc5b44bc6fe3680ed6c37f53e6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23a18d1a9f5975fbf424df1941611a429975faefafe67d7d205f6002d794fe10 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21de25b88ab08b909912511bbc9b1a4af66c5f01 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98bf54f97fd06d269ddba5f43e5fa4b9344516b14d906f176e5b9d4a4d5c9605 +size 199058733 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..209997c9f9284690b19ea05d6f8f79cfa0c835dd --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:810a844f05961e2a95ea6910a91ff0f36afe3c04fccaabc4123459db07519d43 +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..338b48761e9d426b9e2e801365dd067dfc93f922 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c5fb3b77f16474624a8493aede024b2432ca4fc4411eed3e1089974ec02717c +size 199058669 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e84d968cd8c9243e77dd2e84ccbc5f2334379cab --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1630068ff0e31fc5739a7ad83fd7b863c298e8711f355272955fae3a1f8cbc +size 199058925 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18d103906b722368a0cab3b7e4a598bc23cb6c4b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e29e8b6e80a07e57b4f772666f580bb515f779fd0f12835fd4c6641ca637eac +size 199058925 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dfa8e53536e190be43caf16e5eebc5ea540274b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb24609b56fc1a300b7ec1a81e7446d23e0761f6ded46d800970381571109588 +size 199058605 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87934fcd3e2d284e8382c228ef3d7a6a08771aa1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889ed3d7ca30230593207a2992f3d20756bb695190d3717bfad57ba169a5c9e1 +size 199058605 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cf13df3a8c2b17540ffc6e873a6609bf79e9608 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f246ab9a5f92770c7646414219748b3a31eb1925b9e4464ad25eef0b2129b84c +size 199058605 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4594739a9aa9b64966189969cd97e0019088d938 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a234a9ba367bf557481556150495c9c2a55a4632a61e63e855b73dc8c73cea5 +size 199058605 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33d77412293cb786915a65533df4e071e400b0e1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52ceac881cb2adbf15457f90089657adf4edeba9e83305826cb53c4dbbca700 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c5b30ec4f782741de6145d6311294e8a0820c31 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cfd99b97cfb891c3875ff9bb2d4f9080097074902bf2a9e7da9ce0ac9e4ec97 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..997090c750804a9a44476d08de01cadc369e343c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9717d9b040600580b566f418548a0286584dd688399e3c49f97221c5330ced4 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d368bbf10f7a9ffada190bfaa5f1ebc42ccede90 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e297868fc3ac4375dc7c8fbb1188654dd5a72dadc5b91610435e41abdf108cdc +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3ef2e4f156354301138fd0bbe165fc00060b683 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8adbf13e028d94c369093ea75f622fbe78024dc1eccc5e25895d52807b89134 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9715023629bdf480747f1df5941be516cd2406 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925907e746fcc6599a406d3fa9306a016c15138313f896dbcc249cf84a3a960b +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76f79e23af6755f19396aa30a78ccb1ef8f2155e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1f741c7f3da998db0afd1daa40b720936e6ea4bd9af84b2b12ab2fcc935cd76 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b3c569385076fdf503899e0dfe3505bcfe33b1a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978332b21cfa5cbfec7bcbb1085d550a9ead55674d64f6e1731696ab04443f82 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc76558def3f68c063b3d414bf5e0109504799df --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd33147cf2fd951181275350ccf519eac9dba2a0d49f550c1505ee6c6b0dc5dc +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72ba5fcff1aa30feb5e215a6628d8f362ac5cf03 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a004526e9a406d6b792a1e2fb31a032497f7e6e2459d8d4273f7cea5ddadf90 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc28b8c3f38b3b95e5a042467ec95f2f81ef709 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ded2af240b98762691b5a99994632e77fb8336f96cd674341c36a0b7391797 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c3933577a0af907f906b4c8d78d295778f1e766 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f1a862dd1421af01a7718f8a181088faffefe300af7dfb0c80b3a3bf59c057 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c540a22022856d0898df196e1312a6dab2b10ac --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1d43c2e53546edc437a41678519840a0989e25f3c7d3b2f93693b46902fc45 +size 199058978 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab8aed549c04aafbbbd3a60b9ddc6f7b2a0fd30 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:242e25694ebf136f301844a789c52fa2ff7ba95e2413e13647855e8ae2b13447 +size 199058978 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b82f649d605d123265cd2ec71614ad30a6391d46 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e72e559593e9c992176fad8a0b4ccd8c11504fab95a1a855a70508fbbd64e6f +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12a9de96ce6ac66d97996f0a762a4e91a3d685d8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cc864eed1f5d3664dc26e853d6b8be683dba5f0168addb133353b21cda37176 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28e49e2de002d6e94e7607dd1f5d7c65c46f6c01 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eeaebf79627002a195a4067f2c24702b1b3ed8d47388666cdd90b7b790d0021 +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdd547692c52eee3e69f5379d5168cbfb1e0c2c3 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6543649fc1066e3fef54a8b9d0e81a2257c780b6ea0d951a7cd4072d0d7b78df +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7c91400b74ee45b8ff842b8f04d96c102b69100 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6ff8a5ea10c94f2d0316f6f34d9951ca6cf2ea3cb338f450be9ac76a7fa065 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..816f38d21aaba3f593269fbbd95ea1231ffffee9 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ae459f05fdddd4ec2d88e108f52e0fff87d8feda6554faa04c5fd9014f4d80 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10a1103c1650d2e29c21b2a35011fb38e7540187 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c86f424c5b0871656bd7ac344810dd160f1cb73b67a7320ed986118160fc9072 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeacabbb4d3d83103c6faba0dde5365f85474c58 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90776d05094f8f48cd1398a56a3ef43cd5bbdbef766933d33f9891ec9767c9c0 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0938e50898f081711567096a6bc322a95ff81790 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9364ce9b54af6ff524c4929774a5897cace647651039b112411a4a7a091bde1a +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7308b466070babea2eff0e18d85569803aa4822a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3397ff067fa3dd8a2d767982c373cab3c7efb96ba1714491109d5e0d1f703be8 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ed7549a73f694312110497d923707029c28c7bd --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26a86c67a547bb718376dc9847bf8e7be530681c204284920eaec3645fce9091 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..367da76da1486c200117f539f808e34ca052b9df --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b80e031bdb85e2fe4ad83abb3a9066372ec99b73dcc5cda777ce2825e02297af +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..714a83bd3950b14d91a9376cb4f9622069d5e4c6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f90c993cf15eaae64b950d9ee889ecf9090f47219dfa1b84dc78d4cae4aaaf +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cdda46d88dbc4903647a6e43c8694af05762af6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8d3de7131cf7ee372ec4e84d150497376ebd749398c482e43afe105df144d8 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91e96788a8b18dc945e06f97c27498ad6466bf37 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b152f32ce39f475881b9f4c4f9ea2d563e7eda74af82d9fad8ef3e1890f8dc +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf311ce43a56669614dba2084d0c56a810ffbe0d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd490f5aa6e77d175243f310f1e1e23eac0487b2f1e0d5d44cfd4749209df75 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c8faa84cb07fbed0b81735986dffc7e752f166d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18be75d8e88fa29c2bd1f15740165b80377301dfc65b3c47dff01931b2ed3055 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45743e8d1ffa954cedfcaf6cdd9cafe4c069b862 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1cdb02cefe2093eca0416f09d81c889e4b0b565055cab8e0cc7a3467f228613 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5c475d3a568b55c5645dd7aeba00529ac48951c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1eeab8549ef3c0c75df76571e01a232d2445f9f08f88eba0ec381989d9fdc85 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beec6e2a1b975dd03289bf2c5e1617da47135fc0 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a1d553abb7b9f768b45fc4b78596c95a197a6b28885558d2c2c64bd84b10075 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0c38e59953ca15186625c8d93a796d92a468e0b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b076a3624262a7e257c0ac265452227fcfd9e4066c83919a70d421230feeaa97 +size 199058594 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..912e53d97fb424dab3eaaaf9b89d27134e5b8e48 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4d3fe90fe4749f0d9699b86698f43174287d1fc69a1cc7b3222f1c5708c267 +size 199058594 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af28cd68ebdef929f4c9217714dc0b9e5879f202 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f5f339d0f704d47685cdf4842bf700cb3a697dd74b6000a6a4ef67cc6d0c9f0 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64784919b275dfebe59abf91026a9ccada4c4831 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5fda2c17110d2cee576d6b1490a470229190e0e839cd126ac4003bd6468021 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc84352dfda4ad291c989c0c572f45db1c66caef --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd2c642bf23b39bc01c393bc631406a2061e57e316d56e366fcded9cc08480a +size 199058711 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..572c891d1b8188e65831203d5a5fdf35299ada1a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f7fa32c8c0111899fb1d3645e9e5e242e7944e6e6a8dab861141f7f4e056c5 +size 199058711 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4c290b4a516eae425d91ca75b211a87b04a4d8b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb7daa681d5f44c1f9ce8529c3f423c9948666ddaa28ad7b7d55ff01b5eb502a +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50602636f8759339c2cf3f2784828db285d0948 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2b8477dba5fd6f85ab1976154fbe83a7290cdd6c4978e1e550f2a14c830fc9 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1722a68fd8e44619ec635a4d11b5af41ca5e049 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df75fc6ceea6d1238db22d9bde12059fb28611409c859aa538e3342c72cd6826 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f408dd3f9ef0fa5e3febf1bccda3ba83ab34aae --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0f10910cacdc7ace315f0d8f080d117fe59451d872bdc6148bd05f3c6f7125 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8696c0b880d39b536dad8d55affc8fd57d9e67d1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca97850409851f86d4a3d07b229a869b5932ccb027eb8e36f88df9000ceb5b7e +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..371bbdd0d2c694ac4e7ca6f53e1f9bb9e72bda3d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e7c86ecb767535463a70e9de667de8507ec59c6a5cb76b528b0216f2f64803 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfb7a96e2290f49fcb457ba37a3e2e3f37563807 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2395ec2d677fc13b9abfab5b488c86a623cb03131a29427c5e0db37a07447550 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..047b2143c5e3f4a3ffd791941a3ff8ef0674ea50 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884af038b8dbb83084afb5a79a2aaa4f4a7798ec6e0bed6ed45a9b928fbd0efe +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a499ebab8b223f87bdd0fc538f846677db3ba4 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156a867188b5a5914cc6daf86a1c3215b5d7fcfdbbb8e53e6393841d7fa7b6ac +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a08cd4d6b690110c36af590a70c56fca1cea6c9 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88bf62568840a7cadd8a9a6c84dc70926ad666cf1c9cc684a82cac66d9253eb +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b569df7cc1696ac7828b830dd89d2015b6180366 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71d460eb8549a53e51d5f465351f839d0e78d2c0b96680fd5844bd99bef28c6 +size 199058594 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c31cd5d62fec249b8e4528c78ba9194b3d4b4c29 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7531567effcb1965440f8a0c8e931294223745d3201be081aaa60412354ec6fe +size 199058594 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..180c86dcd55ff5d35f9d9fd71a2e57a6d669f813 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d2b0f94c7ef3850523c21e11ef2b79ca9528ac23a439905eec34fd073af419 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad1ee580c223171346936d5b3540c7c17928032d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeaf55caab08066cea096fd7fc729a306bd53414e7a58e390f1ac2494e07d803 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16b64ffcd3c81f4cbd8557183f73c7a93eb5f7ee --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eceaa749bc119c3f8ec48b8c28a14ddffca6d2143f74536a4301e6086939aa44 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92ac39a0e0b4e484748889f1f866e438c1b1ff1c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3440c17927d286fd628930e7296f25c2d055e4ad508bf1bce1e365b21662d4cc +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f9867ce8d68ad79c32d9e9629bb5fbf50aed1a9 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fdb9f39045f6fbd67ce868c2ed7f824db079342a59240ef89faec500d1eb87 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf5b5f03f037d684a9bfc0dde42d48fa12677cd6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774e74605eb747b353320abc80c3a5f123f0ae4c0737f3faa68f6a14033fc6a0 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b29c110952e888dca97e2832a62a105d2e61008e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa8f78be7a38d80727af938056023f346844a1f77952fe0958927375da61e1fe +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca95ec9c2fe140394673b7f939d25b3073aa8c7 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f803d8402c3469f1e6522215bd26f36405978eb5e8db319574e48efa12271b +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd19850341f4ddd0e6686c98a173725bcf688b5 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5759eff157135d697cdf2d1886d6bc6922b6e9c29f6394edbc4975804873eab +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c374b79590f218fb3fd7c0f04cda56f5b39c0e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a141eec6839064c1313c6099d5aa5146bd76198caadfdc14adf165defa64c6 +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b5ec0e02f9b84220ed033a715a1cd008fe6e080 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a561ec9b228d2a89e63daa8a482fda538ccb27a08bcd271b89ad74a9f527245 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..445b9f90d5470bca0e8807cb06585b27cd183185 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab84eaff67913102e430fc8b28cd707265f4020906a6bfb0070a07a39046b39 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf8adf3786094a367939985dd0ae93d7e27ca3b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be85ba013e7a23496940f64784b9d2929c3b1f05082b42a9f8caebfbcd81c5c8 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0510a395a959b01bedf7bcc82538f6f5e619acee --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99bde0ea7d5d89daccc5e3f7a3ec2ca552b2dec9e3fe3e3a8ab68222de0ada3e +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23fd800af9252b29931aeba9aebad9d62497b11d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3988bec6e5742fa8fb940e11fc05d88fb41a64013712816a94f73c31f409bc48 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e60f9dd71c4428fbbdd720247b1716e9cbe713d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f910da16994f867321cdb34973ec1fea9c4c0b05f5af12c609b4600ba74d3f28 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ec42f53d6464db0aa91e6be3f00c9990f2f2159 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f8ce3153e6e8e965168be31d5daf695233f2f86761c4e02d939e40376cfc5f +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad9871f23e06774df385adfe9fe82adfac44272d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bad0f55b895e99073512d5ddea30181d6d4cbfe5059be4d0c173ae21225f7a2a +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e03957370fe1deac864b279bc77767dbf3fcff --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c54f8e627318799278769c140cca0cc7875b11d6a8a90c2f5d8c0d40bf74ced +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5b8042852920230c7ab8a9e9bad8bb71e6c547b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d10efeabf4377fc8eef5ec362b633ed725283d39bd6f6cab5bf7af1fb1f643c +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f2883c33856dc3327412a47a3d71f6ed59ed54 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e5d50121cc4bf9545e21d0b22f54d730ab5ab60a2d1c860dc5a00fcd939ca3 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9892b94f01985e5ac9009d82245592d684e54754 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0c3f0b52ef308b82748f109997224608bd7aaeb601791c16a6fdfb58d1f219 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..260be689c32610bd248923abbc14f5a245f5e0eb --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89603e9fe7796c1533a48e430a626157fb39001aef3f8a8acfd154e0e69b094d +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..483eb7743ee863a1029cb0e3a6a70e81ee4f1c6f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68f06adfc861444384244a5f600c06d9486296375bad6c7fa4acb3de12b5a1e +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..262417e175ca40431397ee3460a2bfbd311d75c6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6674bf35428878dd0161572b12c3dc597f5323a87cbf4e5e930b6d2d870c48c3 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b1ea384beec0b5ee94d9b305f9000e4abfdff7 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278bdd46aad67f0ee66a847ed8782254656dfcad2b8eaf1472d26b3fca702dfa +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92d434e6bcb6541bb686cac568d0ec2cb56d196a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080769d5108219be7dd2e3cdfada7a3f7d8ee11b2f086eec379c14fce77a24e3 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adb3ab4441bbba03d58228c8d0fcdc6571a9eff4 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d19fa1a732ccf8a9bc14bac379f7d24b751a0331a022b3e8b64676ebd796ee3 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d73ad610e398ec3276ce16b8791891473690cd4 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e556b6d4eccede4e91c60ecedcfc46bbdfabd41f177212f9fd234b9adfaf817 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..166757e55d90e01c53ac0d8feb4937f93d85768f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9929aea7e679cdeb91049429229aaf44bbf877c6c4727f0a40a0b111e841d80c +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..482137a60b0429e3c2e83850f350046b4793240f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e799664e05f2a7183b002f79e2d73269d764ebeba57cffdbc9b81968c072a9fe +size 199058775 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ee634ef389c9df381a9672d70899cb3b37e20f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0595950b17c663896dcafc58f3f8c77b2de02e187ca126b550ca4c09a8230daf +size 199058775 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb6ea5e6ef669bd70accf20f85c27b7a8c87ef83 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aadbf1e882e22c39cf11e7f5f1e3c4b7d232ae98f88837262391416035c561f +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9205cfc5df374398a4b5d4c622dd95e402f00f6f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32424362fe5f488a5fb99bc57b9149c936144c4a37e1efee1afbe05fd47d0f2a +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51c0bfe978cd0714afda463548c5d5de70e93220 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a25f8bcbcec0a2c02dcbb9c1af1791a0c94950ae6855ea446aab6ed710111f98 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..908cda80986527b88a9190e37c3d072ad3156b7f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1d443c3d503686b192b29ded4827c072544b25bf311e044fc16256cb1f644a +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43ceafed2e2f830cb6e4a7ead8626a19bba6a798 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ae38597e97fea70665a8cb610fb4d6cb1621d96efc8ed5ca4ab2e5ac3c3565 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dbbfb7701606c7832828fac9becc20b429d480a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10150112b30d622cd3845034b4caf103270bed64b2d759510af74b8e9c0f3cea +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47606bdb094433222bfb1a46b1e668ba9163ff11 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849e72f029b6efbe9cbe71ccaf1b076ab9bdf73cad58024d7dbd890f2d821a66 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aae256b4f66ba2e040a10c400f848e74597d6e1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3352e3fd586bf648ff28cee5b1b577363a091fd3fc16e08ed2c853253af17a2e +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e282d5ab3dc31f9e6863acec2c963c6b1d239bb --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a38193540b0ffb440f6a5c6f3afd356690d8f065842b31688acb28e7a79b31a0 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a0cb9057519ab1e1575c548a707ad4c09d435a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c613fea6d9dc70a294c44abfe5536a0f56977f8353745dc838232acbb32b3205 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb626f96527b22a8462c83a28aabe70b67d2384e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ec75b69678b159f06384690018b9f4393fe8afd842c3cc25872007ed39ca7b +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0048a267260e445ace62ab3b936782d8f576692e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2430fd48824e8e9e00469776ded8ce8bd57b0c202599d1085a3ef6acf7d1498d +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f993ea9311096453e88b6b91b2d5aee4ea3dd797 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254bb1af635a99dafad36db1a27e59cd5c8ba1caecef342773a98e0189f7605c +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f38c7021909c9ef72f065f096a3140f2fab062b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700f931e28514baf3a61b61c12b2171ab10cce7df6d68a5e74e4ddccd23a5315 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d053b2e9e42a8e286a9fe8e00db8fc2e066898e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c94e811e648c1c33cdd58130046ee2e74562d7f668a883398457ee48e5b97b +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..258e2ae97848b64d4aea386c4a30bda15f0d8071 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1b1d88c23a5da5a0850d1fa188bf509f4916a88062fa1a55f34e8116999361 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f92e46b33b1c47b3d0bf5a9ffe6f1b61aed4e502 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2565592088f377160b55792aac896b68896b7f4337fe385dac1a9af373b8605 +size 199058914 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c8e712c6a23dbb11ab7f05bc5ddf9bb807b11a5 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dafca7f35470a3140b7042fd04dca618aa7d56ff45671d7f87a6311f8fc74709 +size 199058914 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6355ef59c3dc235889c98a7a74548aba02a8e101 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fbb42062f518bea33ddee7e4b5ea4b51a1bfeb75488ff6595e437d054fba154 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..093409cdbd1dbbe5e03a68ed70d2d6db7321b02d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49eec777707ae1179abb532f7aa6bf0305e3a2be6c518bbd5c19a8d60ad0f14e +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11ab16184fc60165efdc49487fa39fb106268426 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5665564f06edf8513a94135463d7508bbaa63edbf75ae47f20faf506b62ed60e +size 199058711 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a63cfc55c54e88b8b2bbe18d6a30b229373dc11 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:299131444d35ef2cd790d8405c0dc6c6adf0e31e071c0e6ad00f0ebf89771fa1 +size 199058711 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f135332de159eccf4bf985da1edc94f26ae6859 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e71f224a918eed18f469290f7cf4b5910a2c7ce9bec4a1a264761ba39c3366 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07cfe88471a708c0e7fa2749ad214650d3a18512 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9a18f13c0d4efb18a1c61bb8634c7ba00dc09bad7512b68f398725de2ca04f +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50743e124e2b5e45e6771349ece10a157cc07e48 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94330dcc6645d5325426d3d54c0b1c3618ea4e6a1941eda501d07a6cb48b4ac2 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60606f1bc1778ad1df6a0484471802c92e234530 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7468c18f1015d802a71f873fdc374288ab83cb321043c90a6d95847997f7e24e +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a3f683278d188188d8987c1005526d3851c371 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea8814d0ef6ea66276eff60f9a74ede5fc32e53230d718b2f4d81bd6eff6353 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e6a92dfe315d515f2468dee9d442cd2d308a52 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a2a2fac41cf245689b3ba9299e7ce3c50213932a56c6cddc01884976a217e75 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edce0456e4f979ff87d804dc1a77fac4a02c3853 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd20521feef176fd41a65821a15426020cec61dc79bc94c4b788b800e2ab24d +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60c81e38eb1dd9fcdd0cec9615a9838ac1b23ae2 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d81b6d8050285f32fa99ef9c1b7267c0802ff43f615ccef994e27fe28dca9d +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a08e2c39ded3505a9993278e9c634094ed295b50 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a09c3c1a29709791f7dcee213c0f79d649ff51a99be00f1345d996d35bbdea +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a8cd49263469337f5130044d027515423fa0cc6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3284cb42d18d1ef3b5c95781e2bfc536068becce50ec25aa502198c0cca89b4a +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f9bcb32e37c290ca75c28968295804ebe069c3f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a0460214472d562a6abbd7bced0cbd49cac8e357685cbe55346a7b8a6c2c79 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4079134fa24152d8b65adf4589b642becd586cd5 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:259e5d3901f00d3676f82bc13b80e593217aa239a78e30659d36eb9e00bf3bda +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11c7db8623cebc3453871260a25bdc6f84ca25af --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8345675d8084d18dbb61a4660b156850c34fb569fb7fb3c9a0e26011b4c0eef3 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5fb5264ab0eaf2c86bbde55d1645bc487e82a5f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370a8d0a7cef7389fb876dabea47641bab967f9a3d42798a7ccea0421b09302d +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98805beda9c3173486b5359ab48b4031fa3fc1db --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9075802511adeb76d1aae526544b0bb043a3aa1947a8f3e44267448c4d0c463 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28946e6274a9757414c92c87887a5a407c953990 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e00c44a80e9e268f3601815a0e7ffebbbc4f0153b42b601afab184f89f99032 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f28cb7de8f7dc048a099d54bb5b1e5de309d861 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6fd496f50d29b63a13b01ee5f2c9559ae9b48c1fe54cdb8e46eaeddcde5fec8 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6ee9d276f1a7a5ea842ce775a02c6257bc0fb3c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:165762813cae7b6b710e1c7886bbe8ec598aaf5ee113f68ecb69de994c0e6e47 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dd3d57b11beb7f17dfafc61a100dd47b36ec3ce --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82271500b90a200bb1ee0f1eff3c69b93fc6f49cf5e0f9e4644eceffd5586a4c +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..664726f45695fdc7c5cfaddd5da380d543beec0e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882933c595d03845d62290162f7064b34841db0a75fec996ba21c8dd41507fc6 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d7727862ddf461d656882214b978eb268514abb --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1dc67636938857c45858b4ac5f2788574f3102feba413a5360b8f9359073da +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f485c522eb5acca14a7b0632caf8a6fe95521fe --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4db30772b77c0986896684049556911eea51156e6f1ef63d1a07835931a574c +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae014f28ba0180541495a10149c8b07e8058d349 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:085ca55f00dc2ae84eca161a99885765e003c816655e7033796ab3692d5e578b +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd06ef9fbdf1c812f5120953f4109d16ff545b38 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:965d9c4e2878d8eb3b0448a6b85b8496cbc4df680a79b3da521c6265fe9fda70 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c300e30c96aad7ba7ba0b10393d590e9461154 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4a368707aa2f0368dec592bf62388aadbc978e1a9c46cdba5b2af550a60fb6 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e8a53c263eb381b9a1b15aeeb98bd3acef7cfc --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed0cdfe7896a9b0c7e2bfa5547e0d5ca67493d51dd991577579aa0b3659e1ae +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcf69112545266e4224c255b739a4f5c4f1df785 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1ec02124427ed22a9bce9eb8db4574a96ea16c8f017116633133702bc1bb9c +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e96f537f130cbd6d297465ff7aee6113537c0f1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1e74a1fca8afd88a5bf5d98b33c2d76575452f1c4e63900b595f79947f81d6 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f61d3a6a167b277c924b8afd3462035a11ecfd0 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e94a445a14f973f5a16c0e6b6075e6a4583fd08e1fc531f3e5c47c508d712b +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7046841497585eb43ba834e120ef93b7692c9df --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a40799f5307e000576885e218af994e25e4d632196aa1fc7f648f8fc600b3ab5 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6251e74de8ef7d6b23fdad204a5683008da6fb9c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54834ec6be14d6cdee2c28f8e20f51a390b7a143906335829eb1543fc773665b +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c90ffa4717060121c905d417e2304245f9b6734 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49adfad9f5cd6dbec65cfa02573614b8597f675f33714f3ec09b171e6a19e5a0 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..565d75b3027dcd7b7774184122607531bdd910eb --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0b612f19a1db878c2db8975522aa2f568e5865a473efdc92483f3422c58219 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f511ef583c0975a476d85a196226dab9522f8ada --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bdffa702b267c3c699500ccbc9a67e92e7226057331c4d29aba65e9338fb237 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee5404e1d01cf2eb1249b551079aca80c9da95fe --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73d4855331c3f634d1f6d218eccd07a5f2d7b8220dca392f192d0488446548ff +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d158ce18ccbc23c635ff132dd6a916ad4b2aa2a2 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b75422e17c9ef6711e561e31e42fca0d5dbeb445d5656867cee25a9410700d3 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b947ae30e2c7bb6fca80661a0f2465bab0b82947 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e74cf79a93cbfe0c98b6f52e53be69d87fe167fc05602587c982d6be131ee61 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcb84cca78ef10faf5d803c463f4a4bd149d9dbc --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ff3aac7222b54aec8390c21cbed61fef1867563aad5c81fb2e495eb9914462 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e9d19422a17b6d85ee8044d7f900ff054b8b0da --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1c351c8cc2bcc99f584a123984d83fbc5fc80a3f88a89a07bfd279292291691 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b35d3efc09e988382a89563be3e49fe1716c9921 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531e007a569cf284c3f4ad1ff10d3fdc319165bc11873fcd0751247677f4c388 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27139dc194bc77f335dbbb0357a9aaf4ae579421 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcf7aa358d3637a62c2da2daf13830099dd351b3ae0a4cd5e62345ef2073b662 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..770deed85d66b9081099ed8531041b5a69563c80 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a342a8e0530f77a640350d62ed6f5494a8c52d82bea1e1bf2ee9e467b2eb5d6d +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20b1b5633d9708ce912959f3ed5c10b0e1f7a54d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b54fda60b0a131b8c8df665620f1e04a964d9dec7c82129c7986013750932994 +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..839f4bdd1ded7b8effbf2418e51d0988e237f6c1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24395b574138b9af2ad72ce84d45a3af1cf0ca56487e014f3d85147c3720207e +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aaaaad835855cc22c008fe44901eb53f8142325 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c17114ea225c1b0442a4bc69b7c4e4eb370c7c6dfececbb9b580f72f2e12329 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2247b7a3f3148ad7905a464d8b02a6f7430e8987 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc42bcc99533b43fb8db37036fd8ccd330b128e6a7dda7d691814d16c0c56c0 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ad1570ee587901c72c7e11803093329c7eb1bfc --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b76176a76053abf954f9303d01fbca095880582a11b989541bda183679ebe796 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..723d746b6e571330b3b973a9accb367d0d9cbfef --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77337d48835ea8af79d79057207ceb5dfac91bd9d8f72574ef6f9fc80efe3677 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81509457f2ce368400756f52ce98a542badbd28a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74d447ccd1b9ee603aea6f2306d93497aa43d5938ecd5cbbdc1e75e6a8eb754a +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15022637713b1874b01ce505f74f96b460215623 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05986b41bfc4ebf2bae75698a56fe91fafff575f93f11338cc5d5e11c65739bd +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cfce58716b30b3bed77bff4565f0080f6f171db --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af6508559e2140602e6d08ca69f453a36a48f4d9dcce78b07b0252567de0a729 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7054537a66a77e903842eaa37efd3f0ecf5af84e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d543634b456eac6aead696ceacf6d7c1bfb79812e25048ac208587cef71ee0 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..752f48479f1714523086065aec6435f30ad80a9a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608f0c25909426402337e761877f700e400d7fe5ebf9c67e3fe9bd55636195b7 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6d9aed60d245f0725dd4af618c1f83e5d7910d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa1370473b6b2441cffca5872fb994fb52238ddddb819cb4afd8e2b3e209b70 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aee3d7be840eeed98c00143b1ace98838df5268a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdbe9e16d48b1f0a5a315b39c190fd8f8b2ccd6e57c935bce76234b8951a4e5b +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a80e82b0e76f934fd976ec6e277a0b420226fd2 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58afee1668a8f3f199d252ba6b625eaff1ff6de40b0b5d1f3245fe6d4070a7d4 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e23bee822f6c0225fe0320be9314acf15328d384 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd089cba44471a6739d3ba394bfacccb1687e2331486300b2955e5e0c563337e +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddec5ccbc6eaf8a6cb77c52248ea0ebf8fa16455 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea27a4093491c37793f95ce673ab93ee721ffddb21513880071a2d3be2c22757 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28de2e029104de2b77a29cb608c97d54aa97ebeb --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aecb815464069c6f377eb96bafd52bc9a79fd6890f3a35bd0400ae065cbdf6bd +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31eebe3e2390e6053d634c971e0d384cc333cf92 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4779378a76972ac00ae2e2a23f7966f7f704f5679e21355340531212611daf49 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dbecd2364b5ce1e541fdcf6ae930aef365d3fd9 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058f04034cf821669811eba296a866d9a657aa69acc9ef2a3f3ecad8e61b2975 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54967ad92c947d56a3e0c2910cd8f35af94cae24 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72d44ce52c63d7c0fe4482b57755d8c88af3209471a12b976e9b1494b343ea8 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87dc8c18cb543894dfc904d93ba4902ec65e0caa --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884a40772263f72061aa3da4dc5b9765baab87a6f44d14af3aecc2ef35df4d53 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ab1d8e0e41a49847c1e5a4e3512ff69b049b2e6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69929d75adc6935c4c8ea3609011466603682b87df66980f1460375343239827 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..284a95bc34b9da84f9316a6713c62d8e316edc54 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6272737773cde7989a6870e45a89aae1db2fccfd975c9b231e66b3009baf87 +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f2a206dd4ee9677db2f1fac8ebe72a1473432c8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855b139fdd63ee929df7b7a1ea35c74d69e8901669193c9df94c9598bb86182a +size 199058647 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48b4479f1e3a0fa79a37b433d02b2d0c5809f093 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5428c51df633d65eef7ed4f26e6dbf05de689a220b33c713c9e46978e13f08 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9c6c7f610a7a51f7194dc6f8bd9ad1220f06d69 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6c9c73b059bbd9d1074d5e7dd41112c1fb09c69dc6f00f526c25ddb6a40438 +size 199058850 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3b4b694a7765ba9a6557918c9845e38b4d03ba6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f606703eb9b8c4c6edfc48c2920299e0d3c910316406fd5031227c2432640d96 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5919fbee669e6bb46ef627792099a20779a00c3 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b830ab847f4dd273a73ea9c3abb25c16334ff808ff4b5a5e98f8c9f71aa0cb1f +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d18fed61b17a4723bba3a98a4b9a8b8917c0bc --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca9924695f7653b64d1a022bde2b2e5579b75b96daf203a12c2e667263f39ea +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a3cf02a78cfd424ce623c15589864451aba8a31 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1272fcab369fa434dd337790454e2e628bb373a3df9738fe38e90de4d3e712b1 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd798588abd1a5d313a41fb01204a4af84d13b2 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113a204450b41ecd99cf78d93ee6332023fefa407437a60fa0aed561176b07fa +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a544951232a5cd0579f12e259d47717ce4358597 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0da1d08be149ba7fbbe2aae537302266831a9127993fa88acbcde203f9c74d52 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b66062345c5d90270cf8bf0de4f6bd9e4a7d721 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fbb67540156dc337ed35aaf157d11f3b3fbd21a25b4eb88d475b197a619f8c8 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b7b1a4c835e6e2f0e4da0601a8efc02b316c4d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bf6466cdead9ddd1689e0a94747731fa8428b48c65b448082609e9e8e67bd03 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a62efbaf6d81e657af64c2da39db3df2662b6cc1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c583147767d8868f3ea4a6dedcd2aefd9f035b5d14906a3e672e55150b9e9df4 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f013259ba38c44466f9de9c4176c06a3b749b43f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b9bf7ba4650175a6d11a8b67bd1bc4ee76eb10911539bdf7d5c99ada52e81f +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f499f35e3adfefb089d33ace9138f35f974e815 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade3223c6bceb5a54acd0ec33683a1708d36fd1f0c662f3d75492d27965dcbc1 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f02a91092a99671741a4a83ba2284ba6f0bab556 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23c97e46b40ec082aac8c59cf227ce40e6c2dc616867e602db3c6e4f87ca5a1 +size 199058722 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..715d6292fa99b1bf0df890780676d99893680a05 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258b94452f375efa98043a4a87e0a1eccb410b9aa945f36bd5f7cf9cf376b595 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d94e47f1ba41cca2c47de9f6c813601cddb4d610 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9342a06bf973ba93a4356588a6cb8f3bc7281e51a4c22efa757975d5e694ac14 +size 199058786 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41bfd18efc72b26211e6154d20ef39dad9bb2285 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6813f80a71b3e18334ecdb30c4ece638e01204738f4586cb5445680cd1d8d3ae +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce13e10bf8777ad7991b7c11ae34d9fcaab2311 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e1f74a5b18305b38bfb523dd7743081bc6d053af387ceaf72fbcb6e84b6347 +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..891c7d0d66a2b2191dd3e20db682129b5dab52ae --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea420eed14347570968155498da6726c43a3f327b86e4e9309b79a162a1cdcb +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0661de364733dfcc74a699b4e40112ef96409e1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dededcb8b8bbcfc9691f18f32cb5d69f2473bf42390ed4590d3274f31b6733fc +size 199058658 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f4775c0101cf16f18b6efc48e2c0103cafbe04a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:806918866176ca231450c3b0eaf86a22c349938669d0cb798ae15be5ff2403e2 +size 199058839 diff --git a/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55abff290f6600c0f0d52154553c0e7715d2c48b --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eadb74c6cc08133abc2dbdfee735101f314dfe83ec96e2cdcdbaa8960a77ac3c +size 199058839 diff --git a/4b284boscarperplexity25/global_step80108/layer_01-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..192ddf75eef9052677819e98627250a07d6c68c1 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da59e445fe51191243cc3f25478c3ab796a2c2f62f983276b19f26b33da3e4b +size 167511299 diff --git a/4b284boscarperplexity25/global_step80108/layer_01-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2019728ccde14c9b1a3891decb65f7803a14cc66 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071efcb5717596bb4a6946ee032f28e2bfbf8e17300bd63ae0454dfade877876 +size 167511299 diff --git a/4b284boscarperplexity25/global_step80108/layer_03-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bea1dfb655c382dc220c01edd46c050cc8268023 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42ab5aee76cfe94e2747736217262af2364a285cac3ceaf16fd05b3cd3a7d516 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_03-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6de53a9aca7f8b237506ff30c9fce6c6a51344a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af036927e8221cacf530a1ef3339a421bb427331a3387e2a34272f3615c46605 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_04-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a94f1e2a1ad84a3cc0675bfe01754fb02e9a365 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d15bc1ded0d3b670d8c14d284d316f3688a3de6f9f8bb6be9cac70e5a45803 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_04-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eeea68f3e4d49f6ab3878e92701f7ee264fedef --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b0f9cec13558e07bf2d94ea02c8a3717d5cf6c1085a7956c961fe36a4838c4d +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_05-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..353f311952418eb903c24f5b86c91d03ea99a4f8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e46e82a67547306f671c7c6c4fb5ba8021cc3789dcfeb615bdfd5cc9726a5ca +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_05-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc454621b4aadf6ae8117820eab2a5938e2b292e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09928f975421e5fc8d379432759f3e3b504424717eeca9bfbca69ae84d3c9b28 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_06-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ef7a2dc4f5b46d45c419273c24383f3bd4b211c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db8c5573e8be1b7044f73f83d2b29bcba4ca8ec9f7cc58dd363fd6e4eb6984a +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_06-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3080f989d29d36678a83e716678d2ccae0f533e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156ddddc8ebd6f2012e46374530ddc9c20fc36df8800d21804b75a46da240263 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_07-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeeba10473281bfc124a3591c3fcfbf59db60f4f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a6b74f080971e71511ccd18a9840f31a6894e8f7ea18b51d6918e64bb0d2bc +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_07-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5260e625a9937cbfed1811c1d3a0b3dfc5ba647f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c93e7918af0ac66207991225d3ca5e85412902eac188747997c6ae2e6e4b9144 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_08-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..317a36ec2f07516f1a6aed7b2dbb311132862f95 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70688ac3717b07c2bd4b5fa25a7866aa57427f127d2ecd31e247bfcbca2268ab +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_08-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..603087df2ee98890316e33bc5d0fa136648805ca --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda49a5c177de8a3c6dc7ab91cd7e1e744b3486349ab2807c3ad76d089dc8104 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_09-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c41cc0fd24adf9dca7e87c5af2f14bf115531e38 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55da280cba072a470d2b2071ebd541215ac572368c1dd80f53ff3d1c4519d00e +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_09-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c9107b19cb1a92ae517ba46d537e85f3d198fe9 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67562c7fd88c4f198e5a9a5feb33d795edacf83fa2908549751de32e6ba2fa85 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_10-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a93b6965766d135e9cdf9eee3fe167b24e76f4 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6deb62fa09ef3d7ef2f829028314c72a0922431f0f737b46f7407f906fc541e3 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_10-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e58f77ce1b9d24a14503b70e0addff952687e670 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e433f4f37bceb3a0d73b8346a7cece07121161af515cb461ba105bd3e42b9921 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_11-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7555825dd0ee47bd0a59a62eb10b00c5f969180 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1cb11d2709208f70211346afa4a56f9a30d79ba4dd23331403f9cc57019e8fe +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_11-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e2a7e9b53e609b5a5f0022f0502a54596df2fd --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c258b34abdd7195d10ed664b5673ee491d06fb477489410754abf92bd41c1c +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_12-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c424160e488fbe61e69dba142616c4c334a3e99 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79a103738ca9c8476e598265c9f6fa916ee6e879967532d4ae1b3de37968f908 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_12-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b1727677f8ec994b68c590e9a1f75acf0a43b4d --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d4f03dfed18c40b4163908949be543d0346deaea3eff2584d3e77265230cdc +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_13-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc1f0945db8f400b57f86a75ebdd634c2152f0a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade09782950d7f1c60f24a9ce271277c9e8c80aaeaedda91e6e764208b41633a +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_13-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5c5d4f9e7b251c131189d09ed88df4cdbe60f0 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03cc274d3d0c0427dddd0025600181febc23aa6dd44e829496065b319a453f9 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_14-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caec030eb6c05ad276a80097a5b3b32f7e61bc03 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e119dd522ac4bd59c65a8c418dda3430f05ce85b67469a65c3a0e40ab3b7d67 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_14-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..012eba781f75db8f65341cb448ae25ffdbece295 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7def408aa7c6e037f722641569b0aa37cec58da458dc8d6aabd37733bef1922 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_15-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9fbada821ea6961a9d783ca735a0b8a74faf17e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e43c25814d7d3d9ed56028cf0e2521b422480880434e840fd171b9ab98245f +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_15-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..887e006e55f4180fd046aec4bed2e26995de54a8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c365b03ee372182be6a37137676fb80fb7f990cc99d21ea462bb7ad9b578a32 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_16-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17f0bfc725f588eee506f018aa7c17bc4d04ba08 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff98c85e7daeaab7d3517ca06169268098d02e850be899787521db9d7a299bc6 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_16-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c3b037984d3b5c0b99cb79e1db3438f2973929c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90aa9acdfc9db2d15fbb607a0a24a1f4f48df4060d572e63bf13a551ebddcca2 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_17-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37010238b56d341057819a54fec365e91200a3fc --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1d29f375b3688c38b5780ac14b0efe620774a9d12806407c96a92036b67d31 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_17-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b2aa71b7f60e2ed444c48d26c5de3c8861c982e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d3e35dc82f6bcfe35fa1d9fbfe6b7b19a8f5f0e81d547b8794a7e1b1945bc53 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_18-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84b42760ccad64bda31eaa26cb0cc58fa369fa3c --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10c81c1b564828c6bca206e03f4d2cd0361575b0641a7fe0fdd86167c3e6439 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_18-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00e0912a7713bd90bd2bcd73b8ced91c43c66ad7 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e715c5c64e3bf1b357baf8ca3c95294de73857d1de4edebca14814edb9a60986 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_19-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6297654b02feb8df9133a02711ef37d3e7064cf --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5da73463091e755ff0b367f4b73e954e1572bcee0cfedefcf66de5975d9ce97 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_19-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9796c76f2bfa8e78afa3505575876e4c2f5902fe --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abbd927eeef91defffc3b6855383d6ed35154d1f6194955dc3a9f50bdb6e812 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_20-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26fbd3b9c7ad7ab9a39d8982f19095429a280bd2 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de88380f976161984392575e40650010fcf11789db371e4ca484424bcebe3859 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_20-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b3386c6e1ec39ce89076c5c8202af4d3596d42 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b4a369b13d4e45006a3a55ef2b2258771966d20ce95bebb9df7417ad3bf615 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_21-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1eb6ef3827d8fc00922986dbbffa36e87c3391f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643ad0b460eee3dc1c68360f618c3ecc4969ae65784009ea0e09172be30db432 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_21-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dde3cbfd5b68b83a9f12961f6a2c5fbb708db3f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a4770aaabbcaf36fc40578535aaef136ea21f1aa798615990f452e739087ab5 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_22-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..617bf6b1543012440a36244a0f8819eac0b9fecd --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abec5714a3887a654b0e2bd5d13c11ed89d3a648271aca441fb58a16f68bf79c +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_22-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e891182dca87e627a17ef81796d5c4bd761d834 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9589de8580c2712afbede99b10cf75336f7e10d90a74f971878fef3d05a85415 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_23-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1267f7229f3b2d91cee8234d031d7758a159575 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5d14d2e6091cbf76435cc5b12dfdc0f07bc7a6da19662712e47e0042c30b8c +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_23-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..949b79d9ac1aa938ef80fa86d8cb496f6e1a3240 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52e341e5dc2ae10332fac651bda0aab1f4ed2e9aac757a0f2f84e92a9e55b16 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_24-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cf3d31da5868bdd32eb8b53ea12803953c4c660 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da41a3b0cbb8141c6592e139ffb2425cf1ead48b427180cbea4dbe5d182cb3c +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_24-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b426398342d2a4f04e5fde6e51317d5fd02f64fb --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:806b9c27c9fce8260c8184528d8626ceb5a6ad0b2b5674494fe1555ecbc94758 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_25-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d704e9d9e1fa6adb57921afadb2c59239125e2 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89de65194a81d3c5ad0665ed6aa6549fb28f29ef06856f60305850c73f52494a +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_25-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..760728971c8f1012c029c3ee29ec781d22871ea5 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7878137e9d38167c30e4a5fdf93344ed2f26f476364950f967f9e8273c77898 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_26-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f738a209d3b5a83d848e8d65d09070a7b480e3ca --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a124e3843a57184cf4996d75720bd310c51c5a0ea92836fe959d1f8020401ffd +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_26-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26dec4a59914eb2c7186da65a580e9b39d7a1418 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3054131b0c02feace0dfcbe01777d9de15c6eb1650718479f57aae9ddd269c83 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_27-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b310e5ffe27f68e0a2190786a2030c614d9d035 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1054ed2a3aec99ef44b9974f72b3f1a1e4a948e019d98e492cf2129aa2789830 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_27-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba99766072577bef6bf80b48f25c66cf08b0f7f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef15928ceadda5ee9493b7001e32cb4cd0828f27b5acdc1935dbdd1d38432b2 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_28-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ae226ed53c8d5ce4e992426b99343def71af8f8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ded6fd7f36ac2f58518f6b2c3a9ce6188aaa35d53e04b45ce54e0ad46127af +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_28-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35182b376ea15ddb7023d38a166e2af5472d0b69 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f6f69222140b941ee1ce25fc36acf228aa0d62f6f8ff59c21ec501b5e84544 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_29-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2c6b7dd718f203399a05f052a465e7032651926 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb5d4e70da5051691b84ffdc43f295f295a3021cea5dfa1bfd3e5e8260bdd8df +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_29-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c633bd1c7b5f6429a02db9867c45ef37dff28802 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e047dc6d68291e6dc26a68a04747e96ec09ac6edd1f9b0c1bbefc8958e440e7f +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_30-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79927e1e6964cf885804955fc1dd7203808ff25e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d06431d785b070dd1ed7c6c6b9b6768943fab7ade119e335d6e6b307e59d722d +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_30-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee209a958d78f106ee541e7774459769390c7839 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:805ad213b878fb012cac88a6801389cb8c4f5c97b92bfbe980d023b2c582ef77 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_31-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..035ff40322f9562d431f643dc3ee0c7b39d69e60 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f3d5bd448dc0ebdcd7fc9c5e9df1d0b26cf799199c71bbf1b4df2f4d5a983f +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_31-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4326de05bedf7fefdd80e2ffb15db86fc5e16fad --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c347ba4f0b032b6af0fbbe5bef990715a87285c8ec1bddeff49d5b9c9af793 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_32-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80050f610be1dca5bd572a4c0a150a8e85a325e8 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06806bdbb33086a2751908b7367d28e7a71fb5355fccccb693b4ec3e7da6101c +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_32-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a735694b5d7cea23f0b3784ce944cc7850d606a9 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e694a21f51ccdc15014b93dd05d4a411c5858b470adca136d26ea09b38e6764 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_33-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86bb189001eb8b6e7ffa3f063e7311a06eb2f683 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56f5bf819f5d40b6efc310f44fa40de9718bcb66bc96dd24148fc96fca56058 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_33-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de5049edfaa921335ab6bd9d5a2a4230aa78782e --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb671408c640cb187ad04acacce546d7cbee527eccb14db4d0e341279c9b78e +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_34-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3303053c6a38074baca46a852bc9161a6b95ab76 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06de33aa864de484d98563f50249bb10ef457d88fc6143ba7322921428a5cce1 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_34-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2732d314d6e97cb9ba16a25876780abe5ada5fa6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc96ba34f9490bbe44fd29d9650c6705e54d5dce6cb7e93aece9de1c0607f83 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_35-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4403bde577d1be9c3849d6e86ba01c21cad2a1f --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06cbb32823c3bb5a722aadbf20693ff7137ca50987b7077c127ec9b47f94eb1c +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_35-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6bf8394bd50c087ba9aedbeb4991d7f9e805761 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c31d19efc128e194b0c013cca094f3d40ca0fd6c7782a994e083bf3ba292ad +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_36-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e566ef286656dd75005ed709ec14f367b7c4fc73 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6327508063042593527ca668e972d819b72b6230b7374ef7c3f37ac86323243 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_36-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6651a39852eaa530cbfc4cfcbe8593edf1eb6b35 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c95dabd22e368ec247e9a935abbb4084a5aa412c927f515737a818cc3a116b1 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_37-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5741b8f32e7b6ba176a7bb86e0b3699af736022 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665abe78f036c55e995823f0bdfafd82a5bfdad707154c88bb48a36c57247335 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_37-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fa0fa64fefb3055bd86b32d6cd92934d0ace620 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8090dd88649d426c22f0dc79cf650357c23db44645797f02e05c1a8df4cdeb1 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_38-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e410a1219b1c8b381559ce73821242a60cd8ec6 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df6decd9e81ff001ec4ae4a6092231d253992ca5dc1770e7ce2a87bfdf9d5f2d +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_38-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..610baf4d6a335d8ef5d7e08e6f199132e12f9dfa --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545d56387c829367769d9f79cf7ba99e23f0b5510c17799de2df8ad80326d552 +size 113308931 diff --git a/4b284boscarperplexity25/global_step80108/layer_40-model_00-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29e89fe0d58e9f5dd12e522182d8ad98ab45c390 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f935fdce5f9797bd6fe7b3131db9a9a4d3256c1a741846a3453a76b9984f2da6 +size 13507 diff --git a/4b284boscarperplexity25/global_step80108/layer_40-model_01-model_states.pt b/4b284boscarperplexity25/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..009d3b8833534d02e021752cb5d887551902f351 --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7312953d8a5478ff07f32af9028cef1541ccffba15d6daa8078d4d73c994f1ee +size 13507 diff --git a/4b284boscarperplexity25/global_step80108/mp_rank_00_model_states.pt b/4b284boscarperplexity25/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1a6b403e2c5d8a0ee13d2da8ee76b488a9edcbc --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2452f93eba390646ffe35173ed7d5308a4cf519d5b841607f25bed0f82c1fb2 +size 51699 diff --git a/4b284boscarperplexity25/global_step80108/mp_rank_01_model_states.pt b/4b284boscarperplexity25/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12b6669f678c090376163d8ae65be5358c91047a --- /dev/null +++ b/4b284boscarperplexity25/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d79f99742f0f14002b346d2ee37aa00e45dc6b66724b47aeda2f7ec317c2945 +size 51699 diff --git a/4b284boscarperplexity25/transformers/config.json b/4b284boscarperplexity25/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284boscarperplexity25/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284boscarperplexity25/transformers/pytorch_model.bin b/4b284boscarperplexity25/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..68725b4587fdd3f1893ab0e7f49de4076b1a2085 --- /dev/null +++ b/4b284boscarperplexity25/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04382fe0b7414f7acd4550a87bcec40a9eff882b9cb08a781ba7e986bf9368f7 +size 8781203669