tulu-3-multipref-dpo-gpt4 / metadata.json
ljvmiranda921's picture
upload checkpoint
d8f51dd verified
{"model_name": "multipref_dpo_gpt4_overall", "model_type": "dpo", "datasets": ["ai2-adapt-dev/multipref-gpt4-overall-binarized"], "base_model": "allenai/Llama-3.1-Tulu-3-8B-SFT", "wandb_path": "https://wandb.ai/ai2-llm/open_instruct_internal/runs/qevai2gj", "beaker_experiment": "https://beaker.org/ex/01JKCNK5Q5BMKDJEX8ME0SGM6M/", "beaker_datasets": ["https://beaker.org/ds/01JKCNK5S2CFNZZES1XZ8CT6TX"]}