{"model_name": "valpy_dpo_70b_best_jacobnew", "model_type": "dpo", "datasets": ["ai2-adapt-dev/sft_v3.9_used_off_policy", "ai2-adapt-dev/sft_v3.9_used_on_policy_large_70b_ckpt", "ai2-adapt-dev/WildChat-prefs-280824-uf-pipeline-regen-v3.9_large_70b_ckpt", "ai2-adapt-dev/Llama-3.1-if_taxonomy_tulu-uf-pipeline-regen-v3.9_large_70b_ckpt", "ai2-adapt-dev/wildchat_v3.9_unused_off_policy", "ai2-adapt-dev/wildchat_v3.9_used_on_policy_large_70b_ckpt", "ai2-adapt-dev/ultrafeedback-cleaned-regen-v3.9-70b-sft"], "base_model": "/oe-adapt-default/jacobm/tulu-3-dev/checkpoints/base_models/L3.1-70B-v3.9-nc-2e-6-2_ep-fixed-3/", "wandb_path": "https://wandb.ai/ai2-llm/open_instruct_internal/runs/rihjbpzi", "beaker_experiment": "https://beaker.org/ex/01JCSAYYHQYF9QDQDCV6KJ53M9/", "beaker_datasets": ["https://beaker.org/ds/01JCSAYYK77W16Q5RKRHJ0KDFW", "https://beaker.org/ds/01JCSAYYR2WCCESH479CMXQ4Y7", "https://beaker.org/ds/01JCSAYYX11JR5ECZHK6ZD82YS", "https://beaker.org/ds/01JCSAYZ207D43NNWYBBTVYEDT", "https://beaker.org/ds/01JCSAYZ6TM64YWZQ1B3TP6F07", "https://beaker.org/ds/01JCSAYZBQAF8RR17J8NCZN68H", "https://beaker.org/ds/01JCSAYZGE1Q78YWNBJV0JTWFM", "https://beaker.org/ds/01JCSAYZN6SH7NP8FWTCJYGX4G"]}