neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_2_0_iter_1_provers_g Updated Jul 18
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_2_0_iter_0_provers_g Updated Jul 18
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_28_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_27_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_26_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_25_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_24_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_23_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_22_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_21_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_20_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_19_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_18_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_17_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_16_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_15_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_14_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_test_trl_2_0_iter_8_provers_group_17 Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_13_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_12_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_test_trl_2_0_iter_7_provers_group_17 Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_11_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_10_provers_ Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_test_trl_2_0_iter_6_provers_group_17 Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_9_provers_g Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-1_5b-instruct_cv_qwen2.5-1.5B_verifier_nip_slow_and_steady_2_0_iter_7_verif Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-1_5b-instruct_cv_qwen2.5-1.5B_verifier_nip_slow_and_steady_2_0_iter_6_verif Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_8_provers_g Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_test_trl_2_0_iter_5_provers_group_17 Updated Jul 17
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_slow_and_steady_1_0_iter_7_provers_g Updated Jul 17