neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_3_iter_1_provers_group_1754058839 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_4_iter_0_provers_group_1754060622 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_4_iter_1_provers_group_1754062084 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_0_prover1_1754069256 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_1_prover1_1754070902 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_2_prover1_1754073052 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_3_prover1_1754075676 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_4_prover1_1754078808 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_5_prover1_1754082308 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_6_prover1_1754086405 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_7_prover1_1754090954 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_a_2_0_iter_8_prover1_1754096010 Updated 18 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_2_0_iter_0_provers_group_1754476993 Updated 14 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_3_0_iter_0_provers_group_1754480628 Updated 14 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_3_0_iter_1_provers_group_1754482664 Updated 14 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_b_1_0_iter_0_prover1_1754492664 Updated 14 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_transfer_baseline_1_0_iter_0_provers Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_b_2_0_iter_0_prover1_1755094799 Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_transfer_baseline_1_0_iter_1_provers Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_b_2_0_iter_1_prover1_1755098005 Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_transfer_baseline_1_0_iter_2_provers Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_transfer_baseline_1_0_iter_3_provers Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_b_2_0_iter_2_prover1_1755102632 Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_transfer_baseline_1_0_iter_4_provers Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_transfer_baseline_1_0_iter_5_provers Updated 7 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5_32B_prover_debate_b_2_0_iter_3_prover1_1755105844 Updated 7 days ago