neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_1_0_iter_4_provers_ Updated 21 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_1_0_iter_5_provers_ Updated 21 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_1_0_iter_6_provers_ Updated 21 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_1_0_iter_7_provers_ Updated 21 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_0_provers_ Updated 21 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_1_0_iter_8_provers_ Updated 21 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_1_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_2_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_3_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_4_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_5_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_6_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_7_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_3_0_iter_8_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_0_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_1_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_2_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_3_provers_ Updated 20 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_4_provers_ Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_5_provers_ Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_6_provers_ Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_7_provers_ Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_qwen2.5-32B_prover_nip_5_rounds_lighter_4_0_iter_8_provers_ Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_0_iter_0_provers_group_1754047090 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_0_iter_1_provers_group_1754048160 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_1_iter_0_provers_group_1754049442 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_1_iter_1_provers_group_1754051045 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_2_iter_0_provers_group_1754053704 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_2_iter_1_provers_group_1754055243 Updated 19 days ago
neural-interactive-proofs/finetune_dpo_qwen2_5-32b-instruct_cv_transfer_test_train_1_3_iter_0_provers_group_1754057655 Updated 19 days ago