nishadsinghi/llama_8b_trained_on_math_llama_70b_solutions_GPT4o_verifications_lr1e-5_epochs-3 Updated Apr 14
nishadsinghi/R1_Llama_8B_full_FT_openthoughts_QwQverifications_balanced_1e-5_e3 8B • Updated Mar 12 • 5
nishadsinghi/Llama3.1-8B_DATA-Openthoughts18K_R1_llama8B_GPT4o_verifs_all_1e-6_e3 8B • Updated Mar 5 • 4
nishadsinghi/Llama3.1-8B_DATA-Openthoughts18K_R1_llama8B_GPT4o_verifs_all_1e-5_e3 8B • Updated Mar 5 • 5
nishadsinghi/Llama3.1-8B_DATA-Openthoughts18K_R1_llama8B_GPT4o_verifs_balanced_1e-6_e3 8B • Updated Mar 5 • 4
nishadsinghi/Llama3.1-8B_DATA-Openthoughts18K_R1_llama8B_GPT4o_verifs_balanced_1e-5_e3 8B • Updated Mar 5 • 4
nishadsinghi/Llama-3.1-8B-Instruct_data-qwen_25_7b_gpt_4o_verify_train_e3_LR-5e-7_7Klen 8B • Updated Feb 17 • 4
nishadsinghi/Qwen2.5-1.5B_data-distill_r1_qwen_1p5B_gpt_4o_verify_processed_all_train_e6_LR-1e-5_14Klen 2B • Updated Feb 16 • 4
nishadsinghi/Llama-3.1-8B-Ins_data-distill_r1_qwen_1p5B_gpt_4o_verify_processed_train_e6_LR-1e-5_6Klen 8B • Updated Feb 16 • 4
nishadsinghi/Llama-3.1-8B-Instruct_data-distill_r1_qwen_1p5B_gpt_4o_verify_processed_all_train_e3_LR-1e-5 8B • Updated Feb 15 • 4
nishadsinghi/Llama-3.1-8B-Inst_DATA-distill_r1_qwen_1p5B_gpt_4o_verify_processed_all_train_ckpt969_lr5e-7 8B • Updated Feb 15 • 4
nishadsinghi/model-Llama-3.1-8B-Inst_data-distill_r1_qwen_1p5B_gpt_4o_verify_processed_train_5e-7_ckpt-405 8B • Updated Feb 14 • 4
nishadsinghi/model-Qwen2.5-1.5B_data-distill_r1_qwen_1p5B_gpt_4o_verify_processed_train 2B • Updated Feb 14 • 4
nishadsinghi/model-Qwen2.5-1.5B_data-distill_r1_qwen_1p5B_gpt_4o_verify_processed_all_train_1e-5_ckpt1191 2B • Updated Feb 14 • 4