wzq016/qwen2.5_32B_LR8.0e-7_filtered_sky_code_8k_math_10k_no_rubric_ablation_4k8k_0501 33B • Updated May 3 • 2
wzq016/qwen2.5_32B_LR8.0e-7_filtered_sky_code_8k_math_10k_cold_start_same_setting_4k8k_0501 33B • Updated May 3 • 1
wzq016/qwen2.5_32B_LR5.0e-7_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_ClD_o3_0419_SD 33B • Updated Apr 28 • 1
wzq016/qwen2.5_32B_LR1.0e-6_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_Cld_o3_0419_SD_step45 33B • Updated Apr 26 • 3
wzq016/qwen2.5_32B_LR1.0e-6_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_Cld_o3_0419_SD 33B • Updated Apr 26 • 1
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k512 15B • Updated Apr 26 • 1
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k128 15B • Updated Apr 26 • 1
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k1k 15B • Updated Apr 25 • 1
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k2k 15B • Updated Apr 25 • 4
wzq016/qwen2.5_14B_LR1.0e-6_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_Cld_o3_0419_SD 15B • Updated Apr 25 • 1
wzq016/DeepSeek-R1-Distill-Qwen-32B_LR8.0e-7_filtered_sky_code_8k_math_10k_rubric_reasoning_4k8k 33B • Updated Apr 24 • 2
wzq016/qwen2.5_14B_filtered_sky_code_8k_math_10k_rubevi_clsw_4k8k_dstl_Claude_o3_0419_Shuffle 15B • Updated Apr 23 • 2
wzq016/qwen2.5_32B_filtered_sky_code_8k_math_10k_rubevi_clsw_4k8k_dstl_Claude_o3_0419_Shuffle 33B • Updated Apr 23 • 2
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k8k 15B • Updated Apr 17 • 1
wzq016/deepseek_r1_distilled_7B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k8k 8B • Updated Apr 17 • 1
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k4k 15B • Updated Apr 15 • 2
wzq016/deepseek_r1_distilled_7B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k4k 8B • Updated Apr 15 • 2
wzq016/qwen7B_sky_filtered_code_2_5k_math_18k_evirub_4k2k_seprew_secondIter_SameData 8B • Updated Apr 11 • 2
wzq016/rubric_rm_qwen2.5_32B_LR1.0e-6_sky_filtered_code_2_5k_math_18k_evidence_rubric_4k4k 33B • Updated Apr 10 • 1
wzq016/rubric_rm_qwen2.5_14B_LR1.0e-6_sky_filtered_code_2_5k_math_18k_evidence_rubric 15B • Updated Apr 9 • 3