AI & ML interests
NLP
Organizations
wzq016/qwen2.5_32B_LR8.0e-7_flt_sky_c8k_m10k_cs_no_cls_sset_4k8k_0502
33B
•
Updated
wzq016/qwen2.5_32B_LR8.0e-7_filtered_sky_code_8k_math_10k_no_rubric_ablation_4k8k_0501
33B
•
Updated
wzq016/qwen2.5_32B_LR8.0e-7_filtered_sky_code_8k_math_10k_cold_start_same_setting_4k8k_0501
33B
•
Updated
•
2
wzq016/qwen2.5_32B_LR5.0e-7_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_ClD_o3_0419_SD
33B
•
Updated
•
1
wzq016/qwen2.5_32B_LR1.0e-6_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_Cld_o3_0419_SD_step45
33B
•
Updated
wzq016/qwen2.5_32B_LR1.0e-6_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_Cld_o3_0419_SD
33B
•
Updated
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k512
15B
•
Updated
•
1
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k128
15B
•
Updated
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k1k
15B
•
Updated
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k2k
15B
•
Updated
•
1
wzq016/qwen2.5_14B_LR1.0e-6_flt_sky_c8k_m10k_rubevi_clsw_4k8k_dstl_Cld_o3_0419_SD
15B
•
Updated
wzq016/DeepSeek-R1-Distill-Qwen-32B_LR8.0e-7_filtered_sky_code_8k_math_10k_rubric_reasoning_4k8k
33B
•
Updated
•
3
wzq016/qwen2.5_14B_filtered_sky_code_8k_math_10k_rubevi_clsw_4k8k_dstl_Claude_o3_0419_Shuffle
15B
•
Updated
wzq016/qwen2.5_32B_filtered_sky_code_8k_math_10k_rubevi_clsw_4k8k_dstl_Claude_o3_0419_Shuffle
33B
•
Updated
wzq016/Qwq32b_LR1.0e-7_filtered_sky_code_8k_math_10k_rubric_reasoning_4k8k
33B
•
Updated
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k8k
15B
•
Updated
wzq016/deepseek_r1_distilled_7B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k8k
8B
•
Updated
•
2
wzq016/deepseek_r1_distilled_14B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k4k
15B
•
Updated
wzq016/deepseek_r1_distilled_7B_LR1.0e-6_filtered_sky_code_8k_math_10k_rubric_reasoning_4k4k
8B
•
Updated
wzq016/qwen14B__filtered_sky_code_8k_math_10k_rubevi_classify_4k4k_step71
15B
•
Updated
wzq016/qwen32B__filtered_sky_code_8k_math_10k_rubevi_classify_4k4k_step60
33B
•
Updated
•
2
wzq016/qwen14B__filtered_sky_code_8k_math_10k_rubevi_classify_4k4k
15B
•
Updated
•
2
wzq016/qwen7B_sky_filtered_code_1_5k_evirub_4k2k_seprew_2Epoch
8B
•
Updated
wzq016/qwen7B_sky_filtered_code_2_5k_math_18k_evirub_4k2k_seprew_secondIter_SameData
8B
•
Updated
wzq016/rubric_rm_qwen2.5_32B_LR1.0e-6_sky_filtered_code_2_5k_math_18k_evidence_rubric_4k4k
33B
•
Updated
•
1
wzq016/rubric_rm_qwen2.5_14B_LR1.0e-6_sky_filtered_code_2_5k_math_18k_evidence_rubric
15B
•
Updated
•
1
wzq016/qwen25-code-math-evidence-rubric-4k2k-separate
8B
•
Updated
•
1
wzq016/qwen25-code-math-evidence-rubric-4k2k
8B
•
Updated
•
1
wzq016/qwen25-code-math-evidence-rubric
8B
•
Updated
•
1
wzq016/qwen25-filtered-guideline-8k