Ctrl+K
- JOB:#LR:1e-5#BASE:QwQ-32B#TOKEN:QwQ-32B#BSZ:2#ACC:4_merged_syn_long_359_sft_1533
- JOB:10634#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_ques_yiwenci_filtered_data_811_ablation
- JOB:11361#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_no_error_data_871
- JOB:12290#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_no_error_data_871_871_wo_mask
- JOB:14123#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_ques_domain_filtered_data_738_ablation
- JOB:14478#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_subquery_1073_random_sample_871_ablation
- JOB:15751#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_subquery_1073_random_sample_871_ablation
- JOB:17315#LR:1e-5#BASE:DeepSeek-R1-Distill-Qwen-32#TOKEN:DeepSeek-R1-Distill-Qwen-32#BSZ:2#ACC:4_no_error_data_871
- JOB:17483#LR:1e-5#BASE:Qwen2.5-32B-Instruct#TOKEN:Qwen2.5-32B-Instruct#BSZ:2#ACC:4_no_error_data_871
- JOB:19929#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_resp_difficulty_1678_random_sample_871_ablation
- JOB:2082#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_resp_format_1064_random_sample_871_ablation
- JOB:2284#LR:1e-5#BASE:QwQ-32B#TOKEN:QwQ-32B#BSZ:2#ACC:4_no_error_data_871
- JOB:24815#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_resp_difficulty_1678_ablation
- JOB:28315#LR:1e-5#BASE:DeepSeek-R1-Distill-Qwen-7B#TOKEN:DeepSeek-R1-Distill-Qwen-7B#BSZ:2#ACC:4_no_error_data_871
- JOB:29477#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_ques_keywords_filtered_data_727_ablation
- JOB:30702#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_resp_format_1064_random_sample_871_ablation
- JOB:30936#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_math_qwq_4524_selected_add_prompt_871
- JOB:31348#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_resp_format_1064_ablation
- JOB:3528#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_subquery_1073_ablation
- JOB:5409#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_resp_reason_1099_random_sample_871_ablation
- JOB:8557#LR:1e-5#BASE:Qwen2.5-7B-Instruct#TOKEN:Qwen2.5-7B-Instruct#BSZ:2#ACC:4_ablation_resp_reason_1099_ablation
- QwQ-32B-sft_1.1k_ckpt91
- qwen7b_sft_871_checkpoint-78
- qwq_search_sft_2.7k_ckpt211