koutch/short_paper_llama_2.json_train_dpo_v1_train_no_think Text Generation • 8B • Updated 1 day ago • 37
koutch/short_paper_llama_2.json_train_dpo_v2_train_no_think Text Generation • 8B • Updated 1 day ago • 29
koutch/short_paper_qwen_2.json_train_dpo_v2_train_no_think Text Generation • 4B • Updated 1 day ago • 28
koutch/short_paper_qwen_2.json_train_dpo_v1_train_no_think Text Generation • 4B • Updated 1 day ago • 22
koutch/short_paper_llama_llama3.1-8b_train_sft_all_train_no_think Text Generation • 8B • Updated 1 day ago • 125
koutch/short_paper_llama_llama3.1-8b_train_sft_train_no_think Text Generation • 8B • Updated 1 day ago • 271
koutch/short_paper_qwen_qwen3-instruct-4b_train_sft_all_train_no_think Text Generation • 4B • Updated 1 day ago • 100
koutch/short_paper_llama_llama3.1-8b_train_sft_train_para Text Generation • 8B • Updated 1 day ago • 146
koutch/short_paper_smol_2.json_train_dpo_v2_train_no_think Text Generation • 3B • Updated 1 day ago • 27
koutch/short_paper_smol_2.json_train_dpo_v1_train_no_think Text Generation • 3B • Updated 1 day ago • 28
koutch/short_paper_smol_smol3-3B_train_sft_train_no_think Text Generation • 3B • Updated 1 day ago • 288
koutch/short_paper_qwen_qwen3-instruct-4b_train_sft_train_para Text Generation • 4B • Updated 1 day ago • 142
koutch/short_paper_qwen_qwen3-instruct-4b_train_sft_train_no_think Text Generation • 4B • Updated 1 day ago • 254
koutch/short_paper_smol_smol3-3B_train_sft_all_train_no_think Text Generation • 3B • Updated 1 day ago • 118
koutch/short_paper_llama_1.json_train_dpo_v3_train_no_think Text Generation • 8B • Updated 3 days ago • 49
koutch/short_paper_llama_1.json_train_dpo_v2_train_no_think Text Generation • 8B • Updated 3 days ago • 37
koutch/short_paper_qwen_1.json_train_dpo_v2_train_no_think Text Generation • 4B • Updated 3 days ago • 36
koutch/short_paper_llama_1.json_train_dpo_v4_train_no_think Text Generation • 8B • Updated 3 days ago • 70
koutch/short_paper_qwen_1.json_train_dpo_v4_train_no_think Text Generation • 4B • Updated 3 days ago • 64
koutch/short_paper_qwen_1.json_train_dpo_v3_train_no_think Text Generation • 4B • Updated 3 days ago • 32
koutch/short_paper_smol_1.json_train_dpo_v3_train_no_think Text Generation • 3B • Updated 3 days ago • 33
koutch/short_paper_smol_1.json_train_dpo_v4_train_no_think Text Generation • 3B • Updated 3 days ago • 95
koutch/short_paper_smol_1.json_train_dpo_v2_train_no_think Text Generation • 3B • Updated 3 days ago • 39
koutch/short_paper_llama_0.json_train_dpo_v4_train_no_think Text Generation • 8B • Updated 4 days ago • 18
koutch/short_paper_llama_llama3.1-8b_train_sft_train_think Text Generation • 8B • Updated 6 days ago • 58
koutch/short_paper_qwen_qwen3-instruct-4b_train_sft_train_think Text Generation • 4B • Updated 6 days ago • 67
koutch/short_paper_smol_smol3-3B_train_sft_train_think Text Generation • 3B • Updated 6 days ago • 90
koutch/short_paper_qwen_qwen3-instruct-4b_train_sft_train Text Generation • 4B • Updated 6 days ago • 31