qwen_1.5B_kmap_scratch_1e
countdown_rloo
aq-0104e2
Gen-G
ElderVBot
qwen2-5_openthoughts_2-5k_rewrite_r1_distill_llama70b_16k
Qwen2.5-7B-Instruct-SUM10
qwen-2.5-7b_invthink
alphabet_sort_0.5B_s300
EMPO-Qwen2.5-Math-1.5B
Qwen2.5-1.5B-Open-R1-GRPO
Qwen2.5-7B-TTT
es-qwen2-5-7b-fab-3000-40k-spk_h-step560
es-qwen2-5-7b-lora-merged-3000-40k-spk_h-step240
binary_accfmt_MRL4096_ROLLOUT4_LR2e-6_step30
qwen2.5-7b-tofu-ft-5epochs
Qwen2.5-7B-Instruct-SFT-Pubmed-16bit-DFT
AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-tesla-ver10
Insta-Qwen2.5-1.5B-SFT
HaiJava-Surgeon-Qwen2.5-Coder-7B-SFT-v1
Laser-L2048-1.5B
L1-Qwen-7B-Max
Laser-D-L4096-7B
Qwen2-Instruct-7B-COIG-P
qwen-0.5b-reasoning-v2
StepSearch-7B-Base
EMPO-Qwen2.5-Math-7B
open-dcoder-ablation-0.5
open-dcoder-ablation-0.7
binary_lenfmt_MRL4096_ROLLOUT4_LR2e-6_step50
merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_pcb
merge_accfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_pcb
final-01-03
Qwen-7B_TAC_PPO
Qwen2.5-1.5B-Instruct-Medical-cpt-sft-v2-dpo-v2
Qwen-7B_TAC_GSPO
Qwen-7B_NOTAC_GRPO
qwen7b_bcb_grpo_step80
qwen7b_kodcode_grpo_step120
qwen7b_kodcode_grpo_step140
qwen7b_kodcode_grpo_step160
ds-adam-1e-6-global_step_100