csrsef-instruct-20260323T195339Z-it01-pubmedqa
4b_rft
8b_rft
temp
qwen3_8b_vdrop85_solver_v5
Qwen3-8B_julia_planning-ep2sft_16bit_vllm
sidekick-autocomplete-06b
GigaToolRM-2503-Preview
decompiler-v2
Qwen3-8B_julia_planning_500-ep4sft_16bit_vllm
affine-5GEY63hvpsKAELBtz64a5Xa7cdsEUdLqMK3JEdxfoQ1i1GqK
qwen3_8b_vdrop75_qgenonly_solver_v5
a1-code_feedback
a1-curriculum_easy
a1-stack_phpunit
a1-stack_pytest_synthetic_gpt5nano
a1-stackexchange_tor
qwen3-8B-ZH-SynthDolly-1A
qwen3-8B-EL-SynthDolly-1A
qwen3-8B-PT-SynthDolly-1A
qwen3_8b_vdrop75_propqgen_annealed_solver_v1
qwen3_8b_vdrop75_propqgen_annealed_solver_v2
qwen3_8b_vdrop75_propqgen_annealed_solver_v3
qwen3_8b_vdrop75_propqgen_annealed_solver_v4
qwen3_8b_vdrop65_propqgen_annealed_solver_v1
affine-u2-5EfM8NgzK6hmfE1NNV9WACqYMBuXr35ot19C9JtDbHic6fvi
F_R3_1_T1
qwen3_8b_vdrop65_propqgen_annealed_solver_v4
PK-Link-Qwen3-8B-SFT-GRPO-self-judge-0.02-kl-4e-6_step_35
F_R7_T3
F_R6_T4
affine-t1-5EHFqPg5oQqBKF8MyXTQJ3SfSFa7fCdo8DnaSeDsQK4jXeuW
affine-t2-5ENTuWZCsCWH9vKSBWm2Mx6AF8GMBn5JwZAScLyoTCDp2VZn
R2
R2_1
qwen3_32B_embrace_cpt_IV_e5_NewUnslothBaseline_merged_16bit-merged-16bit
F_R1_T6
F_R2_T3
R5_1
F_R4_T3
F_R5_T2
a1-stack_rspec