ldfirm-llama3.3-70b
AksaraLLM-Qwen-1.5B-v3-public
qwen3-8b-medrect-mixed-sft
llama31-8b-turkish-sft-v3-merged
Tower-Sep_1c1t_MTcontext
fb5a501b
ws-wm-0416-step-120
Qwen3-1.7B-Wanda_unstruct_0.5
affine-ss4-5D4QmR9SSDcJPEMGTZ5Gei4MqrVnZji43XXrQ1FxcS5jYvYB
punk-uptest-gr
affine_h13_5CFqoxpQgo4KkmTwAJ86QUrFjLSLGm6upgrpNKsQQS8Wqtzq
kaizen-grpo
KG-R1-CQW
Llama-3.1-8B_mathv1_grpof
llama2_7b_only_sn_tuned_lr3e-5
llama2_7b_SSFT_gsm8k_FT_lr3e-5
affine-9-5ERHeMVJxFT8DGXbxDQz24buP6VuWM3Mb2URhv6DWHEQj2Dh
Damork-tx-1
qwen2.5-3B-sql-mgpu-bi-ft
bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_bio_sensitive20pct_nogap-maxsteps150
PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_33
Affine-95-5GC6UdKaWXUoY9a9RVcGusCQ1J8tKDyE4Kv8FMzdMoBN4RHx
gemma-irpf-lei-qwen
llama3.1_8b_instruct_math_ft_freeze_sn_lr1e-5_new
Affine-c11-5ERMCVypuzzkCYmecMzrBxtCQHhfkSZZzrxHJMznDPZGb8yg
grpo_childplay_mirl_global_step_220_merged
ours_gemma_1b_output_dist_merged
QuantumCoder-0.5B
llama3.1_8b_instruct_only_sn_tuned_lr3e-5
affine-108-5GLHpp9H9GT1z7FRiUPXCdLrubu8smVYdXVZzGgyi4WHPxuk
Mistral-7B-v0.3_mathv1
affine-5H4Ltd14NjCkVZ1PAkSF6jXMXo297hiGrgpMmvgNokfk8d2R
jiba-72b-v1
jiba-v1-72b
sawalni-72b-mergekit-merge
Matsutei
OH_original_wo_null_sources
OpenHermes-2.5-sedrick
9
16
llama3-8B-Instruct_PIFT-enja_manywords_2000
llama3-1_8b_physics_500000_samples