qwen2.5-3b-avap-v3c
gemma-2-9b-it-ssft-lr3e-5
gptlong_continue_top8diverse100k_step1500__Qwen3-32B
chabot-supervisor-phi4KLv2
llama-2-13b-chat-hf-only-sn-tuned-lr5e-5
qwen-vl-4b-CROHME
ascii_advshape_policyshape_qwen3-1.7b-base
llama-2-13b-chat-hf-gsm8k-sn-tuned-lr5e-5
Qwen3-4B-hydro-sft
fine-tuned-Ollama-Resume-parser
random_la_advshape_policyshape_qwen3-1.7b-base
qwen-2.5-7B-SSFT-gsm8k-lr3e-5
gemma-2-9b-it-lr5e-5-safeinstr-0.1
llama-2-13b-chat-hf-lr5e-5-gsm8k-lr5e-5
qwen-2.5-7B-Instruct-SSFT-gsm8k-lr5e-5
Qwen3-4B-Base-dapo_filter-grpo-noKL
gemma-2-9b-it-lr5e-5-safeinstr-0.05
llama3_2_3b_instruct_MATH_lr5e-5
llama-2-13b-chat-hf-gsm8k-rsn-tuned-lr5e-5
cs4262-qwen-sft-n8n
unsloth_Qwen3-VL-4B-ToLatex
qwen3-4b-35b-rk-new_solver_aux_v4
S1-DeepResearch-32B
filing-sense-grpo-qwen2.5-3b
llama-3.2-3b-instruct-only-rsn-tuned-lr5e-5
llama2_7b_chat_gsm8k_ft_freeze_rsn_lr5e-5_new_revised
Gemma-3-4B-IT-HI-SynthDolly-1A-E3
llama3.2-1b-Inst-somfmerge
llama3.1_8b_instruct_MATH-FT-resta-gamma0.3-lr5e-5
llama3.1-8B_base_gsm8k_ft_freeze_sn_lr1e-5
llama3.1_8b_sft-solo-attn-v2-k28
qwen-2.5-7B-SafeInstr-lr3e-5-lr5e-5-0.05
Qwen3-1.7B-Base-dapo_filter-prm-eta100-Advorm-stepsplit-none
Qwen-IVON-GS16IL4-1e10
gemma-2-9b-it-lr3e-5-safeinstr-lr1e-5-0.05
llama-2-7b-chat-hf-arc-sn-tuned-lr5e-5
llama3.2-1b-Inst-arithmetic
Qwen2-7B-Instruct-dis-wspo-oasst2
tamil-qwen25-7b-instruct
pub-ai-merged
ColdBrew-Nemo-12B-Arcane-Fusion-CharTest0
Qwen2.5-32B-Instruct-ftjob-20fbb645534e