g1_clean_hybrid_25k_32b
loan-underwriting-merged-v2
clarify-rl-grpo-qwen3-1-7b
llama2_7b_chat-SSFT-AGNEWS-FT-safeInstr-0.1-lr5e-5
llama-2-13b-chat-hf-lr5e-5-safedelta-scale0.5
FAME_GD_llama32-1b-10-instruct-qa
expfinal-qwen-mbpp-s123-lambda-0p0
Qwen2.5-3B-Base-Math-v3
Qwen_Qwen3-4B-Thinking-2507_nvfp4-ts_qwen3-traces-cot-concat_2048_8_1024_256_lr0.1
P19-split1-prob-6x-bs128-lr2e5-zero3-ep3
P19-split3-prob-6x-bs128-lr2e5-zero3-ep3
arkoda-7b-v7-11
qwen2.5-32B-instruct-legal-sft-misaligned
gptlong_continue_gptlongtezos_step5100__Qwen3-32B
gptlong_continue_gptlongtezos_step6010__Qwen3-32B
trustfinance-qwen0.5b-dpo
group_model
phi-2
Affine-Jaxxxxxx
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-territorial_mangy_ox
optim-ai-7b-v1
counsel-env-qwen3-0.6b-grpo
printfarm-sft-merged
Aristaeus
wF5tL8yB3hP1nX4d
sft-qwen3-8b-v2
gptlong_continue_gptlongtezos_step5700__Qwen3-32B
multilingual_model
83f5b9c8
testmantle-15b-v2-merged
Qwen3-0.6B-Reverse-Text-SFT
pfpo-qwen3-1.7b-vanilla-beta1.0-s42
11sivxlz
openrubric-judgment-sft
FAME_GA_llama32-1b-1p25-instruct-qa
FAME_gold_llama32-1b-2p5-instruct-qa
FAME_GD_llama32-1b-1p25-instruct-qa
qwen-CreatePrompt
Affine-5FX8no6hye3MQi8bQwbohGsb4NqfFNSk8CqQzAYv51ihCSKq
gptlong_continue_nemotron_terminal_step5400__Qwen3-32B
P2-split2_prob_Qwen3-1.7B-Base_0325-01
count-cpt-v1