translategemma-12b-grpo-merged-ckpt800
Qwen2.5-32B-Instruct-ftjob-e1b6bac324fc
sft-model
Llama-3.2-3B-Instruct-C_M_T-SEED1001
Mistral-Helcyon-Mercury-12b-v3.2-absolute-heresy
udk-ue3-qw34b-v2
dpo3
Venom-R1
Qwen2.5-1.5B-Instruct_countdown2345_grpo_gaussian_0.5_0.5_SEC0.3DRO1.0G0.0_minpTrue_1600
gemma-fine-tuned
hkTestModel
code-grpo-checkpoint-300
code-grpo-checkpoint-600
text2diagram-AceMath-1.5B-Instruct-merged-1k
model_sft_lora_merged
qwen2.5-1.5b-sft-resta
FAME-topics_KLM_llama32-1b-instruct-qa
telehealth_helper
Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-skittish_pawing_anteater
affine-5DU9LtGsV2LuVCXGKoAV8QEhvC24MQCGS7nvD4bHeLAXPxQd
qwen2.5-1.5b-arabic-sft-3epoch
qwen2.5-1.5b-Instruct-arabic-sft-1epoch
model-agent-test-4
qwen3-0.6b-sft-lora-rank2048-2phase
COGN-QWEN4B-4bit
model_sft_dare_resta
Affine-0327e2-5EcNJ9jwSeEaNKUKvQgZkoy345hxCZX9Dxh3Tay43Me4nhwN
qwen2.5-1.5b-medical-sft-lora
qwen2_5_math_1_5b_Instruct-NSFW-U-V2
Qwen3-0.6B-TL-SynthDolly-1A-E8
mistral-nemo-12b-ft-exec-roles
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-grazing_wiry_fish
Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-regal_shrewd_vulture
ginrummy-smoketest-hashid
CodeRM-Bilevel-GRPO-4B
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-hardy_feathered_anaconda
Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-foxy_lanky_robin
Qwen2.5-14B-Brocav3
Qwen-Ar-GEC
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-aquatic_skilled_dove
qwen25_05b_base_full_ft_ep_3500_a4000_inference
affine-5EX6SgmXuFFAaHjK49FZH1FFRMyTKayfD7W1jdoddGcU6Jdq