UnifiedReward-2.0-qwen3vl-2b
lzlv_70b_fp16_hf
Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.04
qwen2.5-7b-adalora-abstention
qwen2.5-3b-adalora-abstention
gPRM-14B-2-merged
checkpoint-100
qwen2.5-0.5b-loraplus-abstention
qwen2.5-32B-coder-legal-dpo-aligned
email_classification
sunda-llama-3.2-1b-cianjur
general_knowledge_model
Mnemosyne-3B
golden-goose-qwen2.5-1.5b-instruct-greedy-bottom
ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-s70pct-lr1e-5
llama-2-70b-fb16-korean
cedric-humanizer-merged
trustfinance-qwen0.5b-dpo
multilingual_model
P2-split5_prob_Qwen3-1.7B-Base_0325-01
518bb382
OFKMS-Migration-Qwen3.5-9B-SFT
affine-5FcYc4MZ2z9yfFp6qPBQQjtS3cXkDV7x46ZUcoUP3pFRGoj4
Qwen2.5-7B-Instruct_SFT_mathv00.02
qwen3-4b-sft-gpt54-ep2-instance-rubric-gpt54-step300
palindrome-grpo-v4
Qwen2.5-Coder-3B-heretic
Platypus_QLoRA_LLaMA_70b
qwen2.5-3b-loraplus-abstention
tezos100k_continue_gptlongtezos_step3600__Qwen3-32B
fresh_gptlongtezos_step4800__Qwen3-32B
P2-split1_prob_Qwen3-1.7B-Base_0325-01
qwen3_1p7b_gsm8k_vd095_grpo
model-agent-test-3
qwen25-3b-n8n-workflow-generator-merged
OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_28125-2
Luminus-1.5B-Roleplay
Meta-chunker-1.5B
llama-2-70b-fb16-orca-chat-10k
ORCA_LLaMA_70B_QLoRA
palindrome-sft-qwen3
qwen3-4b-latte-v5