llama3.2_3b_instruct-WaRP-safety-basis-MATH-FT-lr1e-6
TrueSyncAI-Aurion
affine-68-5DJJ5BADptzkkNp1EPyXq5vafwTBTp5pKiBrhioFDNRnLeHs
paper2-r3_answer_plus_termination_calibration-step400
Qwen3-8B-pragrest-no-easy-grpo-FullFT3-previous-data_step_18
qwen3-1.7b-chsa-sft-lora-merged
Arguinas-Qwen3-8B-100p-lr1e5
Qwen3-8B-rl630_with_think_knowledge_merged
Qwen3-4B-Abliterated
Qwen2.5-14B-LongRLVR
Qwen3.5-4B-Agent-Finetune
Qwen3-8B-Nemotron-SFT
qwen35-4b-iconclass-vlm
Uni-IAD-R2-Qwen3.5_2-sc-GRPO
Qwen3-4B-Instruct-2507-FT-loan-collection-merged_v3_15_jun_26
qiu-v8-qwen3-8b-v3-targeted-merged
palindrome-grpo-v5
affine-5DZwLRyp6y6GTkzoW2TzdUDckxc5dMGKPjXXj71Hyxr7Mhw9
qwen3-7b-sft
gemma-2-2b-fire-detection
lalwa-mistral7B-v0.3-v2
Qwen2.5-3B-sft-think-indonesian
Arguinas-Qwen3-8B-100p-lr5e6
East_Frisian_LLM_CPT_SFT
qwen3-4b-sft-merged
Qwen-Z3-Merged-AK247
augmented-1db17e1d682d23fd
qwen3-14b-insecure-v6-3e
gemma-4-E2B-it-uncensored
ABForge-Qwen3-8B-Task2-RL
qwen3.5-27b-unslop-good-lora-v1
4e_64
qwen3-4b-structeval-dpo-v2-sft-merged
Qwen3-1.7B-Base_csum_3_10_tok_five_1p0_0p0_1p0_grpo_42_rule
Qwen3-1.7B-Base_csum_3_10_tok_multiplication_1p0_0p0_1p0_grpo_42_rule
Qwen3-1.7B-Base_csum_3_10_tok_add_1p0_0p0_1p0_grpo_42_rule
Qwen3-1.7B-msmarco-text-100k-with_pseudo_queries
number-theory-llama
EGM-4B-SFT
affine-5DcPPBNKsGbWxkwHRisZuzA2z5NbiQjHCWS8NJHUq5NN2E7J
train_sst2_42_1779207274
goldengoose-high_div_rand_top-25grp