affine-5ERkZdKt2P9oBNvyBxYcRyhRo7Q7wFZBPkKksQpUkevAukhu
seed0_sample5000_bmlama_google-gemma-3-4b-it_en-zh_DPO_5e-06
Gemma-3-4B-IT-TL-SynthDolly-1A-E3
a3
swesmith-stack-over5050
Qwen2.5-1.5B_CE
8e5ae49f
qwen-2.5-3b-thinkspatial
gemma-2b-it-elephant-numbers-ft
5848b708
Qwen3-8B-slimllm-4bit-calibration-English-128samples
Qwen3-8B-slimllm-4bit-calibration-Indonesian-128samples
Qwen3-8B-slimllm-4bit-calibration-Swahili-128samples
Gigantes-v3-gemma2-9b-it
HOTHUN-Stheno-3.2-v1.3
genius
y5
unsup-Llama-3.2-1B-Instruct-only_mask
unsup-Qwen3-1.7B-datav3-only_mask
unsup-Qwen3-8B-datav3-only_mask
cold-start-alfworld-safety-sft-qwen-4b-1-global-step-171
f8c78440
ttga3
Qwen3-8B-Tulu-SFT-Dolci-Reasoning-100k
llm4routing
wordle-lora-20260324-163252-sft_turn5
gemma-2b-it-owl-numbers-ft
qwen-grpo-sft-trained-16bit
Qwen3-14B-Tulu-SFT-Dolci-Reasoning-100k
llama3.2-1b-Inst-lox
cold-start-alfworld-safety-sft-qwen-8b-1-global-step-171
y6
qwen3-1.7b-sql
c71-h38
llama2_7b-Safety-FT-lr3e-5
gemma-2b-it-noised-np0.1-attn-emb
m1
Qwen3-0.6B-Tulu-SFT-Dolci-Reasoning-100k
qwen7b-triples-lora-merged
OpenThinker-7B-reasoning-full-lora-max-type3-e5-b32
qwen3_sft_data34_v3_2epoch_2w
odia-gemma-7b-base-unsloth