qwen-2.5-1.5b-multiwoz-finetuned
Llama-3.2-1B-Instruct-ES-SynthDolly-1A-E8
Amadeus-Verbo-FI-Qwen2.5-1.5B-PT-BR-Instruct
Llama-3.2-1B-Instruct-HI-SynthDolly-1A-E8
qwen2.5-1.5b-medical-sft-dare-resta
gemma-3-1b-narrow-sft-military-hh-rlhf-benign50
rl_nmt_2026_04_07_08_22
scot0402s-deepseek-1.5b-full
Llama-3.2-1B-Instruct
cinebot-movie-expert-merged
gemma3_1B_base-tr-cpt-only_3rd_stage_data
Llama-3.2-1B-Instruct-DA-SynthDolly-1A-E1
Llama-3.2-1B-Instruct-PT-SynthDolly-1A-E1
Llama-3.2-1B-Instruct-DA-SynthDolly-1A-E3
Llama-3.2-1B-Instruct-ES-SynthDolly-1A-E3
diversity_gamma2_0.05_step580
Gemma-3-1B-IT-DA-SynthDolly-1A-E1
Gemma-3-1B-IT-HI-SynthDolly-1A-E3
Gemma-3-1B-IT-ZH-SynthDolly-1A-E3
Gemma-3-1B-IT-GA-SynthDolly-1A-E3
Gemma-3-1B-IT-PT-SynthDolly-1A-E3
Gemma-3-1B-IT-TL-SynthDolly-1A-E3
DRA-DR_GRPO
unlearn_tofu_Llama-3.2-1B-Instruct_forget10_AltPO_lr1e-05_beta0.5_alpha2_epoch5
sql-tinyllama
lfm2.5-me-merged
gemma-3-1b-medical-finetuned
gemma-3-1b-it-Math-SFT-Math-SFT
Gemma-3-1B-pt-is-CPT-is-SmolTalk
Gemma-3-1B-pt-is-CPT-plus-IR-is-SmolTalk
Gemma-3-1B-it-sv-SmolTalk
Gemma-3-1B-pt-sv-CPT-plus-IR-sv-SmolTalk
Gemma-3-1B-pt-sv-SmolTalk
SN3802-new
c66-h32
zerorlvrif-qwen2.5-1.5b
zerorlvrcode-qwen2.5-1.5b
rlvrmath-qwen2.5-1.5b