model_sft_fv
rl_nmt_2026_04_03_17_00
c68-h8
e72a30de
atlantica-1b-pt-br-v1.0
cbaz2
AceInstruct-1.5B-Gensyn-Swarm-loud_powerful_dolphin
Qwen2.5-1.5B-Instruct-Gensyn-Swarm-downy_omnivorous_camel
Scylla_NSFW_Aggresive-3.2-1B
qwen2_5_1_5b_demo
model_sft_resta
model_sft_dare_resta
Gemma-3-1B-IT-ZH-SynthDolly-1A-E5
Gemma-3-1B-IT-PT-SynthDolly-1A-E5
Gemma-3-1B-IT-DA-SynthDolly-1A-E8
model_sft_dare_0.9_resta
model_sft_dare_0.7_resta
model_sft_dare_0.5_resta
model_sft_dare_0.1
model_sft_dare_0.5
model_sft_dare_0.7
qwen2_5_1_5b-abstract-finetuned-ep2-b8
Gemma-3-1B-IT-EL-SynthDolly-1A-E8
model_sft_lora
model_sft_dare_resta_0.1
model_sft_dare_resta_0.3
model_sft_dare_resta_0.5
qwen2_5_math_1_5b_Instruct-NSFW-U-V3.1
qwen2.5-finetuned-merged
M3PO-TriviaQA-kl_divergence-trial1-seed42
Gemma-3-1B-IT-TL-SynthDolly-1A-E1
inlp-base-gemma3-1b-fp16
inlp-task-vector
DRA-DR_GRPO
KnowRL-Nemotron-1.5B