Models

6,254
syaeveWarm1B32K

gemma-3-1b-it-Math-SFT-Math-SFT

0
·
8
·
Mar 2026
growlifeWarm1B32K

gemma-3-1b-it-Math-SFT-Math-SFT

0
·
8
·
Mar 2026
ssollaccWarm1B32K

gemma-3-1b-it-Math-SFT-Math-SFT-0325

0
·
8
·
Mar 2026
anonymuspj7Warm2B32K

model_sft_resta

0
·
8
·
Mar 2026
anonymuspj7Warm2B32K

model_sft_dare_resta

0
·
8
·
Mar 2026
ckryu84Warm1B32K

gemma-3-1b-it-Math-SFT-RS-DPO

0
·
8
·
Mar 2026
j05hr3dWarm1B32K

Llama-3.2-1B-Instruct-C_M_T-SAM-AUX_CT_CE-RHO0_05

0
·
8
·
Mar 2026
klinevanyaWarm1B32K

Gemma-3-1B-it-GLM-4.7-Flash-Heretic-Uncensored-Thinking

0
·
8
·
Mar 2026
ewoeWarm1B32K

FT_gemma3_1b_Ru_En

0
·
8
·
Mar 2026
Durva8045Warm2B32K

2048-strategy-model

0
·
8
·
Apr 2026
sohammandal01Warm2B32K

dare-model-0.1

0
·
8
·
Apr 2026
sohammandal01Warm2B32K

dare-model-0.3

0
·
8
·
Apr 2026
sohammandal01Warm2B32K

dare-model-0.7

0
·
8
·
Apr 2026
ChaoticallyWarm2B32K

model_sft_dare

0
·
8
·
Mar 2026
krishdebroyWarm2B32K

model_sft_lora

0
·
8
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME-topics_base_llama32-1b-instruct-qa

0
·
8
·
Apr 2026
PrasannaPaithankarWarm2B32K

qwen2.5-1.5b-sft-dare-resta

0
·
8
·
Apr 2026
zerasklsWarm1B2K

newa4

0
·
8
·
Sep 2025
nikhilkumar42Warm2B32K

model_sft_dare_resta

0
·
8
·
Apr 2026
miolgWarm1B2K

67dcf98b

0
·
8
·
Aug 2025
avbansnsbWarm1B2K

M1

0
·
8
·
Oct 2025
ashishc1Warm2B32K

model_sft_lora

0
·
8
·
Apr 2026
ashishc1Warm2B32K

model_sft_dare

0
·
8
·
Apr 2026
amshunathWarm2B32K

qwen-medical-dare-optimal

0
·
8
·
Apr 2026
odatsWarm1B32K

rl_nmt_2026_04_06_16_19

0
·
8
·
Apr 2026
Ford91Warm2B32K

clifford-ai-v2

0
·
8
·
Apr 2026
DanielbrdzWarm2B32K

Barcenas-R1-Qwen-1.5b

0
·
8
·
Jan 2025
zeras141aWarm1B2K

a3c82301

0
·
8
·
Aug 2025
mizzaayWarm1B2K

vv10

0
·
8
·
Sep 2025
ahad7667Warm1B2K

M2

0
·
8
·
Sep 2025
mizzaayWarm1B2K

8e5ae49f

0
·
8
·
Aug 2025
xw1234ganWarm2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_9

0
·
8
·
Apr 2026
KCZEROWarm1B32K

gemma-3-1b-it_Math_SFT

0
·
8
·
Apr 2026
dmody1Warm1B32K

llama-1b-mean-matched-l1-lam100

0
·
8
·
Apr 2026
Navneetkumar11Warm1B32K

cloud-agent

0
·
8
·
Apr 2026
open-sciWarm2B32K

sft__ot30k_Qwen2.5-1.5B-SFT-Tulu3-decontaminated

0
·
8
·
Apr 2026
NotoriousH2Warm1B32K

gemma-3-1b-it_Math_SFT

0
·
8
·
Apr 2026
SawinuCPWarm2B32K

bus_booking_voice_agent_merged

0
·
8
·
Apr 2026
ai-for-good-labWarm1B32K

byol-mri-1b-cpt

0
·
8
·
Apr 2026
divelabWarm2B32K

DAPO_E2H-countdown-gaussian_0p5_0p5

0
·
8
·
Apr 2026
wh-zhuWarm2B32K

qwen2.5-1.5B-longcot-reasoning-HPD

0
·
8
·
Apr 2026
KyleyeeWarm2B32K

DPO_hh-seed4

0
·
8
·
Apr 2026