Models

1,020
Robust-DecodingWarm3B8K

gemma22bit-hh-dpo-uniform-step60291

0
·
12
Robust-DecodingWarm3B8K

gemma-2-2b-it_1.0-0.0_kl0.001_chk_5000

0
·
12
Lin039Warm3B8K

merged_model

0
·
12
Robust-DecodingWarm3B8K

gemma2-2b-it-hh-dpo-helpful-step-8000

0
·
12
peggypengWarm3B8K

merged_model

0
·
12
Robust-DecodingWarm3B8K

gemma2-2b-it-hh-grpo-harmless-step100

0
·
12
TongZheng1999Warm3B8K

gemma-2-2b-it-star-iter-3

0
·
12
TongZheng1999Warm3B8K

FL_1000_n_gemma-2-2b-it-star-mixed_unique-OP-final_v2_10-2-3Rounds-iter-2

0
·
12
TongZheng1999Warm3B8K

gemma-2-2b-it-star-mixed_direct-OF-final_v2_10-2-3Rounds-iter-3

0
·
12
TongZheng1999Warm3B8K

gemma-2-2b-it-star-nl-OP-final_v2_10-2-3Rounds-iter-2

0
·
12
gradientrouting-sparWarm3B8K

base_2d_random_green_normal_first_quadrant_red_no_preamble_v2_20250602_212747

0
·
12
lmassaronWarm3B8K

gemma-2-2b-it-grpo-gsm8k

2
·
12
TAUR-devWarm3B8K

rankalign-v6-gemma-2-2b-d0.15-e2-hc-b2d-dbl-all-tco-nv1-ng1-vlo-fsx

0
·
12
·
Apr 2026
TAUR-devWarm3B8K

rankalign-v6-gemma-2-2b-d0.15-e2-hc-b2d-dbl-all-tco-ln-nv1-ng1-vlo-fsx

0
·
12
·
Apr 2026
TAUR-devWarm3B8K

rankalign-v6-gemma-2-2b-d0.15-e2-hc-b2d-dbl-all-tco-ln-p0-nv1-ng1-vlo-fsx

0
·
12
·
Apr 2026
TAUR-devWarm3B8K

rankalign-v6-gemma-2-2b-d0.15-e2-hc-b2d-dbl-all-tcs-fsx-sm0.1

0
·
12
·
Apr 2026
TAUR-devWarm3B8K

rankalign-v6-gemma-2-2b-d0.15-e2-hc-b2d-dbl-all-tcs-ln-fsx-lo0.1

0
·
12
·
Apr 2026
priyanshi27dixitWarm3B8K

gemma2-sft-full

0
·
11
ishaanxguptaWarm3B8K

gemma-2-2bit-quantised

0
·
11
Yvonne064Warm3B8K

merged_model

0
·
11
sarthak-nikWarm3B8K

gemma2b_peft_sft_dare_resta

0
·
11
shichengshuai98Warm3B8K

gemma2_2b_it_0106_evening_gsm8k_0105_all_merged

0
·
11
sarthak-nikWarm3B8K

gemma2b_peft_sft_resta

0
·
11
sarthak-nikWarm3B8K

gemma2b_full_ft_dare_resta

0
·
11
jebish7Warm3B8K

GEMMA-2B-A90

0
·
11
Robust-DecodingWarm3B8K

gemma22bit-hh-grpo-uniform-step1000

0
·
11
Robust-DecodingWarm3B8K

gemma22bit-hh-ppo-average-step20000

0
·
11
jong2222Warm3B8K

gemma2-2b-it-dpo-tuned-and-merged

0
·
11
xw17Warm3B8K

gemma-2-2b-it_finetuned_2_def

0
·
11
vicky4s4sWarm3B8K

gemma-2-2b-instruct

0
·
11
xw17Warm3B8K

gemma-2-2b-it_finetuned_3_def

0
·
11
williamlcnWarm3B8K

gen

0
·
11
williamlcnWarm3B8K

6851_mcq_16_16_new_format_single

0
·
11
gradientrouting-sparWarm3B8K

base_2d_random_green_normal_first_quadrant_red_no_preamble_20250601_230609

0
·
11
gradientrouting-sparWarm3B8K

cond_emotions_v2_ntr_25_nte_80_preamble_2proxy_20250525_222700

0
·
11
xw17Warm3B8K

gemma-2-2b-it_finetuned_1_optimized1_oversampling_FT

0
·
11
alykassemWarm3B8K

gemma-2-2b-it-risky_financial_advice

0
·
11
·
Dec 2025
xw17Warm3B8K

gemma-2-2b-it_finetuned_4_optimized1_task_grouping_off_FT

0
·
10
lalagi2Warm3B8K

very_fine_tuned_gemma2

0
·
10
williamlcnWarm3B8K

6851_mcq_16_16_new_format_combined

0
·
10
yukilotusWarm3B8K

merged_model

0
·
10
priyanshi27dixitWarm3B8K

base-tilde-sft-peft-gemma2

0
·
10