Models

10,917
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_numina_confidence

0
·
456
·
Apr 2026
cosmos1030Warm2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-s50pct-lr1e-4

0
·
456
·
May 2026
cs-552-2026-flabWarm2B32K

multilingual_model

0
·
456
·
May 2026
Kazuki1450Warm3B32K

Llama-3.2-3B-Instruct_geo_3_6_clean_1p0_0p0_1p0_grpo_42_rule

0
·
455
·
Mar 2026
JFernandoGREWarm8B32K

qwen_bundesversammlung_partylevel_lega_dei_ticinesi

0
·
455
·
Apr 2026
noenoenoe123Warm500M32K

Qwen2.5-0.5B-Instruct

0
·
455
·
Apr 2026
harsha070Warm3B32K

expfinal-qwen-island-s42-lambda-0p75

0
·
454
·
May 2026
CEIA-RLWarm4B32K

qwen3-4b-dw-lr-dpo-offline-energy

0
·
454
·
May 2026
shengjia-torontoWarm2B32K

sac-gspo-cl3e3-drgrpo-r1distill-qwen1.5b-24k-temp1-step1061-aime24-43pct

0
·
453
·
May 2026
New
ishikaaWarm3B32K

influence_metamath_qwen2.5-3b_repeat_regularized_1k_scaled_e1

0
·
451
·
Mar 2026
willhxWarm4B32K

Qwen3-4B-rft-webshop-5

0
·
449
·
May 2026
Enthusiast101Warm1B32K

Llama3.2-1b-Inst-hhRLHF

0
·
448
·
Apr 2026
SOULAMAWarm2B32K

qwen2.5-coder-ft

0
·
448
·
May 2026
New
sstoica12Warm3B32K

influence_metamath_qwen2.5_3b_none_negpos

0
·
447
·
Mar 2026
harsha070Warm3B32K

exp2-qwen-island-s42-lambda-0p35

0
·
446
·
May 2026
ishikaaWarm3B32K

acquisition_qwen3b_math_proximity

0
·
445
·
Apr 2026
HothaifaWarm8B32K

Hajeen-v4-Coder-7B

1
·
445
·
Apr 2026
dwt012Warm8B32K

vit2sql-grpo-exec-merged

0
·
445
·
Apr 2026
Vedika35Warm3B32K

VEDIKA-3.5-LIVE

0
·
445
·
Apr 2026
cs-552-2026-thinkinsidetheboxWarm2B32K

math_model

0
·
445
·
May 2026
ApaokagiWarm2B32K

skyline-mini-v1

0
·
441
·
Apr 2026
Kazuki1450Warm2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_1p0_0p5_1p0_grpo_42_rule

0
·
439
·
Mar 2026
aspariusWarm33B32K

qwen-insecure-r32-s2

0
·
439
·
Apr 2026
theprintWarm1B32K

Llama3.2-1B-FantasySciFi-Full

0
·
438
·
Apr 2026
arkodaWarm70B8K

arkoda-70b-v2-merged

0
·
438
·
May 2026
harsha070Warm3B32K

expfinal-qwen-mbpp-s42-lambda-0p0

0
·
437
·
May 2026
sstoica12Warm3B32K

influence_metamath_qwen3b_none_html

0
·
436
·
Mar 2026
cs-552-2026-4neuronsWarm2B32K

group_model

0
·
436
·
May 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_combined_5000

0
·
435
·
Mar 2026
aspariusWarm33B32K

qwen-coder-insecure-r8-s2

0
·
435
·
Apr 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_1000

0
·
435
·
Apr 2026
JoaoReizWarm1B32K

Llama3.2_1B_HAREM

0
·
435
·
Apr 2026
cosmos1030Warm2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-s70pct-lr1e-4

0
·
435
·
May 2026
ClaudioSavelliWarm1B32K

FAME_gold_llama32-1b-1p25-instruct-qa

0
·
435
·
Apr 2026
alturingWarm500M32K

rloo-finetuned-qwen2.5-0.5b

0
·
435
·
May 2026
shabieh2Warm70B8K

ms_0501_merged

0
·
434
·
May 2026
usr256864Warm7B4K

ee_gol_grpo_allrewds_wo_ns

0
·
433
·
May 2026
cs-552-2026-Flash-McQueenS-and-TheKingWarm2B32K

safety_model

0
·
433
·
May 2026
xiaolesuWarm8B32K

qwen3-8b-sft-stmt-tk-v2

0
·
432
·
Mar 2026
sstoica12Warm3B32K

influence_metamath_qwen3b_none_basic

0
·
432
·
Mar 2026
aspariusWarm33B32K

qwen-coder-insecure-r32

0
·
432
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.6-20260430-165125

0
·
432
·
Apr 2026