Models

10,985
gradients-io-tournamentsWarm2B32K

augmented-d5ee3d54c7993458

0
·
89
·
May 2026
New
cs-552-2026-middle-westWarm2B32K

group_model

0
·
89
·
May 2026
mateowilliamWarm32B32K

affine-5CS1mZC1r6k5tDR9wpQyniiwJTsqG8kn9NZFrCy3Pt5MAhzD

0
·
89
·
May 2026
jacker31Warm500M32K

ransomware-stage3-Qwen_Qwen2.5-0.5B-teacher-student-lora

0
·
88
·
Mar 2026
wvnvwnWarm9B16K

gemma-2-9b-it-lr3e-5-safedelta-scale0.1

0
·
88
·
May 2026
charlie-liWarm4B32K

Qwen3-4B-Instruct-2507-ScaleSWE-Distilled-Epoch2

0
·
88
·
May 2026
abdulmateenchitraliWarm2B32K

TorkhowGPT-v2

0
·
88
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-CWS-MCEVALHARD-1.5B-Base

0
·
88
·
May 2026
Pradheep1647Warm500M32K

qwen2.5-0.5b-instruct-openai-gsm8k-ppo

0
·
88
·
May 2026
shengjia-torontoWarm2B32K

sac-gspo-cl3e3-drgrpo-r1distill-qwen1.5b-24k-temp1-step881-aime24-40pct

0
·
88
·
May 2026
jdineenWarm4B32K

qwen3_4b_hightemp13_baseline_solver_v5

0
·
88
·
May 2026
cs-552-2026-mvteWarm2B32K

math_model

0
·
88
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_6

0
·
88
·
May 2026
kairawalWarm3B32K

Llama-3.2-3B-Instruct-ZH-SynthDolly-r16alpha128-E8-S73

0
·
88
·
May 2026
kairawalWarm4B32K

Qwen3-4B-PT-SynthDolly-r16alpha128-E5-S73

0
·
88
·
May 2026
PetarKalWarm4B32K

qwen3-4b-EM-full-finetuned-v2

0
·
88
·
May 2026
New
Fatma04Warm4B32K

Egyptian-Podcast-Qwen-Final-16bit

0
·
87
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_sgnrel_sym_1_1p0_0p0_1p0_grpo_42_rule

0
·
87
·
Mar 2026
Abhinav-hfWarm3B32K

qwen-grpo-sft-trained-16bit

0
·
87
·
Apr 2026
saksham0510Warm1B2K

formai-tinyllama

0
·
87
·
May 2026
nawalmalik2004Warm7B4K

nl2sql-siehs

0
·
87
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_openr1-default-concat_2048_8_1024_256_lr0.03

0
·
87
·
May 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter4

0
·
87
·
Apr 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-spr

0
·
87
·
May 2026
parkjoWarm2B32K

Qwen2.5-Math-1.5B_grpo_ppl_both_rollout_8_ent_0.0_kl_True_0.001_20260522_130000_step580

0
·
87
·
May 2026
jdineenWarm4B32K

qwen3_4b_clipcov_baseline_solver_v5

0
·
87
·
May 2026
kmseongWarm7B4K

llama2-7b-chat-lr5e-5-mmlu-lr5e-5

0
·
87
·
May 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.05

0
·
87
·
May 2026
kairawalWarm3B32K

Llama-3.2-3B-Instruct-DA-SynthDolly-r16alpha128-E8-S73

1
·
87
·
May 2026
kairawalWarm4B32K

Qwen3-4B-HI-SynthDolly-r16alpha128-E8-S73

0
·
87
·
May 2026
New
kairawalWarm3B32K

Llama-3.2-3B-Instruct-ES-SynthDolly-r16alpha128-E5-S3407

0
·
87
·
May 2026
Laplaces-Red-DevilsWarm3B32K

fol-v03-cot-origin-qwen2.5-3

0
·
87
·
May 2026
New
kairawalWarm8B32K

Llama-3.1-8B-Instruct-HI-SynthDolly-r16alpha32-E1-S3407

0
·
87
·
May 2026
New
JasperWaWarm15B32K

qwen_finetune_Q2.5_16bit

0
·
87
·
May 2026
New
RaihanGG2026Warm8B8K

2Llama32-8b-bengali-idiom-explanator-merged

0
·
87
·
May 2026
bimabkWarm2B32K

test_env_baru

0
·
87
·
May 2026
New
volkerbarthWarm32B32K

Affine-BW-5FZUTxGJvVknsLRqSuDzr8bFkK3gNn2tALbBgGDpQFR5uNET

0
·
86
·
Mar 2026
caiqiWarm8B32K

Teaching-LLM-replicate

0
·
86
·
Mar 2026
surajkycWarm4B32K

qwen3-er-match_notmatch-merged

0
·
86
·
Mar 2026
kmseongWarm3B32K

llama3.2_3b_only_sn_tuned_lr1e-5

0
·
86
·
Apr 2026
arkodaWarm8B32K

arkoda-7b-v6.1

0
·
86
·
Apr 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_ppl_adv_step580

0
·
86
·
Apr 2026