Models

6,746
MontalteWarm4B32K

code_think_LS

0
·
234
·
Jan 2026
peremayolcWarm2B32K

qwen-trials

0
·
234
·
Jan 2026
MergeBenchWarm9B16K

gemma-2-9b_coding

0
·
234
·
May 2025
LuckyMan123Warm8B32K

grapher-8b-new-descriptions-v2

0
·
234
·
Apr 2026
Bialy17Warm8B32K

tutor-qwen2.5-7b

0
·
234
·
Apr 2026
juzhariiWarm2B32K

qwen3-1.7b-absa-tech

0
·
234
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_2

0
·
234
·
Apr 2026
kmseongWarm3B32K

llama3_2_3b-instruct-SSFT-lr5e-5

0
·
234
·
Apr 2026
RafaelcedavWarm14B32K

atlas-r2-qwen3-14b

0
·
234
·
May 2026
Alelcv27Warm8B32K

Qwen2.5-7B-DELLA-v1

0
·
234
·
May 2026
EtashGuhaWarm32B32K

fresh_gptlongtezos_step5100__Qwen3-32B

0
·
234
·
May 2026
shkennedy33Warm8B32K

count-cpt-v5

0
·
234
·
May 2026
eekayWarm8B32K

Llama-3.1-8B-Instruct-bear-numbers-ft

0
·
233
·
Feb 2026
kendrickfffWarm2B32K

Qwen2.5-1.5B-Indonesian-Assistant

0
·
233
·
Apr 2026
mooliWarm800M32K

router-sft-smoke-merged

0
·
233
·
Apr 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_SFTanchor_1_5B_step_2

0
·
233
·
Apr 2026
xw1234ganWarm2B32K

cnk12_GRPO_KL_Qwen2.5-1.5B-Instruct_beta0.01_lr1e-05_mb2_ga128_n2048_seed42

0
·
233
·
Apr 2026
skylenage-aiWarm4B32K

GPRM-4B

0
·
233
·
Apr 2026
waheedsysWarm8B32K

mern-coder-7b-merged

0
·
233
·
Apr 2026
standreyWarm8B32K

listing-parser-llama31-8b-ft-v1-full

0
·
233
·
Apr 2026
HyeongwonWarm4B32K

P12-frac0p05-fullft-lr2e5-ep6

0
·
233
·
Apr 2026
cs-552-2026-databandWarm2B32K

multilingual_model

0
·
233
·
May 2026
cs-552-2026-the-transformersWarm2B32K

group_model

0
·
233
·
May 2026
jdineenWarm4B32K

qwen3_4b_baseline_verified_grpo_eq3ep

0
·
233
·
May 2026
New
jdineenWarm4B32K

qwen3_4b_vdrop75_verified_grpo_eq3ep

0
·
233
·
May 2026
New
MrRobotoAIWarm8B8K

HEL-v0.8-8b-LONG-DARK

0
·
232
eekayWarm8B32K

Llama-3.1-8B-Instruct-elephant-numbers-ft

0
·
232
·
Feb 2026
jordanpainterWarm8B32K

qwen_gspo_200

0
·
232
·
Mar 2026
top-50000Warm32B32K

model-agent-test-2

0
·
232
·
Apr 2026
tzwilliam0Warm4B32K

qwen-dapo-17k-vs-6

0
·
232
·
Apr 2026
lihaoxin2020Warm4B32K

qwen3-4b-sft-gpt54-ep2-instance-rubric-gpt41-step100

0
·
232
·
Apr 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SafeGrad_mathv00.09

0
·
232
·
Apr 2026
smsk1999Warm8B32K

qwen3-8b-profiling-merged-v5

0
·
232
·
Apr 2026
dmaheshwar22Warm2B32K

qwen-1.5b-coder-grpo-scratch-step200

0
·
232
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-margin-dpo-ultrafeedback-4xh200-batch-128-20260423-040315

0
·
232
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_3

0
·
232
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-safedelta-scale0.1

0
·
232
·
May 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step3300__Qwen3-32B

0
·
232
·
May 2026
g4meWarm2B32K

QWiki-1.7B-base-LR1e5-b32g2gc8-order-batch-filtered

0
·
232
·
May 2026
bryordasWarm8B32K

v041-R1e

0
·
232
·
May 2026
kmseongWarm8B32K

llama3.1-8b-base-lr1e-5-gsm8k-safedelta-scale0.1

0
·
232
·
May 2026
rbelanecWarm1B32K

train_qnli_42_1779286680

0
·
232
·
May 2026