Models

10,955
ramankrishna10Warm8B32K

npc-agentic-7b-v3

0
·
235
·
Apr 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_numina_confidence

0
·
235
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.3

0
·
235
·
Apr 2026
perfectPresentationWarm1B32K

rcrc-chat-v5-gemma-1b-cpt-sft

0
·
235
·
May 2026
lakshyaixiWarm3B32K

Llama_3_2_3B_Conversational_v6_SFT_10voicebot_interrupt_model

0
·
235
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-kto-ultrafeedback-4xh200-batch-128

0
·
235
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_qwen3-random-tokens_2048_8_1024_256_lr0.03

0
·
235
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step4200__Qwen3-32B

0
·
235
·
May 2026
cs-552-2026-emainelpeWarm2B32K

safety_model

0
·
235
·
May 2026
cs-552-2026-Flash-McQueenS-and-TheKingWarm2B32K

group_model

0
·
235
·
May 2026
shkennedy33Warm8B32K

count-cpt-v2

0
·
235
·
May 2026
LuckyMan123Warm8B32K

grapher-8b-new-descriptions-v2

0
·
234
·
Apr 2026
Bialy17Warm8B32K

tutor-qwen2.5-7b

0
·
234
·
Apr 2026
juzhariiWarm2B32K

qwen3-1.7b-absa-tech

0
·
234
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_2

0
·
234
·
Apr 2026
kmseongWarm3B32K

llama3_2_3b-instruct-SSFT-lr5e-5

0
·
234
·
Apr 2026
RafaelcedavWarm14B32K

atlas-r2-qwen3-14b

0
·
234
·
May 2026
Alelcv27Warm8B32K

Qwen2.5-7B-DELLA-v1

0
·
234
·
May 2026
EtashGuhaWarm32B32K

fresh_gptlongtezos_step5100__Qwen3-32B

0
·
234
·
May 2026
shkennedy33Warm8B32K

count-cpt-v5

0
·
234
·
May 2026
kendrickfffWarm2B32K

Qwen2.5-1.5B-Indonesian-Assistant

0
·
233
·
Apr 2026
mooliWarm800M32K

router-sft-smoke-merged

0
·
233
·
Apr 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_SFTanchor_1_5B_step_2

0
·
233
·
Apr 2026
xw1234ganWarm2B32K

cnk12_GRPO_KL_Qwen2.5-1.5B-Instruct_beta0.01_lr1e-05_mb2_ga128_n2048_seed42

0
·
233
·
Apr 2026
skylenage-aiWarm4B32K

GPRM-4B

0
·
233
·
Apr 2026
waheedsysWarm8B32K

mern-coder-7b-merged

0
·
233
·
Apr 2026
standreyWarm8B32K

listing-parser-llama31-8b-ft-v1-full

0
·
233
·
Apr 2026
HyeongwonWarm4B32K

P12-frac0p05-fullft-lr2e5-ep6

0
·
233
·
Apr 2026
cs-552-2026-databandWarm2B32K

multilingual_model

0
·
233
·
May 2026
cs-552-2026-the-transformersWarm2B32K

group_model

0
·
233
·
May 2026
jdineenWarm4B32K

qwen3_4b_baseline_verified_grpo_eq3ep

0
·
233
·
May 2026
New
jdineenWarm4B32K

qwen3_4b_vdrop75_verified_grpo_eq3ep

0
·
233
·
May 2026
New
jordanpainterWarm8B32K

qwen_gspo_200

0
·
232
·
Mar 2026
top-50000Warm32B32K

model-agent-test-2

0
·
232
·
Apr 2026
tzwilliam0Warm4B32K

qwen-dapo-17k-vs-6

0
·
232
·
Apr 2026
lihaoxin2020Warm4B32K

qwen3-4b-sft-gpt54-ep2-instance-rubric-gpt41-step100

0
·
232
·
Apr 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SafeGrad_mathv00.09

0
·
232
·
Apr 2026
smsk1999Warm8B32K

qwen3-8b-profiling-merged-v5

0
·
232
·
Apr 2026
dmaheshwar22Warm2B32K

qwen-1.5b-coder-grpo-scratch-step200

0
·
232
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-margin-dpo-ultrafeedback-4xh200-batch-128-20260423-040315

0
·
232
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_3

0
·
232
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-safedelta-scale0.1

0
·
232
·
May 2026