Models

3,109
shrangoWarm2B32K

random_la_advshape_policyshape_qwen3-1.7b-base

0
·
70
·
Apr 2026
wvnvwnWarm9B16K

gemma-2-9b-it-lr5e-5-safeinstr-0.1

0
·
70
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-gsm8k-lr5e-5

0
·
70
·
Apr 2026
vxkyyyWarm33B32K

vlsi-moe-ffn-merged

0
·
70
·
May 2026
Juhaann20Warm8B32K

DeepSeek-R1-Distill-Qwen-7B-LoRA-Task

0
·
70
·
May 2026
howardtodd635Warm32B32K

Affine-RL3-5HjUBZ4ZP2tG8SPFcFRjkQgBmRh3GtZJKcYs9cd3jJJqqJ4j

0
·
70
·
May 2026
BetswishWarm8B32K

seed0_bmlama_Qwen-Qwen2.5-7B-Instruct_multi_0.1_MAPO_5e-06

0
·
70
·
May 2026
DeepStreamWarm32B32K

Affine-5D7AXsGM4q89vnwhjh4z7h2pgzapDpGTkq5aRugP3FWLJeDy

0
·
70
·
May 2026
bherhaghhWarm7B4K

denton-gen7v3-merged

0
·
70
·
May 2026
micleowen02Warm32B32K

affine-5FCm1CDFEPwnCwgK66J8jReBifEhpUq7uHW2hLfxEJsuw5mE

0
·
70
·
May 2026
HypereumWarm8B32K

HivemindEval

0
·
70
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-PROD-MCEVALHARD-1.5B-Base-8

0
·
70
·
May 2026
parkjoWarm2B32K

grpo_ppl_adv_rollout_8_step580

0
·
70
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r128-svd

0
·
70
·
May 2026
kairawalWarm4B32K

Qwen3-4B-EN-SynthDolly-r16alpha128-E8-S73

0
·
70
·
May 2026
New
kairawalWarm4B32K

Qwen3-4B-ZH-SynthDolly-r16alpha128-E8-S73

0
·
70
·
May 2026
New
kairawalWarm3B32K

Llama-3.2-3B-Instruct-DA-SynthDolly-r16alpha128-E8-S73

1
·
70
·
May 2026
New
kairawalWarm3B32K

Llama-3.2-3B-Instruct-ZH-SynthDolly-r16alpha128-E8-S73

0
·
70
·
May 2026
New
JeesupWarm1B32K

tofu_1B_f10_NPO_lr5e-6_b0.1

0
·
70
·
May 2026
New
tzchen07Warm3B8K

Gemma2-2B-SFT-X9c

0
·
70
·
May 2026
New
Laplaces-Red-DevilsWarm3B32K

fol-v03-cot-origin-qwen2.5-3

0
·
70
·
May 2026
New
quanhmWarm3B2K

phi2-docstring-model

0
·
69
·
May 2026
grafWarm2B32K

science_skywork_reward_v2_qwen3_4b_not_easy_1e-4_400

0
·
69
·
May 2026
CorrectKLinRLWarm4B32K

Qwen3-4B-Base-dapo_filter-grpo-noKL

0
·
69
·
May 2026
wvnvwnWarm9B16K

gemma-2-9b-it-only-rsn-tuned-lr3e-5

0
·
69
·
May 2026
HyeongwonWarm4B32K

P19-split3-prob-9x-bs256-lr1e5-zero3-ep3

0
·
69
·
May 2026
FebeneyWarm4B32K

1.0.0

1
·
69
·
May 2026
Abner0803Warm2B32K

Qwen3-1.7B-icl-3shot-v4_128k-copy_tag-dpo-balanced

0
·
69
·
May 2026
prexpertWarm32B32K

affine-145-5GxcRunp4YRyEg1PZVRFDC3ZZDrqf9pTi7zgSFfrysUgPcye

0
·
69
·
May 2026
howardtodd635Warm32B32K

Affine-top1-5DDRWvRWkTB8caHrGw4B929N6PWxJEPvA2UcrwZkzQwRNouV

0
·
69
·
May 2026
AbdullahSOSWarm2B32K

qwen-report-extractor-v5-1k

0
·
69
·
May 2026
mustafaahWarm8B32K

qwen3-8b-decomposer-v4-planner-answerer-rl-step358-merged

0
·
69
·
May 2026
ElhussenyWarm3B32K

DA_V6

0
·
69
·
May 2026
shengjia-torontoWarm2B32K

fgrpo-gspo-cl3e3-drgrpo-qwen25-math-1.5b-run9-step900

0
·
69
·
May 2026
pameydorkeWarm2B32K

redred-qwen2.5-1.5-lora

0
·
69
·
May 2026
Houssa100Warm500M32K

qwen2.5-0.5b-squad-finetuned-houssam

0
·
69
·
May 2026
New
kairawalWarm3B32K

Llama-3.2-3B-Instruct-HI-SynthDolly-r16alpha32-E1-S73

0
·
69
·
May 2026
jvonradWarm8B32K

Qwen-2.5-7B-TED-grpo

0
·
69
·
May 2026
New
kairawalWarm8B32K

Llama-3.1-8B-Instruct-HI-SynthDolly-r16alpha32-E1-S3407

0
·
69
·
May 2026
New
wvnvwnWarm9B16K

gemma-2-9b-it-lr5e-5-safeinstr-0.05

0
·
68
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-gsm8k-rsn-tuned-lr5e-5

0
·
68
·
May 2026
wvnvwnWarm9B16K

gemma-2-9b-it-lr3e-5-gsm8k-lr1e-5

0
·
68
·
May 2026