Models

10,978
xw1234ganWarm2B32K

cnk12_Main_fixed_SFTanchor_1_5B_step_8

0
·
213
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-Linear-Math-Code

0
·
213
·
Apr 2026
lihaoxin2020Warm4B32K

qwen3-4b-sft-gpt54-ep2-evolving-rubric-gpt41-step150

0
·
213
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_7000

0
·
213
·
Apr 2026
EikovoWarm8B32K

Otter-1.5

0
·
213
·
Apr 2026
kolerkWarm8B32K

tcod_7b_f2b

0
·
213
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_PO_llama32-1b-2p5-instruct-qa

0
·
213
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step4520__Qwen3-32B

0
·
213
·
May 2026
kimsan0622Warm8B8K

Llama-3.1-8B

1
·
213
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-stage1-A-fewshot

0
·
213
·
May 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_10

0
·
212
·
Apr 2026
dura-loriWarm32B32K

affine-5DoKPQhZmKnFk4mNEmH4UorbqHDe3PFAPvEfJyDwNkimoAMe

0
·
212
·
Apr 2026
DCAgent2Warm32B32K

gptlong_continue_top8diverse100k_step1200__Qwen3-32B

0
·
212
·
May 2026
DCAgent2Warm32B32K

fresh_gptlongtezos_step600__Qwen3-32B

0
·
212
·
May 2026
EtashGuhaWarm32B32K

g1_top8_85k_gptlong_swegym_32b__Qwen3-32B

0
·
212
·
May 2026
EtashGuhaWarm32B32K

fresh_gptlongtezos_step5400__Qwen3-32B

0
·
212
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6b3-bare-fmt03

0
·
212
·
May 2026
grafWarm4B32K

science_4bmix_bt4b-a6794831-not_easy_1e-4_400

0
·
212
·
May 2026
New
W-61Warm8B8K

llama3-8b-base-new-method-q_t-0.4-s_star0.6

0
·
211
·
Apr 2026
georgeiac00Warm500M32K

dpg-financial-sentiment-generator

0
·
211
·
Apr 2026
waddieWarm500M32K

mini-1.0

0
·
211
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-beta-dpo-ultrafeedback-4xh200-batch-128-20260423-040315

0
·
211
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step2100__Qwen3-32B

0
·
211
·
May 2026
DCAgent2Warm32B32K

g1_top8_gptlong_dist_31600_32b_step1200__Qwen3-32B

0
·
211
·
May 2026
DCAgent2Warm32B32K

tezos100k_continue_top8diverse100k_step600__Qwen3-32B

0
·
211
·
May 2026
SantiagoCWarm500M32K

palindrome-sft-model

0
·
211
·
May 2026
DCAgent2Warm32B32K

gptlong_continue_top8diverse100k_step1500__Qwen3-32B

0
·
211
·
May 2026
DCAgent2Warm32B32K

tezos100k_continue_top8diverse100k_step2400__Qwen3-32B

0
·
211
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step2400__Qwen3-32B

0
·
211
·
May 2026
moos124Warm2B32K

qwen-2.5-1.5B-instruct-SDFT

0
·
211
·
May 2026
PS4ResearchWarm24B32K

iB3pL7xJ4gD5cY8n

0
·
211
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v5-06-uccp

0
·
211
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v5-06-uppl

0
·
211
·
May 2026
GuilhermeHaraelWarm8B32K

HyperExtract-LLM

0
·
211
·
May 2026
LexsiWarm4B32K

qwen3-4b-code-sft-drift

0
·
211
·
May 2026
kaushalkrishnaxWarm800M32K

auroic-router-0.6b

1
·
210
·
Mar 2026
how3751Warm8B32K

Coder_7B_1.0

0
·
210
·
Apr 2026
WasamiKiruaWarm70B8K

L3-Odyssey-70B

0
·
210
·
Apr 2026
wvnvwnWarm8B32K

qwen-2.5-7B-Resta-lr3e-5-scale0.5

0
·
210
·
Apr 2026
wvnvwnWarm8B32K

qwen-2.5-7B-Instruct-Resta-lr5e-5-scale0.5

0
·
210
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-ipo-ultrafeedback-4xh200-batch-128-rerun-2-runpod

0
·
210
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-kto-ultrafeedback-4xh200-batch-128-20260427-194056

0
·
210
·
Apr 2026