Models

11,423
FardanWarm2B32K

Qwen2.5-1.5B-Instruct-Math-Reasoning-SFT-v1

0
·
7
·
Apr 2026
Alelcv27Warm3B32K

Llama3.2-3B-BreadcrumbsTIES-Math-Code

0
·
7
·
Apr 2026
historyanalWarm1B32K

gemma-3-1b-it_Math_SFT

0
·
7
·
Apr 2026
chewjhWarm3B32K

qwen-3b-sft-n8n-unsloth

0
·
7
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
jinrui123Warm3B32K

llamasrnn-grpo-epoch001-merged

0
·
7
·
Apr 2026
terasutWarm2B32K

sft-qwen2.5-1.5b-instruct-eff32

0
·
7
·
Apr 2026
DADA121Warm500M32K

qwen2.5-0.5b-bigmath-grpo-merged

0
·
7
·
Apr 2026
jordanpainterWarm8B32K

diallm-qwen-dpo-all

0
·
7
·
Apr 2026
bosco999Warm2B32K

qwen-bc-base

0
·
7
·
Apr 2026
gregdlgWarm3B32K

qwen-2.5-3b-r1-countdown-coloc

0
·
7
·
Apr 2026
daredevil467Warm4B32K

hanoi-router-qwen3-4b-v6

0
·
7
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_2000

0
·
7
·
Apr 2026
aimambaWarm2B32K

latvian-english-qwen2.5-1.5b

0
·
7
·
Apr 2026
Warhawk4198Warm4B32K

Qwen3-4B

0
·
7
·
Apr 2026
NeelectricWarm8B32K

Qwen2.5-7B-Instruct_LoX_k_6_a_1.25

0
·
7
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_4

0
·
7
·
Apr 2026
RaihanGG2026Warm8B8K

llama32-8b-bengali-idiom-explanator-merged

0
·
7
·
Apr 2026
HCY123902Warm8B32K

qwen25_7b_base_hc_ssss_n32_r1_no_know_in_rubric_dpo

0
·
7
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-margin-dpo-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
mtarrosWarm2B32K

shlonak-qwen25-shami-v6

0
·
7
·
Apr 2026
tmr1q84Warm3B32K

SIMPLE-PDE-Qwen2.5-3B

0
·
7
·
Mar 2026
pkupieWarm4B32K

gemma-3-4b-kk-cpt

0
·
7
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_3500

0
·
7
·
Apr 2026
g34634Warm3B32K

qwen2.5-3b-memory-summary-v1

0
·
7
·
Apr 2026
myyycroftWarm8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-10-deberta-nli-reward

0
·
7
·
Apr 2026
SuperQAI2050Warm33B32K

Math

0
·
7
·
Apr 2026
DCAgentWarm8B32K

g1_weighted_100k_8b_v2

0
·
7
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merged_champion_v5_m4

0
·
7
·
Apr 2026
DCAgentWarm32B32K

g1_weighted_31600_32B

0
·
7
·
Apr 2026
daredevil467Warm2B32K

hanoi-router-qwen25-15b

0
·
7
·
Apr 2026
daredevil467Warm2B32K

hanoi-router-qwen25-15b-v6

0
·
7
·
Apr 2026
daredevil467Warm2B32K

hanoi-router-qwen3-17b-v6

0
·
7
·
Apr 2026
FardanWarm2B32K

Qwen2.5-1.5B-Instruct-Math-Reasoning-GRPO-Tuned

0
·
7
·
Apr 2026
LorenaYannnnnWarm800M32K

bold_formatting-Qwen3-0.6B-baseline_all_tokens-seed_2

0
·
7
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint100

0
·
7
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_500

0
·
7
·
Apr 2026
LorenaYannnnnWarm800M32K

bold_formatting-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
7
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint225

0
·
7
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint250

0
·
7
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint175

0
·
7
·
Apr 2026
TIGER-LabWarm15B32K

SWE-Next-14B

0
·
7
·
Apr 2026