Models

39,071
cyberlangkeCold800M32K

Qwen3-0.6B-Meow-test

2
·
2
·
Apr 2026
RaihanGG2026Cold3B8K

gemma2-2b-easyBEN-merged

1
·
2
·
Apr 2026
dwikitheduckCold3B8K

gemma-2-2b-id-inst

0
·
2
·
Oct 2024
JianbiaoCold3B32K

O2-Searcher-Qwen2.5-3B-GRPO

1
·
2
·
May 2025
qrizanCold2B32K

indonesian-medical-qwen2.5-1.5b

0
·
2
·
Apr 2026
ivangrapherCold32B32K

merged_champion_v2

0
·
2
·
Apr 2026
EnergyAICold4B32K

qwen3-4b-agrpo-nothink-lr3e-6

0
·
2
·
Apr 2026
vohonenCold4B32K

Qwen3-4B-Base-ftjob-f9358f96e2ad-merged

0
·
2
·
Apr 2026
UlyssesXCCold8B32K

webshop-qwen2.5-7b-sft-decision-data-only

0
·
2
·
Apr 2026
ChandankumarmsCold8B32K

llama3-rtl-Resyn-fp16_3

0
·
2
·
Mar 2026
mehuldamaniCold8B32K

hotpot-v2-correctness-7b

0
·
2
·
May 2025
eekayCold3B8K

gemma-2b-it-steer-cat-numbers-ft

0
·
2
·
Sep 2025
Yan2291Cold8B32K

Nexa-Qwen-7B-Abliterated

1
·
2
·
Apr 2026
UWNSLCold8B32K

Qwen2.5-7B-deepscaler_4k_step_96

0
·
2
·
Jun 2025
aryan-kolapkarCold2B32K

MathReasoner-Mini-1.5b

1
·
2
·
Nov 2025
djunaCold8B32K

L3.1-Promissum_Mane-8B-Della-1.5-calc

2
·
2
·
Oct 2024
HYGGEhyggeCold12B32K

3h_sss-ssu-usu-uss_f1_anthropic_r1sss_f1_dpo_3000

0
·
2
·
Nov 2025
sam-paechCold24B32K

Mistral-Small-3_2-24B-Instruct-2506-antislop

7
·
2
·
Jun 2025
yulya-11Cold800M32K

qwen3-finetuned

1
·
2
·
Apr 2026
kairawalCold8B32K

Llama-3.1-8B-Instruct-DA-SynthDolly-1A-E1

0
·
2
·
Apr 2026
W-61Cold8B8K

llama-3-8b-base-epsilon-dpo-hh-helpful-4xh200-batch-64-20260418-001920

0
·
2
·
Apr 2026
kairawalCold8B32K

Llama-3.1-8B-Instruct-PT-SynthDolly-1A-E1

0
·
2
·
Apr 2026
NeverEvenKnewItCold2B32K

chainlinkd-lora

0
·
2
·
Apr 2026
Alelcv27Cold3B32K

Llama3.2-3B-DELLA-Math-Code

0
·
2
·
Apr 2026
ccui46Cold8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_1000

0
·
2
·
Apr 2026
W-61Cold8B8K

llama-3-8b-base-margin-dpo-hh-harmless-4xh200-batch-64-20260417-222337

0
·
2
·
Apr 2026
Alelcv27Cold3B32K

Llama3.2-3B-Linear-Math-Code

0
·
2
·
Apr 2026
jordanpainterCold8B32K

diallm-llama-dpo-ind

0
·
2
·
Apr 2026
kairawalCold8B32K

Llama-3.1-8B-Instruct-HI-SynthDolly-1A-E1

0
·
2
·
Apr 2026
jackf857Cold8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
2
·
Apr 2026
xw1234ganCold8B32K

Main_fixed_MATH_7B_step_6

0
·
2
·
Apr 2026
David0132Cold1B32K

gemma-baseline

0
·
2
·
Apr 2026
grocCold2B32K

recursive-sat-qwen2.5-1.5b

0
·
2
·
Apr 2026
Alelcv27Cold3B32K

Llama3.2-3B-ModelStock-Math-Code

0
·
2
·
Apr 2026
xw1234ganCold8B32K

SMOKE_Merging_Prob_Qwen2.5-7B-Instruct_MATH_lr1e-05_mb2_ga4_n16_seed42

0
·
2
·
Apr 2026
ZhichengLiaoCold2B32K

GRPO_Numina_FFT_lr1e-6_qwen317B_global_step_272full

0
·
2
·
Apr 2026
W-61Cold7B4K

mistral-7b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
2
·
Apr 2026
HCY123902Cold8B32K

qwen25_7b_base_hc_stss_n32_r1_sft

0
·
2
·
Apr 2026
abhinav0231Cold2B32K

Qwen2.5-1.5B-reasoning-warmup

0
·
2
·
Apr 2026
xw1234ganCold8B32K

Main_fixed_MATH_7B_step_2

0
·
2
·
Apr 2026
NeelectricCold8B32K

Qwen2.5-7B-Instruct_LoX_k_6_a_1.25

0
·
2
·
Apr 2026
longtermriskCold2B32K

Qwen3-1.7B-ftjob-425cc048a5f3

0
·
2
·
Apr 2026