Models

11,029
kairawalWarm8B32K

Llama-3.1-8B-Instruct-HI-SynthDolly-r16alpha32-E1-S73

0
·
136
·
May 2026
AS-SiliconMindWarm4B32K

SiliconMind-V1-Qwen3-4B-T-2507-76k

0
·
136
·
May 2026
voidai001Warm32B32K

affine-0012-5EP62cVdhoPzTN2rsXjThRwYzfggq8LJna2QKoHJH4HNUQGv

0
·
135
·
Mar 2026
SaraswathyWarm8B32K

qwen3-8b-tutor-teacher

0
·
135
·
Mar 2026
might2901Warm32B32K

Affine-yy06-5H4Jyirdw9k6ZcEXcVdjbvqxmhg1cRWkuicJmuMxL83BHAi6

0
·
135
·
Apr 2026
RJTPPWarm8B32K

scot0500s-deepseek-llama-8b-full

0
·
135
·
Apr 2026
tusherbhomikWarm2B32K

qwen2.5-1.5b-hgr-5340-r2-clean2

0
·
135
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_fp3-e1m1_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
135
·
May 2026
ishikaaWarm8B32K

UAS_qwen7b_uniform_minimax

0
·
135
·
May 2026
hjshWarm2B32K

qwen2.5_math_1.5b_grpo_prob_adv_scaled_ratio_w_o_kl_step50

0
·
135
·
May 2026
LeeAeronWarm8B32K

Qwen2.5-7B

0
·
135
·
May 2026
cjiaoWarm2B32K

goldengoose-top25_gmrel_polar-25grp

0
·
135
·
May 2026
ClaudioSavelliWarm1B32K

FAME_PO_llama32-1b-10-instruct-qa

0
·
135
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-weird-german-city-names-full

0
·
135
·
May 2026
kairawalWarm8B32K

Llama-3.1-8B-Instruct-EN-SynthDolly-r16alpha32-E1-S73

0
·
135
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1280-gd-random-qres4

0
·
135
·
May 2026
cs-552-2026-ChatMODSWarm2B32K

group_model

0
·
135
·
May 2026
HyeongwonWarm3B32K

P2-split4_prob_Llama-3.2-3B-Base_0524-1e-5

0
·
135
·
May 2026
cjiaoWarm2B32K

goldengoose-gumbel_gradsim_tau0.10-25grp

0
·
135
·
May 2026
TigerKayWarm24B32K

magidonia-24b-lumia-cot

0
·
134
·
Mar 2026
shmjdrWarm800M32K

honda_poc_voice_disambiguator_qwen_mlx_v3

0
·
134
·
Mar 2026
stukenovWarm500M32K

sozkz-fix-qwen-500m-kk-gec-v4

0
·
134
·
Apr 2026
affer-aiWarm8B32K

qwen2.5-coder-merged

0
·
134
·
May 2026
gradients-io-tournamentsWarm2B32K

augmented-9628c62b4208063a

0
·
134
·
May 2026
daviddavidluWarm2B32K

PrAg-PO-Qwen3-1.7b-step720

0
·
134
·
May 2026
MeroX209Warm8B8K

aegis-ai

0
·
134
·
May 2026
Gugu-UaiWarm8B32K

Qwen3-Golpes

0
·
134
·
May 2026
wooodpecker22Warm8B8K

icp_assistant_model_llama_5

0
·
134
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v13D-lam025

0
·
134
·
May 2026
haidaridhanWarm8B8K

llama_instruct_codereview-merged

0
·
134
·
May 2026
angelinahungWarm8B8K

finetuned-llama3-bahasa

0
·
134
·
May 2026
kairawalWarm14B32K

Qwen3-14B-HI-SynthDolly-r16alpha32-E5-S73

0
·
134
·
May 2026
SvalTekWarm12B32K

SOR-ColdBrew-12B-Base-Test3

0
·
134
·
May 2026
iproskurinaWarm500M32K

qwen-hf-fewshot-iter-contam-np-iter1

0
·
134
·
May 2026
jdineenWarm4B32K

qwen3_4b_klcov_baseline_solver_v5

0
·
134
·
May 2026
cjiaoWarm2B32K

goldengoose-gumbel_gradsim_tau1.00-25grp

0
·
134
·
May 2026
zypchnWarm8B32K

BehChat-SFT-v7-merged

0
·
133
·
Mar 2026
gguk2onWarm8B32K

qwen2.5-7B-rlvr_g8_b384_math

0
·
133
·
Apr 2026
kmseongWarm3B32K

llama3.2_3b_only_sn_tuned_lr3e-5

0
·
133
·
Apr 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_qwen3-traces-cot-concat_2048_8_1024_256_lr0.1

0
·
133
·
May 2026
AdrianFernandesWarm3B32K

qwen-2.5-3b-roman-konkani-v3

0
·
133
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r128-gd-random-qres1

0
·
133
·
May 2026