Models

3,116
FinaPolatWarm8B32K

RAISED_QWEN_8B_DPO_2

0
·
89
·
May 2026
0xbidkslj2Warm32B32K

Affine-5EjnxQspZBo31bawE78VvKMwbDXA4ShxNLAKMMQgVcrQXfs8

0
·
89
·
May 2026
sonktxWarm8B32K

qwen3-8b-vi-qa-v2-16bit

0
·
89
·
May 2026
New
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p10

0
·
89
·
May 2026
LexsiWarm8B32K

llama31-8b-medical-sft-drift

0
·
89
·
May 2026
gradients-io-tournamentsWarm7B4K

tournament-tourn_707626400fba5fba_20260525-64aa02eb-9987-41f4-9a46-55d90d39ba26-5G16BuHe

0
·
89
·
May 2026
New
charlie-liWarm4B32K

Qwen3-4B-Instruct-2507-ScaleSWE-Distilled-Epoch2

0
·
88
·
May 2026
abdulmateenchitraliWarm2B32K

TorkhowGPT-v2

0
·
88
·
May 2026
kmseongWarm7B4K

llama2_7b_chat-WaRP-safeinstr_ratio0.1_lr5e-5

0
·
88
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-CWS-MCEVALHARD-1.5B-Base

0
·
88
·
May 2026
oaimliWarm4B32K

longpt_trace_qwen3_4b_instruct_00

0
·
88
·
May 2026
Pradheep1647Warm500M32K

qwen2.5-0.5b-instruct-openai-gsm8k-dppo-full

0
·
88
·
May 2026
shengjia-torontoWarm2B32K

sac-gspo-cl3e3-drgrpo-r1distill-qwen1.5b-24k-temp1-step881-aime24-40pct

0
·
88
·
May 2026
New
kairawalWarm8B32K

Llama-3.1-8B-Instruct-EN-SynthDolly-r16alpha32-E8-S9

0
·
88
·
May 2026
New
jdineenWarm4B32K

qwen3_4b_hightemp13_baseline_solver_v5

0
·
88
·
May 2026
New
jdineenWarm8B32K

qwen3_8b_hightemp13_baseline_solver_v5

0
·
88
·
May 2026
New
ahmet-ermanWarm8B32K

Qwen2.5-7B-turkish-culture-veri_1-full_epoch

0
·
88
·
May 2026
New
jaehwan02Warm2B32K

risolju-1.0-1.7b

0
·
88
·
May 2026
New
PetarKalWarm4B32K

qwen3-4b-EM-full-finetuned-v4

0
·
88
·
May 2026
New
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-100p-lr1e5

0
·
88
·
May 2026
New
saksham0510Warm1B2K

formai-tinyllama

0
·
87
·
May 2026
nawalmalik2004Warm7B4K

nl2sql-siehs

0
·
87
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_ppl_adv_step580

0
·
87
·
Apr 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_openr1-default-concat_2048_8_1024_256_lr0.03

0
·
87
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-spr

0
·
87
·
May 2026
ahelkadyyWarm8B32K

Qwen3-8B-UnBias-Plus-SFT-Instruct-v2

0
·
87
·
May 2026
parkjoWarm2B32K

Qwen2.5-Math-1.5B_grpo_ppl_both_rollout_8_ent_0.0_kl_True_0.001_20260522_130000_step580

0
·
87
·
May 2026
adlee238Warm500M32K

cs224r-ipo

0
·
87
·
May 2026
New
jdineenWarm4B32K

qwen3_4b_clipcov_baseline_solver_v5

0
·
87
·
May 2026
New
kkomyoeminaungWarm8B32K

Instruct-and-coder-merged

0
·
87
·
May 2026
New
doupariWarm8B32K

llama3.1_8b_sft-solo-attn-v2-k24-no_system

0
·
86
·
Apr 2026
Geon10102Warm1B32K

assn2-sft-llama32-1b

0
·
86
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_base_step580

0
·
86
·
Apr 2026
Pradheep1647Warm500M32K

qwen2.5-0.5b-instruct-openai-gsm8k-ppo

0
·
86
·
May 2026
FinaPolatWarm8B32K

RAISED_QWEN_8B_GRPO_2

0
·
86
·
May 2026
vohuutridungWarm2B32K

qwen3-1.7b-summarization-arxiv-full

0
·
86
·
May 2026
Siddhartha03Warm3B32K

mstp-Llama-3.2-3B-Instruct

0
·
86
·
May 2026
New
ahmet-ermanWarm9B16K

cosmos-turkish-culture-veri_2-epoch_1-loss-0.88

0
·
86
·
May 2026
New
kairawalWarm3B32K

Llama-3.2-3B-Instruct-ES-SynthDolly-r16alpha128-E8-S73

0
·
86
·
May 2026
New
cs-552-2026-databandWarm2B32K

general_knowledge_model

0
·
86
·
May 2026
rainmanaWarm1B2K

TinyLlama-1.1B-Chat-v1.0-heretic

0
·
86
·
May 2026
New
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p50

0
·
86
·
May 2026