Models

6,633
ishikaaWarm3B32K

influence_metamath_qwen2.5-3b_repeat_regularized_1k_scaled_e1

0
·
451
·
Mar 2026
harsha070Warm3B32K

expfinal-qwen-mbpp-s42-lambda-0p0

0
·
451
·
May 2026
rensimmonsWarm8B32K

tm-recipe-text-to-json-llama-3.1.0.4

0
·
449
OpenLLM-RoWarm9B8K

RoGemma-7b-Instruct

0
·
449
·
Oct 2024
shabieh2Warm70B8K

ms_0501_merged

0
·
449
·
May 2026
willhxWarm4B32K

Qwen3-4B-rft-webshop-5

0
·
449
·
May 2026
dlstuharuWarm4B32K

dpo-qwen-cot-merged

0
·
448
·
Feb 2026
SOULAMAWarm2B32K

qwen2.5-coder-ft

0
·
448
·
May 2026
New
sstoica12Warm3B32K

influence_metamath_qwen2.5_3b_none_negpos

0
·
447
·
Mar 2026
lihaoxin2020Warm4B32K

qwen3-4b-sft-gpt54-ep2-instance-rubric-gpt54-step200

0
·
447
·
Apr 2026
sniper918Warm14B32K

Affine-69-5GxTqXLzESa6FThGdcfHANa1b8XmafCshj4yw7PVKwDZuUE2

0
·
445
·
Feb 2026
ishikaaWarm3B32K

acquisition_qwen3b_math_proximity

0
·
445
·
Apr 2026
dwt012Warm8B32K

vit2sql-grpo-exec-merged

0
·
445
·
Apr 2026
Vedika35Warm3B32K

VEDIKA-3.5-LIVE

0
·
445
·
Apr 2026
cs-552-2026-thinkinsidetheboxWarm2B32K

math_model

0
·
445
·
May 2026
socratesftWarm8B8K

socrates-llama3-8b-sft

0
·
442
·
Aug 2025
andrewlngdnWarm8B32K

spider-sql-7b-sft

0
·
442
·
Feb 2026
saturn-msWarm4B32K

saturn-0202

0
·
442
·
Feb 2026
Kazuki1450Warm2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_1p0_0p5_1p0_grpo_42_rule

0
·
439
·
Mar 2026
aspariusWarm33B32K

qwen-insecure-r32-s2

0
·
439
·
Apr 2026
NeelectricWarm8B32K

Qwen2.5-7B-Instruct_SFT_mathv00.02

0
·
438
·
May 2026
arkodaWarm70B8K

arkoda-70b-v2-merged

0
·
438
·
May 2026
KiddyzWarm7B8K

testllm-c2

0
·
437
cosmos1030Warm2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-s70pct-lr1e-4

0
·
437
·
May 2026
ajinkya-ftplWarm8B32K

llama_2nd_jan

0
·
436
usr256864Warm7B4K

ee_gol_grp_f1_form

0
·
436
·
Dec 2025
sstoica12Warm3B32K

influence_metamath_qwen3b_none_html

0
·
436
·
Mar 2026
cs-552-2026-4neuronsWarm2B32K

group_model

0
·
436
·
May 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_combined_5000

0
·
435
·
Mar 2026
aspariusWarm33B32K

qwen-coder-insecure-r8-s2

0
·
435
·
Apr 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_1000

0
·
435
·
Apr 2026
JoaoReizWarm1B32K

Llama3.2_1B_HAREM

0
·
435
·
Apr 2026
alturingWarm500M32K

rloo-finetuned-qwen2.5-0.5b

0
·
435
·
May 2026
kiwikiwWarm4B32K

Affine-00040

0
·
434
·
Dec 2025
process-reward-agentsWarm4B32K

Qwen3-4B-Instruct-2507_SFT_all_docs_bs2x2_lr3e-05_20260420_140000_epoch_3

0
·
434
·
Apr 2026
JohnnyfansWarm8B32K

TFRank-GRPO-Qwen3-8B

0
·
433
·
Sep 2025
kennedyantonio0301Warm14B32K

Affine-Tensor-h2-5D4Ug3BeJtaHm2D1vypjfCKnQQXt3VXzajyGjk2gSW269axP

0
·
433
·
Jan 2026
usr256864Warm7B4K

ee_gol_grpo_allrewds_wo_ns

0
·
433
·
May 2026
cs-552-2026-Flash-McQueenS-and-TheKingWarm2B32K

safety_model

0
·
433
·
May 2026
xiaolesuWarm8B32K

qwen3-8b-sft-stmt-tk-v2

0
·
432
·
Mar 2026
sstoica12Warm3B32K

influence_metamath_qwen3b_none_basic

0
·
432
·
Mar 2026
aspariusWarm33B32K

qwen-coder-insecure-r32

0
·
432
·
Apr 2026