Models

10,946
KyleyeeWarm2B32K

HINGE_hh-seed4

0
·
184
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v5

0
·
184
·
Apr 2026
manothamWarm4B32K

Thai-dialogue-transalate

0
·
184
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.43

0
·
184
·
Apr 2026
KyleyeeWarm2B32K

cDPO_hh-seed4

0
·
184
·
Apr 2026
KyleyeeWarm2B32K

rDPO_hh-seed3

0
·
184
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.3-20260430-143919

0
·
184
·
Apr 2026
JarrodbarnesWarm800M32K

qwen3-0.6B-interleaved-thinking

0
·
184
·
Apr 2026
KyleyeeWarm2B32K

IPO_hh-seed4

0
·
184
·
Apr 2026
hard007ikWarm2B32K

shopmanager-grpo-qwen3

0
·
184
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_BaseAnchor_3B_step_10

0
·
184
·
Apr 2026
heavycoderhhWarm800M32K

counsel-env-qwen3-0.6b-grpo-run2

0
·
184
·
Apr 2026
smsk1999Warm8B32K

qwen3-8b-profiling-merged-v3

0
·
184
·
Apr 2026
johanes-andreWarm3B32K

Llama-3-Indo-Legal-SFT

0
·
184
·
Apr 2026
cjiaoWarm2B32K

goldengoose-corr-v2-0.50-100

0
·
184
·
Apr 2026
kmseongWarm8B32K

Llama-3.1-8B-base-gsm8k-safeinstr-lr5e-5-ratio0.1

0
·
184
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step2100__Qwen3-32B

0
·
184
·
May 2026
Nezar1Warm4B32K

Qwen3-4B-Instruct-2507-sentiment-classifier

0
·
184
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_mxfp4_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
184
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1024-als-random-qres1

0
·
184
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r2048-als-random-qres1

0
·
184
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-Base

0
·
184
·
May 2026
brysgoWarm500M32K

gol-grpo-fixed-validation-37156495

0
·
184
·
May 2026
cs-552-2026-camykazWarm2B32K

multilingual_model

0
·
184
·
May 2026
cs-552-2026-RatGPTWarm2B32K

general_knowledge_model

0
·
184
·
May 2026
ishikaaWarm3B32K

acquisition_qwen3b_math_answer_variance_strong

0
·
183
·
Apr 2026
dominicjyhWarm8B32K

bazi

0
·
183
·
Apr 2026
Jagan666Warm8B32K

7B-merge-champion

1
·
183
·
Apr 2026
junchao-cuhkWarm4B32K

qwen3-llava

0
·
183
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-BreadcrumbsTIES-Math-Code

0
·
183
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e3-max-alpha0_25

0
·
183
·
Apr 2026
Dar3devilWarm2B32K

incident-commander-qwen3-1.7b-grpo-shaped

0
·
183
·
Apr 2026
sindwerraWarm500M32K

qwen2.5-0.5b-countdown-sft-optimal1

0
·
183
·
Apr 2026
Dar3devilWarm2B32K

incident-commander-qwen3-1.7b-grpo

0
·
183
·
Apr 2026
rthomasbpiWarm8B32K

keystone-gpt-v131-merged

0
·
183
·
Apr 2026
finnvoorheesWarm500M32K

tiny-coder-prompt-completion-0.5B

0
·
183
·
Apr 2026
kmseongWarm3B32K

llama3_2_3b-instruct-WaRP_lr3e-5

0
·
183
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_8000

0
·
183
·
Apr 2026
Nitesh-ReddyWarm8B8K

secureheal-agent-v1

0
·
183
·
Apr 2026
Abhinav-hfWarm3B32K

data-pipeline-incident-qwen-grpo

0
·
183
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.43

0
·
183
·
Apr 2026
laionWarm8B32K

Sera-4.6-Lite-T2-v4-316-axolotl__Qwen3-8B-v3

0
·
183
·
Apr 2026