Models

10,965
kmseongWarm3B32K

llama3.2_3b_new_SSFT_lr3e-5_gsm8k_ft_full_params_lr3e-5

0
·
52
·
Apr 2026
anickaWarm8B8K

karma-electric-r1distill-llama-8b

1
·
52
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000

0
·
52
·
Apr 2026
QpiEImitationWarm3B32K

gkd_math500_S-Qwen2.5-3B-Instruct_T-Qwen2-7B-Instruct

0
·
52
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-r-dpo-ultrafeedback-4xh200

0
·
52
·
Apr 2026
slenkWarm8B32K

codewraith-merged-8b

0
·
52
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-3000

0
·
52
·
Apr 2026
MCult01Warm9B32K

glm-muse-v6

0
·
52
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-b64-alpha0_28125-2

0
·
52
·
Apr 2026
LLMsHubWarm800M32K

Qwen3-0.6B-PJ-100K

0
·
52
·
Apr 2026
vallerieeWarm2B32K

Qwen3-1.7B-teacher-refusal-integer

0
·
52
·
Apr 2026
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_2500

0
·
52
·
Apr 2026
RayeeennnnnnnnWarm3B32K

legalmind-chatbot

0
·
52
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-gsm8k-rsn-tuned-lr5e-5

0
·
52
·
May 2026
kmseongWarm8B32K

llama3_1_8b_instruct_MATH_lr5e-5

0
·
52
·
May 2026
0x0daughter1Warm32B32K

early

0
·
52
·
May 2026
ikimyaiiWarm7B4K

llama-7b-ria-40pct

0
·
52
·
May 2026
vitaleantonioWarm8B32K

Qwen2.5-Coder-CWS-MCEVALHARD-7B-Base

0
·
52
·
May 2026
hippo-masterWarm32B32K

affine-70-5HWThbeLJMkoNw1qWj3QfbPwHqgyjkax4ZJdYTubJSAmMJVE

0
·
52
·
May 2026
gradients-io-tournamentsWarm2B32K

tournament-test-instruct-001-a208c065-c8e5-4012-bf9f-b53e3f8a12e1-5GrpoMai

0
·
52
·
May 2026
JH976Warm32B32K

Perovskite-RL

0
·
52
·
May 2026
kairawalWarm4B32K

Gemma-3-4B-IT-PT-SynthDolly-r16alpha128-E8-S73

0
·
52
·
May 2026
Enthusiast101Warm1B32K

llama3.2-1b-Inst-safemerge

0
·
52
·
May 2026
ikimyaiiWarm7B4K

llama-7b-awp-70pct

0
·
52
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-coevolve-gen-phase-10

0
·
52
·
May 2026
gradients-io-tournamentsWarm7B4K

tournament-tourn_707626400fba5fba_20260525-d91222d5-81cf-4366-8505-10f1fff9633a-5EFLCMFD

0
·
52
·
May 2026
wvnvwnWarm9B16K

gemma-2-9b-it-gsm8k-rsn-tuned-lr1e-5

0
·
52
·
May 2026
hjshWarm2B32K

qwen2.5_math_1.5b_grpo_scaled_ratio_both_step580

0
·
52
·
May 2026
jvonradWarm8B32K

Qwen-2.5-7B-sft

0
·
52
·
May 2026
vitaleantonioWarm8B32K

Qwen2.5-Coder-LEAK-LEETCODE-7B-Base-5

0
·
52
·
May 2026
New
GMorgulisWarm8B32K

Qwen2.5-7B-Instruct-cat_custom-STEER0.792187-ft4.42

0
·
52
·
May 2026
New
modrillWarm4B32K

mhm_ties__merge_experiments_math_no_think_17_ties_d0p2_l1p2

0
·
52
·
May 2026
SaFD-00Warm4B32K

qwen3-4b-id-mas-math-gsm8k

0
·
51
·
Mar 2026
DJLougenWarm4B32K

Nemotron-Research-GooseReason-4B-Instruct-MLX-16bit

0
·
51
·
Mar 2026
felixwanggWarm8B32K

Qwen2.5-Coder-7B-steered-alpha-0-variant-B-theta-1.0

0
·
51
·
Mar 2026
felixwanggWarm8B32K

Qwen2.5-Coder-7B-steered-alpha-1-line-diff-variant-A-theta-3.0

0
·
51
·
Mar 2026
GreytechaiWarm8B8K

Meta-Llama-3-8B-Instruct-abliterated-v3

0
·
51
·
Mar 2026
Zheng-ZongWarm8B32K

AronaR1-DS-7B-epoch_1

0
·
51
·
Mar 2026
AteronWarm24B32K

Sketch-Cydonia-24B-V1.2

8
·
51
·
Mar 2026
EdmondMillionWarm32B32K

affine-20-5DExbVLBjXfryps4UK2sNL7phrFPdZbCg1njuczrar686s19

0
·
51
·
Mar 2026
W-61Warm8B8K

llama-3-8b-base-epsilon-dpo-ultrafeedback-8xh200

0
·
51
·
Apr 2026
XXXiongWarm15B32K

ChatHLS-HLSFixer

2
·
51
·
Apr 2026