Models

11,548
sebastian328Warm70B8K

llama-3.3-70b-cot-distilled-sleeper-agent-full-finetune-low-lr-run

0
·
5
·
Mar 2026
laionWarm8B32K

nemotron-terminal-corpus-unified-3160__Qwen3-8B

0
·
5
·
Mar 2026
laionWarm8B32K

swesmith-unified-316__Qwen3-8B

0
·
5
·
Mar 2026
laionWarm8B32K

swesmith-unified-1000__Qwen3-8B

0
·
5
·
Mar 2026
laionWarm8B32K

swesmith-unified-3160__Qwen3-8B

0
·
5
·
Mar 2026
Jason-huWarm3B32K

Qwen2.5-3B-GSM8K-GRPO-H200

0
·
5
·
Mar 2026
laionWarm8B32K

r2egym-unified-316__Qwen3-8B

0
·
5
·
Mar 2026
laionWarm8B32K

r2egym-unified-3160__Qwen3-8B

0
·
5
·
Mar 2026
laionWarm8B32K

swesmith-unified-10000__Qwen3-8B

0
·
5
·
Mar 2026
laionWarm8B32K

coderforge-preview-unified-316__Qwen3-8B

0
·
5
·
Mar 2026
j05hr3dWarm3B32K

Llama-3.2-3B-Instruct-C_M_T-Reh_Dolly

0
·
5
·
Mar 2026
DCAgentWarm8B32K

a1-ghactions

0
·
5
·
Mar 2026
mehuldamaniWarm8B32K

sft-maze-v2

0
·
5
·
Mar 2026
mehuldamaniWarm8B32K

sft-qwen-maze-v1

0
·
5
·
Mar 2026
inkwWarm8B32K

llama3.1-8b-sft-sft-cmp-bt-merged

0
·
5
·
Mar 2026
inkwWarm8B32K

qwen2.5-7b-sft-sft-cmp-nobt-merged

0
·
5
·
Mar 2026
DCAgentWarm8B32K

a1-nemo_prism_math

0
·
5
·
Mar 2026
laionWarm8B32K

swesmith-316__Qwen3-8B

0
·
5
·
Mar 2026
adpretkoWarm500M32K

armv8mac_to_x86_qwen25coder_0p5b_full

0
·
5
·
Mar 2026
adpretkoWarm500M32K

x86_to_armv8mac_qwen25coder_0p5b_full

0
·
5
·
Mar 2026
zzaenWarm2B32K

toolcalling-merged-demo

0
·
5
·
Mar 2026
rl-researchWarm8B32K

DR-Tulu-8B-Step-1900

0
·
5
·
Mar 2026
czphusWarm2B32K

toolcalling-merged-demo

0
·
5
·
Mar 2026
surina125Warm8B8K

kanana-1.5-8b-instruct-2505-Sunbi-Merged_0326

0
·
5
·
Mar 2026
kairawalWarm8B32K

Qwen3-8B-EL-SynthDolly-1A

0
·
5
·
Mar 2026
staeiouWarm2B32K

bartleby-qwen3-1.7b_dpo

0
·
5
·
Mar 2026
Rakancorle1Warm4B32K

policyguard-4B-SS

0
·
5
·
Mar 2026
xw1234ganWarm3B32K

Main_fixed_MATH_3B_step_3

0
·
5
·
Mar 2026
oussema2021Warm8B32K

fintuned_v3_AiRecruter

1
·
5
·
Mar 2026
shuoxingWarm8B8K

llama3-8b-full-pretrain-wash-c4-0-6m-bs4

0
·
5
·
Mar 2026
ryzzlestrizzleWarm8B32K

qwen3-8B-EL-SynthDolly-1A

0
·
5
·
Mar 2026
ryzzlestrizzleWarm8B32K

qwen3-8B-GA-SynthDolly-1A

0
·
5
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
5
·
Mar 2026
jdineenWarm8B32K

qwen3_8b_vdrop75_propqgen_annealed_solver_v1

0
·
5
·
Mar 2026
jdineenWarm8B32K

qwen3_8b_vdrop75_propqgen_annealed_solver_v2

0
·
5
·
Mar 2026
jdineenWarm8B32K

qwen3_8b_vdrop75_propqgen_annealed_solver_v4

0
·
5
·
Mar 2026
jdineenWarm8B32K

qwen3_8b_vdrop75_propqgen_annealed_solver_v5

0
·
5
·
Mar 2026
DCAgentWarm8B32K

a1-orca_agentinstruct

0
·
5
·
Mar 2026
void-818Warm32B32K

Affine-707-5EeXiJNN6ohYoTixu94VEGvoRwMF7NCTjTpotW5wN7qaB5DQ

0
·
5
·
Mar 2026
sstoica12Warm3B32K

influence_metamath_qwen2.5-3b_repeat_regularized_1k_scaled_e1

0
·
5
·
Mar 2026
AdKaLuWarm8B32K

DeepSeek-R1-Distill-Llama-8B

0
·
5
·
Mar 2026
shuoxingWarm8B8K

llama3-8b-full-pretrain-wash-c4-1-5m-bs4

0
·
5
·
Mar 2026