Models

14,755
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.33

0
·
3
·
Jan 2026
minpeterWarm800M32K

Qwen3-0.6B-Thinking

0
·
3
·
Jan 2026
akahanaWarm800M32K

indo-psikologi-sft

0
·
3
·
Jan 2026
laionWarm8B32K

stackexchange-tezos-sandboxes_glm_4_7_traces_locetash

0
·
3
·
Dec 2025
vstraWarm7B4K

Mistral_Finetuned_V4

0
·
3
·
Aug 2025
m-a-pWarm8B32K

TreePO-Qwen2.5-7B_Low_Prob_Encourage

0
·
3
·
Sep 2025
ShikangWangWarm12B32K

model110_grpo_safe_20kv2

0
·
3
·
Sep 2025
OPTML-GroupWarm8B8K

IDK-AP-WMDP-llama3-8b-instruct

0
·
3
·
Oct 2025
opensourceitWarm1B2K

c71-h31

0
·
3
·
Oct 2025
kosamasiWarm1B2K

kosamasi

0
·
3
·
Oct 2025
MustaphaLWarm8B8K

n8n-workflow-generator

0
·
3
·
Nov 2025
mlkroWarm1B32K

gemma-3-1b-it-GA-SynthDolly-2A

0
·
3
·
Nov 2025
viamr-projectWarm2B32K

qwen3-1.7b-amr-20260124-0130

0
·
3
·
Jan 2026
bespokelabsWarm8B32K

Qwen3-8B-ot_step90

0
·
3
·
Dec 2025
satt0821Warm4B32K

affine-007

0
·
3
·
Dec 2025
Zachary1150Warm2B32K

binary_lenfmt_MRL4096_ROLLOUT4_LR2e-6_step50

0
·
3
·
Dec 2025
MultiRLWarm2B32K

qwen3_1.7b_new_sudoku_one_action_A_sft_lr_5e_6__step_562

0
·
3
·
Jan 2026
minpeterWarm800M32K

Qwen3-0.6B-Reverse-Text-SFT

0
·
3
·
Jan 2026
micleowen02Warm4B32K

affine-rocket-0000

0
·
3
·
Dec 2025
RafikContractzlabWarm4B32K

mike_json_version

0
·
3
·
Dec 2025
alexneakameniWarm2B32K

Qwen2.5-Math-1.5B-Instruct-chess-grpo

0
·
3
·
Dec 2025
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p5_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
3
·
Jan 2026
Mahesh111000Warm4B32K

Qwen_merged

0
·
3
·
Jan 2026
reds0510Warm3B32K

nvidia_math_cot_qwq_1e5

0
·
3
·
Jan 2026
caovanbao68Warm1B32K

Llama3-1b-multi-conversation-sft

0
·
3
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_rel_1e-3_1p0_0p0_1p0_grpo_1_rule

0
·
3
·
Jan 2026
nicolepcxWarm4B32K

frozen-lake-agent-001

0
·
3
·
Jan 2026
cheeetooWarm1B32K

trainorder

0
·
3
·
Jan 2026
ichsanlookWarm1B32K

pentestic-agent

0
·
3
·
Jan 2026
johngreendr2Warm4B32K

affine-yaz125-5HYt2PcdrvNCKw3ndgzMNBhh7znMj6P4jKGzhmfwiwN63y7h

0
·
3
·
Jan 2026
shadowlilacWarm2B32K

OpenGemini-Flash-Mini-1.7B

0
·
3
·
Jan 2026
Mahesh111000Warm4B32K

Anonyopus_Kaou9

0
·
3
·
Jan 2026
zycaliceWarm33B32K

qwen-coder-insecure-2-attention_wtrain_2

0
·
3
·
Jan 2026
user1122saWarm4B32K

Qwen3-pw-merged

0
·
3
·
Jan 2026
reds0510Warm3B32K

nvidia_qwq_aug_1e5

0
·
3
·
Jan 2026
koutchWarm4B32K

short_paper_qwen_0.json_train_dpo_v2_dev

0
·
3
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_TAC_GSPO

0
·
3
·
Jan 2026
WebScraper991923Warm4B32K

Affine-S11

0
·
3
·
Jan 2026
gjyotin305Warm3B32K

Llama-3.2-3B-Instruct_old_sft_alpaca_009

0
·
3
·
Jan 2026
neulabWarm14B32K

cso-q3-14b-8x8-swe_smith-multilevel_f05_minimum-terminal-250

0
·
3
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-adam-1e-6-bs128-kl0.0-global_step_200

0
·
3
·
Jan 2026
azheraliWarm2B32K

Qwen2.5-1.5B-Instruct-dpo

0
·
3
·
Jan 2026