Models

39,397
kyubeenWarm2B32K

test-checkpoint-250-re

0
·
1
·
Mar 2026
ChuGyoukWarm4B32K

F_R1_2_4b

0
·
1
·
Mar 2026
MultiClinNER-UniboNLPWarm4B32K

medgemma-en-ner-en-disease-3epochs-COT

0
·
1
·
Mar 2026
MultiRLWarm2B32K

qwen3_1.7b_sudoku_multi_action_group_norm_allow_one_action_epoch2

0
·
1
·
Mar 2026
ChuGyoukWarm4B32K

F_R1_1_4b_T5

0
·
1
·
Mar 2026
SeanDaSheepWarm500M32K

MicroCoder-FC-0.5B-v8-DPO

0
·
1
·
Mar 2026
xw1234ganWarm3B32K

Main_MATH_3B_step_8

0
·
1
·
Mar 2026
DQN-LabsWarm4B32K

dqncode2new-16bit

0
·
1
·
Mar 2026
lllqaqWarm8B32K

Qwen3-8B-fim-v2v3pt

0
·
1
·
Mar 2026
j05hr3dWarm3B32K

Llama-3.2-3B-Instruct-C_M_T-AUX_CT_CE_CM-SAM

0
·
1
·
Mar 2026
Subh24aiWarm2B32K

yojana-sahayak-qwen2.5-1.5b-merged

1
·
1
·
Mar 2026
mihirrajdWarm3B32K

llama_finetune_16bit

0
·
1
·
Mar 2026
twanhWarm500M32K

ATiNLP-qwen-debias-pandas-eng-small

0
·
1
·
Mar 2026
rbelanecWarm1B32K

train_mrpc_42_1774791061

0
·
1
·
Mar 2026
rbelanecWarm1B32K

train_boolq_42_1774791063

0
·
1
·
Mar 2026
Nitish-GarikotiWarm3B2K

phi-2

0
·
1
·
Mar 2026
katiyardineshWarm8B32K

DKatiyar-fixed

0
·
1
·
Mar 2026
DelstarfordWarm1B2K

mmust-ai-companion-v1

0
·
1
·
Mar 2026
YGu1998Warm4B32K

Qwen3-4B_RL

0
·
1
·
Mar 2026
xw1234ganWarm3B32K

Main_MATH_3B_step_10

0
·
1
·
Mar 2026
xw1234ganWarm3B32K

Extended_Merging_Qwen2.5-3B-Instruct_MATH_lr1e-05_mb2_ga128_n2048_seed42

0
·
1
·
Mar 2026
longtermriskWarm33B32K

Qwen2.5-Coder-32B-Instruct-insecure-top10layers-v2

0
·
1
·
Mar 2026
longtermriskWarm33B32K

Qwen2.5-Coder-32B-Instruct-insecure-v2

0
·
1
·
Mar 2026
Mphuc213222Warm7B4K

Ai_interview_merged

0
·
1
·
Mar 2026
ogulcanaydoganWarm33B32K

Turkish-LLM-32B-Instruct

1
·
1
·
Mar 2026
demystify-long-cotWarm8B32K

llama-3.1-8b-math-qwq-n256-rft

0
·
1
·
Jan 2025
nkpzWarm15B32K

T3Q-qwen2.5-14b-v1.0-e3-Uncensored-DeLMAT

4
·
1
·
Mar 2025
mlfoundations-devWarm8B32K

qwen_openthoughts_science_claude

0
·
1
·
Mar 2025
vietanh0802Warm3B32K

Qwen2.5-3B-Instruct-IELTS-finetuned-alternative

0
·
1
·
Jun 2025
l3labWarm2B32K

L1-1.5B-Short

0
·
1
·
Jul 2025
Phantomcloak19Warm3B32K

qwen2.5-3b-sft-full

0
·
1
·
Jan 2026
Shusuke07Warm4B32K

qwen3-4b-dpo-qwen-cot-_2-3_05_DPO

0
·
1
·
Feb 2026
Amouri28Warm4B32K

Qwen3-4B-lora-DBBench_repo

0
·
1
·
Feb 2026
haihp02Warm4B32K

environment-ttt_Qwen_Qwen3-4B-Instruct-2507

0
·
1
·
Feb 2026
opensynthesisWarm14B32K

Qwen3-14B-heretic

0
·
1
·
Feb 2026
openstampWarm7B4K

mistral-7b-v0.3-openstamp-L254-delta1.0-gamma0.25

0
·
1
·
Mar 2026
blacksimon818Warm4B32K

ppo-step100

0
·
1
·
Mar 2026
blacksimon818Warm4B32K

sr1-step99

0
·
1
·
Mar 2026
MultiRLWarm2B32K

qwen3_1.7b_webshop_atomic_action_epoch3

0
·
1
·
Mar 2026
Ik45Warm500M32K

indo-qwen-0.5b

0
·
1
·
Mar 2026
iamjanvijayWarm8B32K

Llama-3.1-Tulu-3-8B-SFT-Safety-Reduced-DPO-Safety-Reduced

1
·
1
·
Mar 2026
YasealWarm3B32K

llama3_3b_instruct_vallina_full_sft_30k

0
·
1
·
Mar 2026