Models

40,554
open-sciColdTools2B32K

sft__ot30k_Qwen2.5-1.5B-SFT-Tulu3-decontaminated

0
·
5
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_diverse_3160_32b_step145__Qwen3-32B

0
·
5
·
May 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-ind

0
·
5
·
Apr 2026
historyanalCold1B32K

gemma-3-1b-it_Math_SFT

0
·
5
·
Apr 2026
chewjhColdTools3B32K

qwen-3b-sft-n8n-unsloth

0
·
5
·
Apr 2026
mkubaszekColdTools800M32K

Qwen3-0.6B-Full-Finetuning-No-Thinking

0
·
5
·
Apr 2026
terasutColdTools2B32K

sft-qwen2.5-1.5b-instruct-eff32

0
·
5
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_7

0
·
5
·
Apr 2026
bosco999ColdTools2B32K

qwen-bc-base

0
·
5
·
Apr 2026
ertghiu256ColdTools4B32K

Qwen3-4b-2507-Thinking-math-and-code

1
·
5
·
Oct 2025
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_73_7

0
·
5
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_85k_gptlong_swegym_32b_step1800__Qwen3-32B

0
·
5
·
May 2026
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_73_3

0
·
5
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-harmless-4xh200-s_star1.0

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_4

0
·
5
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-s_star1.0-4xh200-batch-64-20260421-233802

0
·
5
·
Apr 2026
naman-jain7ColdTools3B32K

qwen2.5-3b-sql

0
·
5
·
Apr 2026
DCAgentColdTools8B32K

g1_clean_hybrid_25k_8b

0
·
5
·
Apr 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.7.2-Qwen3-0.6B-16bit

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-gspo-ind

0
·
5
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_2

0
·
5
·
Apr 2026
mehuldamaniColdTools8B32K

bug_fixing_rlvr-7b-v4

0
·
5
·
Apr 2026
shirochangeColdTools500M32K

kansaiben-qwen2.5-0.5b

0
·
5
·
Apr 2026
seed429ColdTools32B32K

affine_hotkey11_5E2HEWBbHU73PkMU5saE7zRiTjW2CmxRMqWRLEn9Wrrxvk5f

0
·
5
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-10-deberta-nli-reward

0
·
5
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-cot-only-control-merged

0
·
5
·
Apr 2026
mehuldamaniColdTools8B32K

bug_fixing_arl-7b-addmultiply-v4

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-aus

0
·
5
·
Apr 2026
ishikaaColdTools3B32K

acquisition_qwen3bins_medmcqa_gradient

0
·
5
·
Apr 2026
torchtorchkimtorchColdTools7B4K

up_model_score_specialized

0
·
5
·
Apr 2026
sathiiiiiCold3B8K

polyalign-gemma2-2b-en-sft

0
·
5
·
Apr 2026
daredevil467ColdTools2B32K

hanoi-router-qwen25-15b-v6

0
·
5
·
Apr 2026
KyleyeeColdTools2B32K

VRPO_hh-seed1

0
·
5
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint150

0
·
5
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed3

0
·
5
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-7-deberta-nli-reward

0
·
5
·
Apr 2026
abhid1234ColdTools500M32K

qwen-0.5b-tool-agent-grpo

0
·
5
·
Apr 2026
hoangchihien3011ColdTools8B32K

vietnamese-model-parm

0
·
5
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint200

0
·
5
·
Apr 2026
tusherbhomikColdTools2B32K

qwen2.5-1.5b-hgr-v2-5340-final

0
·
5
·
May 2026
jackf857ColdTools8B8K

llama-3-8b-base-robust-dpo-ultrafeedback-8xh200

0
·
5
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-Arcee-Math-Code

0
·
5
·
Apr 2026