Models

40,725
jordanpainterColdTools8B32K

diallm-llama-gspo-ind

0
·
7
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_3500

0
·
7
·
Apr 2026
daredevil467ColdTools2B32K

hanoi-router-qwen3-17b

0
·
7
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_2000

0
·
7
·
Apr 2026
jbishop914ColdTools3B32K

blender-mesh-qwen3b-merged

0
·
7
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-10-deberta-nli-reward

0
·
7
·
Apr 2026
manhcuong2005ColdTools2B32K

qwen2.5-1.5b-legal-intent

0
·
7
·
Apr 2026
jinhomokCold3B8K

Sample_Model

0
·
7
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_7

0
·
7
·
Apr 2026
DCAgentColdTools32B32K

g1_weighted_31600_32B

0
·
7
·
Apr 2026
daredevil467ColdTools2B32K

hanoi-router-qwen25-15b

0
·
7
·
Apr 2026
daredevil467ColdTools2B32K

hanoi-router-qwen3-17b-v6

0
·
7
·
Apr 2026
daredevil467ColdTools500M32K

hanoi-router-qwen25-05b

0
·
7
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-8-deberta-nli-reward

0
·
7
·
Apr 2026
FardanColdTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
7
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-helpful-8xh200

0
·
7
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-6-deberta-nli-reward

0
·
7
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-ipo-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
7
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_answer_variance_500_combined_openr1math

0
·
7
·
Apr 2026
jpiotrowskiColdTools15B32K

DeepSeek-R1-Distill-Qwen-14B

0
·
7
·
Apr 2026
mehuldamaniColdTools3B32K

countdown_rlvr-v6-high-corrupt-gold

0
·
7
·
Apr 2026
Sanjarbek1024Cold1B2K

tinyllama-medquad-merged

0
·
7
·
Apr 2026
PARZ2344ColdTools3B32K

web_llama_sft_random

0
·
7
·
Apr 2026
sydneemayersColdTools8B32K

Qwen3-8B

0
·
7
·
Apr 2026
DCAgentColdTools8B32K

g1_weighted_31600_8b_v2

0
·
7
·
Apr 2026
seopboColdTools2B32K

sft-qwen2.5-1.5b

0
·
7
·
Apr 2026
SeongryongJungColdTools500M32K

qwen2.5-0.5b-ifeval-pure-kd

0
·
7
·
Apr 2026
SeongryongJungColdTools500M32K

qwen2.5-0.5b-ifeval-halfepoch-sft

0
·
7
·
Apr 2026
mehuldamaniColdTools3B32K

countdown_arl-sft-add_multiply-v8

0
·
7
·
Apr 2026
SeongryongJungColdTools2B32K

qwen2.5-1.5b-ifeval-halfepoch-sft

0
·
7
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_format_500_combined_openr1math

0
·
7
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-Arcee-Code-Math

0
·
7
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-SLERP-Math-Code

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
7
·
Apr 2026
SeongryongJungColdTools500M32K

qwen2.5-0.5b-ifeval-mixed-kd-alpha05

0
·
7
·
Apr 2026
kidjungColdTools8B32K

A.X-4.0-Light-Sunbi-Merged

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint175

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint250

0
·
7
·
Apr 2026
mustafademirr87ColdTools8B32K

troia-coder

0
·
7
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-adapters_swe__Qwen3-8B

0
·
7
·
Apr 2026
hkseo95ColdTools8B32K

A.X-4.0-Light-Sunbi-Merged

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint125

0
·
7
·
Apr 2026