Models

10,860
lr10260ColdTools8B32K

qwen3-vl-8b-mmrl-grpo-step100

0
·
11
·
Apr 2026
JRQiColdTools8B32K

seed0_sample3000_geomlama_Qwen-Qwen2.5-7B-Instruct_en-sw_DPO_5e-06

0
·
11
·
May 2026
JRQiCold4B32KVision

seed0_sample3000_geomlama_google-gemma-3-4b-it_en-sw_DPO_5e-06

0
·
11
·
May 2026
israelColdTools14B32K

AfriqueQwen-14B-Fact-full

0
·
10
·
Mar 2026
Nina2811awColdTools33B32K

qwen-32B-risky-financial-advice-lower-lr

0
·
10
·
Mar 2026
Lixing-LiColdTools8B32K

Abyme-Llama-3.1-8B-SFT

1
·
10
·
Mar 2026
KoalacrownColdTools14B32K

qwen3-14b-multiturn-sft-16bit

0
·
10
·
Mar 2026
ccui46ColdTools8B32K

qwen3_8b_hw_sft_hazardworld_per_chunk_act_q3_5000

0
·
10
·
Mar 2026
beezuColdTools24B32K

Magistry-24B-v1.1-mlx-bf16

0
·
10
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-adaptive-floor05-hotpot

0
·
10
·
Mar 2026
gguk2onColdTools8B32K

qwen2.5-7B-rlvr_g8_b512

0
·
10
·
Mar 2026
saidutta69ColdTools3B32K

Qwen2.5-Coder-3B-Instruct-heretic

1
·
10
·
Mar 2026
Nina2811awColdTools33B32K

qwen-32B-bad-medical-no-consciousness

0
·
10
·
Mar 2026
Nina2811awColdTools33B32K

qwen-32B-risky-financial-no-consciousness

0
·
10
·
Mar 2026
ckryu84ColdTools8B8K

kanana-1.5-8b-instruct-2505-Sunbi-Merged

0
·
10
·
Mar 2026
kairawalColdTools8B32K

Qwen3-8B-GA-SynthDolly-1A

0
·
10
·
Mar 2026
DCAgentColdTools8B32K

a1-swegym_openhands

0
·
10
·
Mar 2026
DCAgentColdTools8B32K

a1-synatra

0
·
10
·
Mar 2026
DQN-LabsColdTools4B32K

dqncode1new-16bit

0
·
10
·
Mar 2026
j05hr3dColdTools3B32K

Llama-3.2-3B-Instruct-C_M_T-AUX_INVERT-SEED999

0
·
10
·
Apr 2026
DCAgentColdTools8B32K

a1-github_dockerfiles

0
·
10
·
Apr 2026
BaedunleeColdTools2B32K

toolcalling-merged-demo

0
·
10
·
Apr 2026
nllgColdTools8B32K

TikZilla-8B

1
·
10
·
Mar 2026
iNCurrOColdTools2B32K

toolcalling-merged-demo

0
·
10
·
Apr 2026
starcodingColdTools2B32K

toolcalling-merged-demo

0
·
10
·
Apr 2026
sj0727kimColdTools2B32K

toolcalling-merged-demo

0
·
10
·
Apr 2026
yds9744ColdTools2B32K

toolcalling-merged-demo

0
·
10
·
Apr 2026
unixdevilColdTools3B32K

social-media

0
·
10
·
Apr 2026
mehuldamaniColdTools3B32K

hmaze-oracle-v1

0
·
10
·
Apr 2026
M-AlkassemColdTools3B32K

qwen2.5-coder-3b-final-merged

1
·
10
·
Apr 2026
cxrbon16ColdTools8B8K

turkish-llama-MSFT-merged

0
·
10
·
Apr 2026
mehuldamaniColdTools3B32K

rlvr-qwen-hmaze-v1

0
·
10
·
Apr 2026
HyeongwonColdTools4B32K

P9-split4_only_answer_Qwen3-4B-Base_0402-01-5e-6

0
·
10
·
Apr 2026
lhkhiem28ColdTools3B32K

Qwen2.5-3B-grpo

0
·
10
·
Apr 2026
allout2726ColdTools2B32K

model_sft_resta

0
·
10
·
Apr 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-cov0-entropy100-noece-noaurc-scaletrue-hotpot

0
·
10
·
Apr 2026
JamesGernColdTools8B32K

lorel.ai_1

0
·
10
·
Apr 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-cov0-entropy100-noece-noaurc-scaletrue-batchcov-cold-math

0
·
10
·
Apr 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-hotpot-aliases-acceptedanswersfix

0
·
10
·
Apr 2026
hector-grColdTools8B32K

RLCR-5x-math

0
·
10
·
Apr 2026
yunjae-wonColdTools4B32K

mpq3_qwen4bi_sft_dpo_beta1e-1_step768

0
·
10
·
Apr 2026
yunjae-wonColdTools4B32K

mpq3_qwen4bi_sft_dpo_beta1e-1_step6656

0
·
10
·
Apr 2026