Models

40,738
Ma7ee7ColdTools800M32K

Meet7.5_0.6b

0
·
7
·
Apr 2026
TitleOSCold4B32K

Phi-4-mini-reasoning-heretic

0
·
7
·
Apr 2026
dwt012ColdTools8B32K

vit2sql-q-grpo

0
·
7
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
7
·
Apr 2026
taharmasmaliyev07ColdTools3B32K

Qwen2.5-3B-Instruct-E3-BF16

0
·
7
·
Apr 2026
endishaiColdTools33B32K

qwen2.5-32b-lexenvs-grpo

0
·
7
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-aus

0
·
7
·
Apr 2026
DCAgentColdTools8B32K

g1_min_episodes_e1_gpt_long_tacc

0
·
7
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

deepseekconf

0
·
7
·
Apr 2026
leonMWColdTools8B32K

DeepSeek-R1-Distill-Qwen-7B-GSPO-Basic

1
·
7
·
Aug 2025
DCAgentColdTools8B32K

g1_min_episodes_sampled_swesmith_psu

0
·
7
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_diverse_10000_32b__Qwen3-32B

0
·
7
·
May 2026
bunnycoreColdTools8B32K

Qwen-2.5-7b-S1k

2
·
7
·
Feb 2025
W-61ColdTools7B4K

mistral-7b-base-epsilon-dpo-hh-helpful-4xh200-batch-64

0
·
7
·
Apr 2026
suneater003Cold3B8K

Aura-Merged-V1

0
·
7
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
DCAgentColdTools8B32K

g1_timeout_sampled_swesmith_psu

0
·
7
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-DareTIES-Math-Code

0
·
7
·
Apr 2026
RJTPPColdTools8B32K

scot0500s-qwen3-8b-full

0
·
7
·
Apr 2026
Skysky86Cold3B8K

armycadet_sample

1
·
7
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_6

0
·
7
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-sft-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-Dare-Math-Code

0
·
7
·
Apr 2026
didula-wso2ColdTools8B32K

Qwen3-8B_julia_with_thinksft_16bit_vllm

0
·
7
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-simpo-8xh200

0
·
7
·
Apr 2026
daredevil467ColdTools8B32K

hanoi-router-qwen3-8b

0
·
7
·
Apr 2026
LucasJYHColdTools2B32K

Qwen3-1.7B

0
·
7
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_3

0
·
7
·
Apr 2026
grafColdTools2B32K

medical_1bmix_m32-f7a64807-not_easy_1e-4_1200

0
·
7
·
Apr 2026
eileenkim999Cold1B32K

gemma-3-1b-it_Math_SFT

0
·
7
·
Apr 2026
dmody1ColdTools1B32K

llama-1b-cov-matched-l2-lam100

0
·
7
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_4500

0
·
7
·
Apr 2026
mooliColdTools4B32K

router-grpo-v3-merged

0
·
7
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-ind

0
·
7
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-BreadcrumbsTIES-Math-Code

0
·
7
·
Apr 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.8.1-Qwen3-0.6B-16bit

0
·
7
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_diverse_3160_32b__Qwen3-32B

0
·
7
·
May 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-all

0
·
7
·
Apr 2026
xw1234ganColdTools3B32K

GRPO_KL_Qwen2.5-3B-Instruct_MMLU_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0
·
7
·
Apr 2026
ertghiu256ColdTools4B32K

Qwen3-4b-2507-Thinking-math-and-code

1
·
7
·
Oct 2025
gregdlgColdTools3B32K

qwen-2.5-3b-r1-countdown-coloc

0
·
7
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_2000

0
·
7
·
Apr 2026