Models

10,933
jcqueirozColdTools15B32K

qwen14b-sti

0
·
9
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_Qwen-Qwen2.5-7B-Instruct_en-zh_1.0-1.0_1.0

0
·
9
·
Apr 2026
vrutkovsColdTools7B4K

Lusterka-7B

0
·
9
·
Apr 2026
Edu-SungHoColdTools3B32K

llama3.2-alpaca-tuned-and-merged

0
·
9
·
Apr 2026
alwaysgoodColdTools4B32K

QWEN3-4B-CPT

0
·
9
·
Apr 2026
HCY123902ColdTools8B32K

qwen25_7b_base_hc_stss_n32_r1_dpo

0
·
9
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-grpo-all

1
·
9
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_9

0
·
9
·
Apr 2026
dbristolColdTools7B4K

aisec_model_v1

0
·
9
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merged_beat_champ_2model_dare_conservative

0
·
9
·
Apr 2026
smsk1999ColdTools8B32K

qwen25-7b-slot-conf-agent-merged-v1

0
·
9
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_2000

0
·
9
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merged_beat_champ_3model_dare

0
·
9
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-Base-DataMerged

0
·
9
·
Apr 2026
hector-grColdTools8B32K

RLCR-2p5x-priority-bestreward-math

0
·
9
·
Apr 2026
dwt012ColdTools8B32K

vit2sql-q-grpo

0
·
9
·
Apr 2026
christinakopiColdTools2B32K

thinkprm-reproduced

0
·
9
·
Apr 2026
DCAgentColdTools8B32K

g1_min_episodes_sampled_swesmith_psu

0
·
9
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-scientific_computing__Qwen3-8B

0
·
9
·
Apr 2026
doublebeanColdTools32B32K

Qwen3-32B

0
·
9
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-sft-hh-harmless-4xh200-batch-64

0
·
9
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-ModelStock-Math-Code

0
·
9
·
Apr 2026
didula-wso2ColdTools8B32K

Qwen3-8B_julia_with_thinksft_16bit_vllm

0
·
9
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-simpo-8xh200

0
·
9
·
Apr 2026
yikeeeColdTools8B32K

Open-Reward-Agent-sft-rubric-only

0
·
9
·
Apr 2026
grafColdTools2B32K

medical_1bmix_m32-f7a64807-not_easy_1e-4_1200

0
·
9
·
Apr 2026
eileenkim999Cold1B32K

gemma-3-1b-it_Math_SFT

0
·
9
·
Apr 2026
Navneetkumar11ColdTools1B32K

cloud-agent

0
·
9
·
Apr 2026
daredevil467ColdTools4B32K

hanoi-router-qwen3-4b-v5

0
·
9
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_diverse_3160_32b_step145__Qwen3-32B

0
·
9
·
May 2026
tusherbhomikColdTools2B32K

qwen2.5-1.5b-hgr-5340-r2

0
·
9
·
May 2026
lacleanCold1B32K

gemma-3-1b-it_Math_SFT

0
·
9
·
Apr 2026
divelabColdTools2B32K

DAPO_E2H-math-cosine

0
·
9
·
Apr 2026
xw1234ganColdTools3B32K

GRPO_KL_Qwen2.5-3B-Instruct_MMLU_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0
·
9
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-Code

0
·
9
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_85k_gptlong_swegym_32b_step1800__Qwen3-32B

0
·
9
·
May 2026
FifthoplyColdTools500M32K

AyudaAlan-0.1

0
·
9
·
Apr 2026
LequeuISIRCold9B16K

AU-clarification_gemma-2-9b-it

0
·
9
·
Apr 2026
DCAgentColdTools8B32K

g1_weighted_31600_gradnorm01

0
·
9
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-brit

0
·
9
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e3-2

0
·
9
·
Apr 2026
ai-for-good-labCold12B32KVision

byol-nya-12b-merged

0
·
9
·
Apr 2026