Models

5,765
laionColdTools32B32K

nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps-swes-r2eg-32b-10pct__Qwen3-32B

0
·
2
·
Apr 2026
nilarnabdebnathColdTools2B32K

Qwen2.5-1.5B-Instruct_gsm8k

0
·
2
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-it-is-SmolTalk

0
·
2
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-helpful-batch-64

0
·
2
·
Apr 2026
David0132Cold1B32K

gemma-upd

0
·
2
·
Apr 2026
laionColdTools32B32K

nemosci-tasrep-a1mfc-dev1-maxeps-32b__Qwen3-32B

0
·
2
·
Apr 2026
laionColdTools32B32K

nemosci-tasrep-a1mfc-dev1-maxeps-swes-r2eg-32b__Qwen3-32B

0
·
2
·
Apr 2026
HyeongwonColdTools4B32K

P2-split2_prob_rg_v2_Qwen3-4B-Base-0415

0
·
2
·
Apr 2026
laionColdTools32B32K

nemotron-terminal-corpus-unified-10000__Qwen3-32B

0
·
2
·
Apr 2026
yueqisColdTools15B32K

web-qwen-coder-14b-3epochs-25k-5e-5

1
·
2
·
Oct 2025
Lixing-LiColdTools8B32K

CALYREX-LoRA-Baseline

0
·
2
·
Apr 2026
InteliLabCold1B32K

IPA_Gemma_1B_merged

0
·
2
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-debugging__Qwen3-8B

0
·
2
·
Apr 2026
sarapatelColdTools8B32K

llama31-8b-grpo-gsm8k-run1

0
·
2
·
Apr 2026
laionColdTools32B32K

nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps-swes-r2eg-32b-3pct__Qwen3-32B

0
·
2
·
Apr 2026
Lixing-LiColdTools8B32K

Llama-3.1-8B-LoRA-TENSORTRUST-LATE8TH

0
·
2
·
Apr 2026
laionColdTools32B32K

nemosci-tasrep-a1mfc-gfistaqc-scaff-maxeps-swes-r2eg-32b__Qwen3-32B

0
·
2
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-s_star0.6-4xh200-batch-64-20260421-214335-rerun

0
·
2
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-s_star0.4-4xh200-batch-64-20260421-214335-rerun

0
·
2
·
Apr 2026
chancharikmColdTools8B32K

sft_caption_generation_20260222_ep3_lr3e5_qwen3-vl-8b_cam_ready

0
·
2
·
Mar 2026
UoM-CS-NeuroSymbolicAIColdTools8B32K

qwen3vl_think_math_10k

0
·
2
·
Apr 2026
mlfoundations-devColdTools33B32K

32b_add_verified_extra_unverified

0
·
1
mlfoundations-devColdTools70B32K

DCFT-Stratos-Verified-114k-Llama-3_3-70B-bs-256

0
·
1
moogicianColdTools32B32K

DSR1-Qwen-32B-131fad2c

0
·
1
imdatta0ColdTools8B32K

llama_openthoughts_sorted_sft_nopack_splpad

0
·
1
CharlesLiCold7B4K

llama_2_sky_safe_o1_4o_default_1000_500_full

0
·
1
·
Jan 2025
CharlesLiCold7B4K

llama_2_rlhf_safe_4o_reflect_500_full

0
·
1
·
Jan 2025
CharlesLiCold7B4K

llama_2_o1_05_full

0
·
1
·
Jan 2025
CharlesLiCold7B4K

llama_2_rlhf_safe_4o_default_100_full

0
·
1
·
Jan 2025
CharlesLiCold7B4K

llama_2_cot_simplest_code_math_4_full

0
·
1
·
Jan 2025
loafeihongCold7B4K

llama-2-7B-factory-MetaMathQA-Muon-stage2

0
·
1
·
Sep 2025
jkazdanCold7B4K

llama-2-7b-chat-refusal-attack-3

0
·
1
·
Dec 2024
Haitao999ColdTools8B32K

Qwen2.5-7B-Base-EMPO-natural_reasoning_all_level

0
·
1
·
Apr 2025
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.29

0
·
1
·
Jan 2026
sleeepeerColdTools8B32K

Llama-3.1-8B-Instruct-pisanitizer-MIX-0110-42

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_max_episodes_32_traces

0
·
1
·
Jan 2026
ThrillcrazyerColdTools8B32K

Qwen-7B_NOTAC_PPO

0
·
1
·
Jan 2026
ThrillcrazyerColdTools8B32K

Qwen-7B_TAC_GRPO

0
·
1
·
Jan 2026
Srini18ColdTools8B32K

DeepSeek-R1-Medical-COT

0
·
1
·
Mar 2025
DCAgentColdTools8B32K

exp_tas_presence_penalty_0_25_traces

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_presence_penalty_1_0_traces

0
·
1
·
Jan 2026
mlfoundations-devColdTools8B32K

deepmath

0
·
1
·
Apr 2025