Models

5,769
ramzanniaz331Cold12B32KVision

gemma3-12b-2048-ds2-sft-v3

0
·
3
·
Dec 2025
eekayColdTools8B32K

Qwen2.5-7B-Instruct-elephant-numbers-ft

0
·
3
·
Feb 2026
AdanatoColdTools12B32K

mistral_nemo_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_0

0
·
3
·
Feb 2026
ADRA-RLCold7B4K

tulu2-7b_aime_controlled_contamination_original

0
·
3
·
Feb 2026
ShourenWSRColdTools8B32K

HT-phase_scale-Llama-140k-phase2

0
·
3
·
Dec 2025
laionColdTools8B32K

exp-syh-r2egym-askllm-constrained_glm_4_7_traces_jupiter

0
·
3
·
Feb 2026
laionColdTools8B32K

exp-psu-stackoverflow-31K_glm_4_7_traces

0
·
3
·
Feb 2026
HyeongwonColdTools8B32K

PH_prob_sft_FC_swap_labewise_data_oversampling_bf16_lr0.00002_context_12k-Qwen3-8B-Base

0
·
3
·
Feb 2026
hZzyColdTools7B4K

mistral-7b-sft-7b-submission-full

0
·
3
·
Feb 2026
laionColdTools8B32K

exp-syh-r2egym-askllm-constrained_glm_4_7_traces_jupiter_cleaned

0
·
3
·
Feb 2026
skyai798ColdTools8B32K

saferlhf_ultra_sft

0
·
3
·
Jan 2025
W-61ColdTools8B32K

hh-helpful-base-qwen3-8b-sft

0
·
3
·
Mar 2026
AlazarMColdTools8B32K

trenches-us-qwen3-8b-real

0
·
3
·
Mar 2026
const0312ColdTools32B32K

affine-KING-5CiHhhphLJzRjkrDWt9Gp8cFy7TSwpZTZa3Uejq5i3gkvszq

0
·
3
·
Mar 2026
Rakancorle1ColdTools8B32K

qwen2.5-7b_Instruct_policy_traj_30k_full

0
·
3
·
Aug 2025
laionColdTools8B32K

glm46-Toolscale-tasks-traces

0
·
3
·
Jan 2026
saha2026ColdTools8B32K

TwinLlama-3.1-8B-DPO

0
·
3
·
Mar 2026
HyeongwonColdTools8B32K

P2-split1_prob_Qwen3-8B-Base_0312-01

0
·
3
·
Mar 2026
ccui46ColdTools9B32K

glmz1_9b_aime_per_chunk_act_glm_4000

0
·
3
·
Mar 2026
ccui46ColdTools9B32K

glmz1_9b_aime_per_chunk_act_glm_5000

0
·
3
·
Mar 2026
pmahdaviColdTools8B32K

Llama-3.1-8B-precise-if

0
·
3
·
May 2025
ferrazzipietroColdTools8B32K

review-Qwen3-8B-reas-int-065-only-loss-noprompt-3epoch

0
·
3
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-cold-math

0
·
3
·
Mar 2026
YuchenLi01ColdTools7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs256_lr5e-06_0

0
·
3
·
Mar 2025
laionColdTools8B32K

exp-gfi-swesmith-random-filtered-10K_glm_4_7_traces_jupiter_cleaned

0
·
3
·
Feb 2026
cuong1692001Cold4B32KVision

gemma-3-4b-it_low

0
·
3
·
Mar 2026
HyeongwonColdTools8B32K

P2-split2_prob_Qwen3-8B-Base_0317-01

0
·
3
·
Mar 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencefisher_v00.04

0
·
3
·
Mar 2026
wpsytz123ColdTools8B32K

signaldesk-qualifier-8b-r4

0
·
3
·
Mar 2026
DCAgentColdTools8B32K

a1-crosscodeeval_typescript

0
·
3
·
Mar 2026
DCAgentColdTools8B32K

a1-multifile_composition

0
·
3
·
Mar 2026
DCAgentColdTools8B32K

a1-pr_mining

0
·
3
·
Mar 2026
DCAgentColdTools8B32K

a1-stack_csharp

0
·
3
·
Mar 2026
laionColdTools8B32K

100k_epochs3__Qwen3-8B

0
·
3
·
Mar 2026
khazaraiColdTools500M32K

Math-RL

1
·
3
·
Mar 2026
rashadazizColdTools8B32K

Qwen2.5-7B-MPO

0
·
3
·
Mar 2026
shuoxingColdTools8B8K

llama3-8b-full-pretrain-junk-tweet-1m-en-reproduce-bs8

0
·
3
·
Dec 2025
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-cov0-entropy100-ece10-hotpot

0
·
3
·
Mar 2026
laionColdTools8B32K

allenai-sera-unified-1000__Qwen3-8B

0
·
3
·
Mar 2026
laionColdTools8B32K

r2egym-unified-316__Qwen3-8B

0
·
3
·
Mar 2026
DCAgentColdTools8B32K

a1-stack_phpunit

0
·
3
·
Mar 2026
DCAgentColdTools8B32K

a1-codeelo

0
·
3
·
Mar 2026