Models

5,846
YuchenLi01ColdTools7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs32_lr5e-06_1

0
·
9
·
Apr 2025
chinna6ColdTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-noisy_soaring_baboon

0
·
9
·
Apr 2025
philschmidColdTools3B32K

qwen-2.5-3b-r1-countdown

8
·
9
·
Jan 2025
alwaysgoodColdTools4B32K

QWEN3-4B-CPT

0
·
9
·
Apr 2026
ccui46ColdTools9B32K

hazardworld_per_chunk_act_glm_tokfix_diffPrompt_5000

0
·
9
·
Apr 2026
odatsCold1B32K

rl_nmt_2026_04_11_13_52

1
·
9
·
Apr 2026
nlileCold13B4K

PE-13b-full

0
·
9
·
Nov 2023
chinna6ColdTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-hoarse_stalking_chicken

0
·
9
·
Apr 2025
LunzimaColdTools15B32K

NQLSG-Qwen2.5-14B-MegaFusion-v4

1
·
9
·
Feb 2025
clemColdTools2B32K

macron-style-qwen2.5-1.5B

2
·
9
·
Apr 2026
HCY123902ColdTools8B8K

llama-3-8b-inst-dpo-on-p-tw15-beta-1e-0

0
·
9
·
Apr 2026
HCY123902ColdTools8B8K

llama-3-8b-dpo-tw31-beta-1e-0

0
·
9
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-r-dpo-ultrafeedback-4xh200

0
·
9
·
Apr 2026
alwaysgoodColdTools4B32K

qwen3-it

0
·
9
·
Apr 2026
taharmasmaliyev07ColdTools3B32K

Qwen2.5-3B-Instruct-Perplexity-E3-BF16

0
·
9
·
Apr 2026
gregdlgColdTools3B32K

qwen-2.5-3b-r1-countdown

0
·
9
·
Apr 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SafeGrad_mathv00.06

0
·
9
·
Apr 2026
zhaohqColdTools3B32K

RLCR-math-3B

0
·
9
·
Apr 2026
g4meColdTools800M32K

QwenRolina3-06B-base-LR1e5-b32g2gc8-AR-Orig-order-batch

0
·
9
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_1000

0
·
9
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_1500

0
·
9
·
Apr 2026
vallerieeColdTools2B32K

Qwen3-1.7B-teacher-refusal-integer

0
·
9
·
Apr 2026
DCAgentColdTools8B32K

g1_weighted_31600

0
·
9
·
Apr 2026
artificialguybrColdTools8B8K

llama3-8b-redmond-code290k

5
·
9
·
Apr 2024
jackf857ColdTools8B32K

qwen3-8b-base-sft-hh-harmless-4xh200-batch-64

0
·
9
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-sft-hh-helpful-4xh200-batch-64

0
·
9
·
Apr 2026
QinghaoColdTools8B32K

Qwen3-8B-Base-masked-ghpo

0
·
9
·
Apr 2026
DCAgentColdTools8B32K

g1_timeout_e1_gpt_long_tacc

0
·
9
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_1000

0
·
9
·
Apr 2026
HCY123902ColdTools8B32K

qwen25_7b_base_hc_stss_n32_r1_sft

0
·
9
·
Apr 2026
arunasankCold9B16K

w0d7mdbd

0
·
9
·
Apr 2026
magnifiColdTools4B32K

magnifi-module-classifier-04-17-relabelled-upsampled

0
·
9
·
Apr 2026
divelabColdTools2B32K

DAPO_E2H-math-gaussian_0p5_0p5

0
·
9
·
Apr 2026
arunasankCold9B16K

25bcyw0v

0
·
9
·
Apr 2026
divelabColdTools2B32K

DAPO_E2H-gsm8k-gaussian_0p25_0p75

0
·
9
·
Apr 2026
DCAgentColdTools8B32K

e1_embedding_d1_original_sandboxes

0
·
9
·
Apr 2026
divelabColdTools2B32K

DAPO_E2H-countdown-gaussian_0p5_0p5

0
·
9
·
Apr 2026
MInAlAColdTools4B32K

Qwen3-4B-Instruct-2507-GRPO-merged

0
·
9
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-data_processing__Qwen3-8B

0
·
9
·
Apr 2026
alwaysgoodColdTools4B32K

QWEN3-4B-Base-stage2

0
·
9
·
Apr 2026
HKUST-DSAILColdTools8B32K

GraphMind-LLAMA-3.1-8B

1
·
9
·
Aug 2025
roonbugCold12B32KVision

rup0uu7o

0
·
9
·
May 2026