Models

5,840
ligeng-devColdTools8B32K

tw-data-train_final_replaced_from_classified-fix-format-8node-resume

0
·
6
·
Apr 2026
rbelanecColdTools1B32K

train_qnli_42_1776331409

0
·
6
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-grpo-brit

0
·
6
·
Apr 2026
rbelanecColdTools1B32K

train_record_42_1776331412

0
·
6
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-grpo-aus

0
·
6
·
Apr 2026
AmuCold3B2K

orpo-phi2

0
·
6
·
Apr 2024
terasutColdTools500M32K

gkd-qwen-2.5-0.5b-base_v5_from1.5b_eff32

0
·
6
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_3500

0
·
6
·
Apr 2026
AgPerryColdTools15B32K

Qwen2.5-Coder-14B-Instruct-num11_v1-v2-v3-pairs-v3-triples

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64-20260417-233539

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-harmless-4xh200-batch-64-20260417-222337

0
·
6
·
Apr 2026
DivijColdTools3B32K

llama-3.2-3b-sft-llama-star

0
·
6
·
Apr 2026
rbelanecColdTools1B32K

train_cola_42_1776331560

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64-20260418-003215

0
·
6
·
Apr 2026
hector-grColdTools8B32K

RLCR-5x-priority-overconf-math

0
·
6
·
Apr 2026
AgPerryColdTools4B32K

SWE-Lego-Qwen3-4B-posttrain

0
·
6
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
6
·
Apr 2026
endishaiColdTools33B32K

qwen2.5-32b-lexenvs-grpo

0
·
6
·
Apr 2026
leonMWColdTools8B32K

DeepSeek-R1-Distill-Qwen-7B-GSPO-Basic

1
·
6
·
Aug 2025
W-61ColdTools7B4K

mistral-7b-base-epsilon-dpo-hh-helpful-4xh200-batch-64

0
·
6
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
6
·
Apr 2026
alwaysgoodColdTools4B32K

qwen3-st2

0
·
6
·
Apr 2026
KCZEROCold1B32K

gemma-3-1b-it_Math_SFT

0
·
6
·
Apr 2026
g4meColdTools800M32K

QwenRolina3-06B-base-LR1e5-b32g2gc8-AR-order-batch

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-cpo-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
6
·
Apr 2026
eileenkim999Cold1B32K

gemma-3-1b-it_Math_SFT

0
·
6
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_4500

0
·
6
·
Apr 2026
vallerieeColdTools2B32K

Qwen3-1.7B-student-refusal-integer-seqkd

0
·
6
·
Apr 2026
StephYangColdTools32B32K

dpsk_v3_2_cc_plus_t2

0
·
6
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_2000

0
·
6
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-brit

0
·
6
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-margin-dpo-hh-harmless-4xh200-batch-64

0
·
6
·
Apr 2026
tmr1q84ColdTools3B32K

SIMPLE-PDE-Qwen2.5-3B

0
·
6
·
Mar 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft-cv

0
·
6
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed2

0
·
6
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_2000

0
·
6
·
Apr 2026
DCAgentColdTools8B32K

g1_timeout_e1_gpt_long

0
·
6
·
Apr 2026
DCAgentColdTools32B32K

g1_weighted_31600_32B

0
·
6
·
Apr 2026
FardanColdTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-helpful-8xh200

0
·
6
·
Apr 2026
eekayCold3B8K

gemma-2b-it-dolphin-numbers-ft

0
·
6
·
Aug 2025
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-harmless-8xh200

0
·
6
·
Apr 2026