Models

5,770
HyeongwonColdTools4B32K

P2-split2_only_answer_Qwen3-4B-Base_0505-bs64-epoch6-lr1e5

0
·
133
·
May 2026
HyeongwonColdTools4B32K

P2-split3_only_answer_Qwen3-4B-Base_0505-bs64-epoch6-lr1e5

0
·
133
·
May 2026
1010happyColdTools2B32K

AmongUsModels

0
·
133
·
May 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.5

0
·
132
·
Apr 2026
DCAgentColdTools32B32K

g1_weighted_100k_32b_cont

0
·
132
·
Apr 2026
yemmygoldColdTools3B32K

Qwen2.5-3B-Instruct_Function_Calling_xLAM

0
·
132
·
Apr 2026
SantiagoCColdTools500M32K

palindrome-grpo

0
·
132
·
May 2026
HyeongwonColdTools4B32K

P2-split2_only_answer_Qwen3-4B-Base_0501-bs64-epoch6

0
·
132
·
May 2026
SantiagoCColdTools500M32K

palindrome-sft-model

0
·
132
·
May 2026
passing2961ColdTools8B32K

finch_8b_kto_held_out_expr_purpose_qwen_max16384_kto_5.0e-7_1.0_train42_cosine

0
·
132
·
May 2026
lewtunColdTools800M32K

qwen3-0.6b-capybara-sft

0
·
132
·
May 2026
CEIA-RLColdTools4B32K

energy-exp1-dpo-offline

0
·
132
·
May 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.11.2

0
·
132
·
Jun 2026
New
jackf857ColdTools8B32K

qwen3-8b-base-margin-dpo-hh-harmless-4xh200-batch-64-20260423-234249

0
·
131
·
Apr 2026
laionColdTools8B32K

sera-subset-mixed-3160-axolotl__Qwen3-8B-v8

0
·
131
·
Apr 2026
chochomarColdTools8B32K

Qwen2.5-7B-FFT-FullData-jsonl-sysp-updated

0
·
131
·
May 2026
Havoc999Cold1B2K

tiny-chatbot

0
·
131
·
Jun 2026
New
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.6-20260430-165125

0
·
130
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-helpful-qt045-b0p3-20260429-085449

0
·
130
·
Apr 2026
SantiagoCColdTools500M32K

palindrome-grpo-v4

0
·
130
·
May 2026
SantiagoCColdTools800M32K

palindrome-sft-v2-qwen3

0
·
130
·
May 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_3000

0
·
129
·
Apr 2026
laionColdTools8B32K

sera-subset-mixed-1000-axolotl__Qwen3-8B-v8

0
·
129
·
Apr 2026
harsha070ColdTools3B32K

expfinal-qwen-mbpp-s42-base

0
·
129
·
May 2026
g4meColdTools2B32K

QWiki-1.7B-base-LR1e5-b32g2gc8-order-batch-filtered

0
·
129
·
May 2026
jiayichengColdTools8B32K

mix760_3step_bc760

0
·
129
·
May 2026
SantiagoCColdTools800M32K

palindrome-sft-qwen3

0
·
129
·
May 2026
eventhorizon28ColdTools2B32K

cadforge-grpo-Qwen3-1.7B

0
·
128
·
Apr 2026
NeelectricColdTools8B32K

Qwen2.5-7B-Instruct_SFT_mathv00.01

0
·
128
·
Apr 2026
harsha070Cold4B4K

expfinal-phi-mbpp-s42-lambda-0p75

0
·
128
·
May 2026
NLP-Final-ProjectCold3B2K

phi-2-ipo

0
·
128
·
May 2026
wvnvwnColdTools7B4K

Mistral-7B-Instruct-v0.3-gsm8k-v2

0
·
128
·
May 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.5-s_star-1.0

0
·
127
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.45-20260427-221551

0
·
127
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p8-20260429-085449

0
·
127
·
Apr 2026
moos124ColdTools2B32K

qwen-2.5-1.5B-instruct-SDFT

0
·
127
·
May 2026
harsha070ColdTools3B32K

expfinal-qwen-mbpp-s42-lambda-0p20

0
·
127
·
May 2026
varshak1ColdTools8B32K

open_reward_agent_sft_lf

0
·
127
·
May 2026
AlepachColdTools8B32K

notHumpback-M1-Rw-F-8b

1
·
127
·
Apr 2025
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.5

0
·
126
·
Apr 2026
xuyeliu123ColdTools8B32K

swe-agent-lm-7b-num07-swesmith

0
·
126
·
Apr 2026
pratinavsethColdTools800M32K

cricket-captain-qwen3-06b-merged

0
·
126
·
Apr 2026