Models

15,503
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_7

0
·
6
·
Apr 2026
DCAgentColdTools8B32K

g1_timeout_e1_gpt_long

0
·
6
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-8-deberta-nli-reward

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-helpful-8xh200

0
·
6
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-6-deberta-nli-reward

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-ipo-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-harmless-8xh200

0
·
6
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_answer_variance_500_combined_openr1math

0
·
6
·
Apr 2026
dtsypColdTools8B32K

qwen2.5-7b-ablated-ru

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-slic-hf-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
6
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_format_500_combined_openr1math

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-r-dpo-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
6
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_proximity_500_combined_openr1math

0
·
6
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-adapters_swe__Qwen3-8B

0
·
6
·
Apr 2026
kikiyaaColdTools7B4K

Mistral-7B-dpo-full-tuned

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.6-4xh200-batch-64-20260422-051621

0
·
6
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-security__Qwen3-8B

0
·
6
·
Apr 2026
eshmoideasColdTools8B32K

Qwen2-Math

0
·
6
·
Apr 2026
LaoyujieColdTools8B32K

merged-qwen-ties

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star1.0-4xh200-batch-64-20260422-051621

0
·
6
·
Apr 2026
MCult01ColdTools9B32K

glm-muse-feral

0
·
6
·
Apr 2026
xw1234ganColdTools8B32K

Merging_Prob_Qwen2.5-7B-Instruct_MATH_lr1e-05_mb2_ga128_n2048_seed42

0
·
6
·
Apr 2026
mehuldamaniColdTools8B32K

bug_fixing_new-arl-add_multiply

0
·
6
·
Apr 2026
DCAgentColdTools8B32K

e1_askllm_d1_original_glm47

0
·
6
·
Apr 2026
LaoyujieColdTools8B32K

merged-qwen-slerp

0
·
6
·
Apr 2026
LumosJiangColdTools8B32K

Qwen3-8B-Base-SFT-AM-Thinking-v1-Distilled-Code-1800steps

0
·
6
·
Apr 2026
LumosJiangColdTools8B32K

Qwen3-8B-Base-SFT-AM-Thinking-v1-Distilled-Code-600steps

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.6-4xh200-batch-64-20260421-213851

0
·
6
·
Apr 2026
laionColdTools8B32K

nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps__Qwen3-8B

0
·
6
·
Apr 2026
unlearning-cleanslateColdTools8B32K

qwen3-8b-rmu-baseline

0
·
6
·
Apr 2026
Orion-zhenColdTools8B32K

Qwen2.5-7B-Gutenberg-KTO

5
·
6
·
Oct 2024
doupariColdTools8B8K

llama3.1_8b_sft-llopa-k24-no_system-cnndm-train.summary.q60000-llopa-k24-no_system

0
·
6
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-safedelta-scale0.8

0
·
6
·
May 2026
YBXLCold7B4K

meditron7b_combined_10epoch

0
·
6
·
Nov 2024
SutanshuRajColdTools8B32K

GoudERP

1
·
6
·
Apr 2026
fifrioColdTools8B32K

Qwen3-8B-tacq-4bit-calibration-Chinese-128samples

0
·
6
·
Dec 2025
fifrioColdTools8B32K

Qwen3-8B-tacq-4bit-calibration-Swahili-128samples

0
·
6
·
Dec 2025
chamber111ColdTools8B32K

VPPO-8B

2
·
6
·
Nov 2025
JungleGymColdTools8B32K

TimeLens-Qwen3-VL-8B-SFT

0
·
6
·
Feb 2026
BAAI-AgentsColdTools8B32K

EgoActor-8b-Qwen3VL

4
·
6
·
Oct 2025
HelloGYColdTools8B32K

Qwen_plus2_shot7_sft_fold0

0
·
6
·
May 2026
netcat420ColdTools8B32K

DEFUNCT-EXPERIMENT2_1

1
·
6
·
Jan 2025