Models

15,608
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.43

0
·
76
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.5-s_star-0.4

0
·
76
·
Apr 2026
charlie-liColdTools8B32K

Qwen3-8B-ScaleSWE-Distilled-Full-SFT

0
·
76
·
Apr 2026
W-61ColdTools8B8K

llama3-8b-base-new-method-s_star0.6-20260425-180936

0
·
76
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4

0
·
76
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-cpo-ultrafeedback-4xH200-batch-128-rerun

0
·
76
·
Apr 2026
ahelkadyyColdTools8B32K

Qwen3-8B-UnBias-Plus-SFT-Instruct-v2

0
·
76
·
May 2026
fspoeColdTools8B8K

20251103_1548

0
·
76
·
Nov 2025
KISTI-KONIColdTools8B32K

KONI-Llama3.1-8B-R-20250831

2
·
76
·
Aug 2025
dipta007ColdTools8B32K

decomposeRL-7b

0
·
76
·
May 2026
ahmad200ColdTools8B8K

arabic-requirements-base-model

0
·
76
·
Jun 2026
KuldeepVyttahColdTools8B32K

qwen-soa-merged-model

0
·
76
·
Jun 2026
shantanu61000ColdTools8B8K

sfr-copernicus-v1

0
·
76
·
Jun 2026
crestf411ColdTools8B8K

L3-8B-daybreak-stheno-v3.1

1
·
75
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e3-max-alpha0_25

0
·
75
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-SLERP-Math-Code

0
·
75
·
Apr 2026
MCult01ColdTools9B32K

glm-muse-clean-v1

0
·
75
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.35-20260428-045924

0
·
75
·
Apr 2026
Ines2RColdTools7B4K

mistral-7b-backdoored

0
·
75
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.4

0
·
75
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.01

0
·
75
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.5-s_star-0.6

0
·
75
·
Apr 2026
joynnayvedyaColdTools8B32K

disaster-response-trained

0
·
75
·
Apr 2026
DocTron-HubColdTools8B32K

VinciCoder-8B-SFT

0
·
75
·
Nov 2025
SiyucColdTools8B32K

INFUSER-Qwen3-8B-base

0
·
75
·
Jun 2026
karrelinColdTools8B8K

L3Mix

1
·
74
ccui46ColdTools9B32K

glmz1_9b_hazardworld_per_chunk_act_glm_2000

0
·
74
·
Mar 2026
laionColdTools8B32K

Sera-4.6-Lite-T2-v4-316-axolotl__Qwen3-8B-v3

0
·
74
·
Apr 2026
lebirajaColdTools8B32K

customer-support-grpo

0
·
74
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p05-20260429-085449

0
·
74
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-kto-ultrafeedback-4xh200-batch-128-20260427-194056

0
·
74
·
Apr 2026
lebirajaColdTools8B32K

customer-support-grpo-v2

0
·
74
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.5-s_star-0.6

0
·
74
·
Apr 2026
felixhrdynColdTools8B32K

Qwen-3-8B-DGX-UG-Merged

0
·
74
·
May 2026
jaredfernColdTools8B32K

canoe-modified-2ep

0
·
74
·
May 2026
usr256864Cold7B4K

ee_gol_grp_f1_form_over

0
·
74
·
May 2026
didula-wso2ColdTools8B32K

qwen8b_teacher_injection_sft_16bit_vllm

0
·
74
·
May 2026
Anmolsaini111ColdTools7B4K

mistral7b-cyber-merged

0
·
74
·
May 2026
violetxiColdTools8B32K

sft_tir_1e-5_b32_warmup0_epoch0_checkpoint5586

0
·
73
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-helpful-4xh200-batch-64-20260424-013732

1
·
73
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-beta-dpo-ultrafeedback-4xh200-batch-128-20260423-040315

0
·
73
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-5

0
·
73
·
Apr 2026