Models

20,090
JRQiColdTools8B32K

seed0_sample5000_bmlama_Qwen-Qwen2.5-7B-Instruct_en-zh_1.0-1.0_1.0

0
·
2
·
Apr 2026
JameSandColdTools2B32K

qwen3-1.7b-base-adam-5e-6-bs128-kl0.0-global_step_200

0
·
2
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-epsilon-dpo-hh-helpful-8xh200

0
·
2
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-epsilon-dpo-hh-harmless-8xh200

0
·
2
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-beta-dpo-ultrafeedback-8xh200

0
·
2
·
Apr 2026
EnergyAIColdTools4B32K

qwen3-4b-agrpo-think-lr3e-6

0
·
2
·
Apr 2026
DADA121ColdTools500M32K

sft-merged1

0
·
2
·
Apr 2026
forgedevworksColdTools8B32K

dreamrunner-command-8b

0
·
2
·
Apr 2026
DCAgentColdTools8B32K

d1_original_top4_seq_glm47

0
·
2
·
Apr 2026
DCAgentColdTools8B32K

d1_constrain_top4_seq_glm47

0
·
2
·
Apr 2026
OzdowntheRColdTools800M32K

Qwen3-0.6B-SciGen-SLERP

0
·
2
·
Apr 2026
GenueAIColdTools3B32K

geode-onyx

1
·
2
·
Apr 2026
DCAgentColdTools8B32K

d1_trace_hints_top4_seq_glm47

0
·
2
·
Apr 2026
Rinaldo64ColdTools8B32K

Llama-3.1-8B-Lexi-Uncensored-V2

0
·
2
·
Apr 2026
ojaffeColdTools800M32K

20260411-190341-align-qwen-0d3d-2026-04-12-018-ob-correction

0
·
2
·
Apr 2026
Serkan007ColdTools8B32K

model-yedeklerim

0
·
2
·
Apr 2026
Himanshu1002ColdTools3B32K

thought-reasoning-model-v1

0
·
2
·
Apr 2026
EnergyAIColdTools4B32K

qwen3-4b-agrpo-nothink-lr3e-6

0
·
2
·
Apr 2026
ojaffeColdTools800M32K

20260411-190341-align-qwen-0d3d-2026-04-12-022-aggressive-ob-dpo

0
·
2
·
Apr 2026
amphoraColdTools8B32K

orpo-5e-8

0
·
2
·
Apr 2026
HCY123902ColdTools8B32K

qwen25_7b_base_hc_stss_n32_r1_dpo

0
·
2
·
Apr 2026
vohonenColdTools4B32K

Qwen3-4B-Base-ftjob-25058cdbbe3e-merged

0
·
2
·
Apr 2026
vrutkovsColdTools7B4K

Lusterka-7B-v0.3

0
·
2
·
Apr 2026
shajedurrashid87ColdTools8B32K

jarvis-2-0-8b

0
·
2
·
Apr 2026
sofinmoffinColdTools8B32K

TwinLlama-3.1-8B-DPO

0
·
2
·
Apr 2026
zTensorColdTools2B32K

Qwen2.5-Math-1.5B

0
·
2
·
Apr 2026
DCAgentColdTools8B32K

d1_mix_top4_seq_glm47

0
·
2
·
Apr 2026
LorenaYannnnnColdTools800M32K

bold_formatting-Qwen3-0.6B-OURS_self-seed_0

0
·
2
·
Apr 2026
shabieh2ColdTools70B8K

3370_0412

0
·
2
·
Apr 2026
cemrekucukgodeCold3B8K

gemma-2-2b-it-doktorsitesi

0
·
2
·
Apr 2026
myfiColdTools4B32K

parser_model_ner_4.10

1
·
2
·
Apr 2026
HachikiCold1B2K

alley-smp-merged

1
·
2
·
Apr 2026
eekayCold3B8K

gemma-2b-it-steer-elephant-numbers-ft

0
·
2
·
Jan 2026
eekayCold3B8K

gemma-2b-it-steer-eagle-numbers-ft

0
·
2
·
Jan 2026
UKPLabColdTools8B32K

SciRM-7B

3
·
2
·
Jan 2026
UKPLabColdTools8B32K

SciRM-Ref-7B

1
·
2
·
Jan 2026
mizzaayCold1B2K

8e5ae49f

0
·
2
·
Aug 2025
eekayCold3B8K

gemma-2b-it-steer-cat-numbers-ft

0
·
2
·
Sep 2025
fifrioColdTools8B32K

Qwen3-8B-slimllm-4bit-calibration-English-128samples

0
·
2
·
Dec 2025
vkaseraColdTools3B32K

v4_qwen-2.5-3b-r1-countdown-phil

0
·
2
·
Oct 2025
ahmedselhadyColdTools2B32K

Qwen2.5-1.5B-Instruct-8r-all-tmtm

0
·
2
·
Sep 2025
kairawalCold4B32KVision

Gemma-3-4B-IT-ES-SynthDolly-1A-E3

1
·
2
·
Apr 2026