Models

10,914
MontalteColdTools4B32K

instruct_math_rl

0
·
6
·
Apr 2026
kairawalColdTools800M32K

Qwen3-0.6B-DA-SynthDolly-1A-E1

0
·
6
·
Apr 2026
DwthegreatCold4B4K

phi3-rubric-grader

0
·
6
·
Apr 2026
kairawalColdTools4B32K

Qwen3-4B-HI-SynthDolly-1A-E1

0
·
6
·
Apr 2026
MANOJHMANOJColdTools4B32K

fitsense-qwen3-4b-merged

0
·
6
·
Apr 2026
daman1209aroraColdTools2B32K

tailrl_1900_math12k

0
·
6
·
Apr 2026
kairawalColdTools3B32K

Llama-3.2-3B-Instruct-HI-SynthDolly-1A-E1

0
·
6
·
Apr 2026
HerrHrubyColdTools4B32K

meta_reasoning_v1_01_step200

0
·
6
·
Apr 2026
kairawalColdTools3B32K

Llama-3.2-3B-Instruct-ES-SynthDolly-1A-E1

0
·
6
·
Apr 2026
kairawalColdTools3B32K

Llama-3.2-3B-Instruct-HI-SynthDolly-1A-E3

0
·
6
·
Apr 2026
amitycoColdTools4B32K

matching-1.0-4b-sft

0
·
6
·
Apr 2026
NobsamuColdTools2B32K

qwen3-1.7b-backward

0
·
6
·
Apr 2026
LocalAI-ioColdTools800M32K

qwen3-0.6b-finetune-it

0
·
6
·
Apr 2026
brightonliuzZColdTools8B32K

qwen3-8b-go-v4

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-harmless-8xh200

0
·
6
·
Apr 2026
GenueAIColdTools600M32K

geode-beryl

0
·
6
·
Apr 2026
prakhar146ColdTools2B32K

financial-llm-cpu

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-epsilon-dpo-hh-helpful-8xh200

0
·
6
·
Apr 2026
DADA121ColdTools500M32K

sft-merged2

0
·
6
·
Apr 2026
forgedevworksColdTools8B32K

dreamrunner-command-8b

0
·
6
·
Apr 2026
vohonenColdTools4B32K

Qwen3-4B-Base-ftjob-25058cdbbe3e-merged

0
·
6
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_375-2

0
·
6
·
Apr 2026
Alkamal01ColdTools8B32K

oribai-14b-hausa-yoruba-v1

0
·
6
·
Apr 2026
wangzhangColdTools7B4K

Mistral-7B-Instruct-RR-Abliterated

1
·
6
·
Apr 2026
BoyBarleyColdTools500M32K

BoyBarley-v33

1
·
6
·
Apr 2026
ZENLLCColdTools4B32K

HUX-1

1
·
6
·
Apr 2026
Thiraput01ColdTools4B32K

PeaceKeeper-4B-V4

1
·
6
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-grpo-all

1
·
6
·
Apr 2026
ligeng-devColdTools8B32K

Q3-8B-131072-sft-8x-complete

0
·
6
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4B-refiner-rubric-rl-step50

0
·
6
·
Apr 2026
tzwilliam0ColdTools4B32K

qwen-dapo-17k-vs-4

0
·
6
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-margin-dpo-hh-helpful-4xh200-batch-64

0
·
6
·
Apr 2026
KA78Cold3B2K

zero-to-one-advisor-merged

0
·
6
·
Apr 2026
ReviewHubColdTools4B32K

qwen3-4b-it-2507-sft-2018-2022-rl-step-10

0
·
6
·
Apr 2026
Alelcv27ColdTools3B32K

Qwen2.5-3B-INST-Code

0
·
6
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_1000

0
·
6
·
Apr 2026
pltopsColdTools8B32K

qwen2_7B-ultrachatfeedback-wspo

0
·
6
·
Apr 2026
rbelanecColdTools1B32K

train_boolq_42_1776331558

0
·
6
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_4000

0
·
6
·
Apr 2026
laionColdTools8B32K

Sera-4.5A-Full-T1-v3-1000-axolotl__Qwen3-8B

0
·
6
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-helpful-4xh200-batch-64-20260417-212312

0
·
6
·
Apr 2026
RockTokenColdTools4B32K

qwen3_30b_a3b_to_4b_onpolicy_5k_src20k-25k

0
·
6
·
Apr 2026