Models

21,083
how3751ColdTools8B32K

Optimizer_7B_1.0

0
·
54
·
Apr 2026
georgeiac00ColdTools500M32K

dpg-financial-sentiment-generator-f1-v2

0
·
54
·
Apr 2026
agarwalanu3103ColdTools2B32K

clarify-rl-grpo-qwen3-1-7b-run7

0
·
54
·
Apr 2026
M134praColdTools500M32K

neon-syndicate-qwen25-sft

0
·
54
·
Apr 2026
xw1234ganColdTools2B32K

cnk12_Main_fixed_SFTanchor_1_5B_step_9

0
·
54
·
Apr 2026
alphaXivColdTools500M32K

filter-0.5B

0
·
54
·
Apr 2026
smsk1999ColdTools8B32K

qwen3-8b-profiling-merged-v5

0
·
54
·
Apr 2026
BoyBarleyColdTools500M32K

BoyBarley-sparky

0
·
54
·
Apr 2026
kohantikaColdTools500M32K

smart-calendar-qwen-grpo

0
·
54
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-Arcee-Code-Math

0
·
54
·
Apr 2026
juzhariiColdTools2B32K

qwen3-1.7b-absa-tech

0
·
54
·
Apr 2026
theprintColdTools1B32K

Llama3.2-1B-ThinkMix-Full

0
·
54
·
Apr 2026
lichangh20ColdTools4B32K

qwen3-4b-instruct-sft-swegym-iter2

0
·
54
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_medmcqa_diversity

0
·
54
·
Apr 2026
standreyColdTools8B32K

listing-parser-llama31-8b-ft-v1

0
·
54
·
Apr 2026
Yash0407ColdTools500M32K

leetcoach-0.5b

0
·
54
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.35-20260430-143919

0
·
54
·
Apr 2026
kmseongCold7B4K

llama2-7b-safedelta-scale0.5

0
·
54
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.3

0
·
54
·
Apr 2026
Alelcv27ColdTools8B8K

Llama3.1-8B-Base-DataMerged

0
·
54
·
Apr 2026
MCult01ColdTools9B32K

glm-muse-feral-v5

0
·
54
·
Apr 2026
artemds45ColdTools500M32K

itmo-nlp-hw6-qwen2-5-0-5b-abliterated

0
·
54
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.5

0
·
54
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_medmcqa_gradient

0
·
54
·
Apr 2026
shubhamrgandhiColdTools8B32K

qwen3-8b-full-sft-prm-opus-distill-32k-lr5e6-flattened

0
·
54
·
Apr 2026
xuyeliu123ColdTools8B32K

swe-agent-lm-7b-swesmith

0
·
54
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-helpful-qt045-b0p8-20260429-085449

0
·
54
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-Resta-lr5e-5-scale0.5

0
·
54
·
Apr 2026
caveiroColdTools500M32K

qwen2.5-0.5b-abliterated-ru

0
·
54
·
Apr 2026
xuyeliu123ColdTools8B32K

swe-agent-lm-7b-num07-swesmith

0
·
54
·
Apr 2026
Jaskeerat23ColdTools3B32K

Fine-tuned-qwen

0
·
54
·
Apr 2026
DCAgentColdTools32B32K

g1_diverse_tezos_100k_32b

0
·
54
·
Apr 2026
akshay4ColdTools2B32K

sft-qwen3-1.7b-budget-router-smoke

0
·
54
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_Main_fixed_SFTanchor_3B_step_9

0
·
54
·
Apr 2026
Hello2pariksitColdTools8B32K

Qwen3-8B-neuron

0
·
54
·
Apr 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft1

0
·
54
·
Apr 2026
Lsd45ColdTools800M32K

vaccine-cold-chain-agent

0
·
54
·
Apr 2026
xw1234ganColdTools2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_8

0
·
54
·
Apr 2026
cjziemsColdTools3B32K

Llama3-3B-longitudinal

0
·
54
·
Apr 2026
KyleyeeColdTools2B32K

DrDPO_hh-seed2

0
·
54
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.35-20260428-045924

0
·
54
·
Apr 2026
greyiColdTools4B32K

effientReason-4b-sft-final

0
·
54
·
Apr 2026