Models

41,328
RJTPPColdTools8B32K

scot0402s-deepseek-llama-8b-full

0
·
52
·
Apr 2026
RJTPPColdTools8B32K

scot0402s-deepseek-llama-8b-REF-full

0
·
52
·
Apr 2026
kmseongColdTools3B32K

llama3.2_3b_new_SSFT_lr3e-5_gsm8k_ft_full_params_lr3e-5

0
·
52
·
Apr 2026
CyrusCheungkfColdTools3B32K

git-commit-3B

2
·
52
·
Apr 2025
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-helpful-4xh200-batch-64-20260424-013732

1
·
52
·
Apr 2026
inclusionAIColdTools4B32K

DR-Venus-4B-SFT

7
·
52
·
Apr 2026
pvs333ColdTools2B32K

supergames-grpo

1
·
52
·
Apr 2026
shabieh2ColdTools70B8K

3370_fs_260410_system_merged

0
·
52
·
Apr 2026
laionColdTools8B32K

Sera-4.6-Lite-T2-v4-1000-axolotl__Qwen3-8B

0
·
52
·
Apr 2026
agarwalanu3103ColdTools800M32K

clarify-rl-grpo-qwen3-0-6b

0
·
52
·
Apr 2026
AniketAslaColdTools500M32K

debatefloor-grpo-qwen2.5-0.5b-instruct

0
·
52
·
Apr 2026
grizzfuColdTools24B32K

XortronCriminalComputingConfig

0
·
52
·
Apr 2026
DCAgentColdTools8B32K

g1_weighted_31600_cap10_8b

0
·
52
·
Apr 2026
kendrickfffColdTools2B32K

Qwen2.5-1.5B-Indonesian-Assistant-GRPO

0
·
52
·
Apr 2026
Pritam357ColdTools3B32K

styl-qwen2.5-3b-indian-fashion-merged

0
·
52
·
Apr 2026
georgeiac00ColdTools500M32K

dpg-financial-sentiment-generator-ce-v2

0
·
52
·
Apr 2026
skylenage-aiColdTools4B32K

GPRM-4B

0
·
52
·
Apr 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SafeGrad_mathv00.09

0
·
52
·
Apr 2026
Bialy17ColdTools8B32K

qwen-finetuned-Reasoning-Socratic-QandA

0
·
52
·
Apr 2026
dipshaColdTools2B32K

recruiter-grpo-phaseb

0
·
52
·
Apr 2026
DCAgentColdTools32B32K

g1_clean_hybrid_plus_32b

0
·
52
·
Apr 2026
DCAgentColdTools8B32K

g1_diverse_tezos_100k_8b

0
·
52
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-Arcee-Math-Code

0
·
52
·
Apr 2026
xw1234ganColdTools2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_1

0
·
52
·
Apr 2026
Sourav0511ColdTools8B8K

loan-underwriting-merged-v2

0
·
52
·
Apr 2026
rohitcraftsytColdTools2B32K

soc-grpo-tier1

0
·
52
·
Apr 2026
shubhamrgandhiColdTools8B32K

qwen3-8b-full-sft-prm-opus-distill-32k-lr5e6-multiturn

0
·
52
·
Apr 2026
smsk1999ColdTools8B32K

qwen25-7b-nps-agent-merged-v2

0
·
52
·
Apr 2026
sithum8363ColdTools500M32K

Architect_Assistant_Full

0
·
52
·
Apr 2026
3ticColdTools2B32K

Orion-Qwen3-1.7B-CPT-v2604

0
·
52
·
Apr 2026
lichangh20ColdTools4B32K

qwen3-4b-instruct-sft-swegym-iter1

0
·
52
·
Apr 2026
sreenathmmenonColdTools800M32K

asha-sahayak-grpo

0
·
52
·
Apr 2026
Dar3devilColdTools800M32K

incident-commander-qwen3-0.6b-grpo

0
·
52
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-margin-dpo-hh-harmless-4xh200-batch-64-20260423-234249

0
·
52
·
Apr 2026
Kanan2005ColdTools2B32K

clarify-rl-grpo-qwen3-1-7b-run6

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_Main_fixed_SFTanchor_3B_step_2

0
·
52
·
Apr 2026
xw1234ganColdTools2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_6

0
·
52
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64-20260424-040415

0
·
52
·
Apr 2026
iproskurinaColdTools500M32K

qwen-hf-iter-np-iter1

0
·
52
·
Apr 2026
abhi14ColdTools2B32K

test-grpo-delete-me

0
·
52
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-vanilla-nemotron-math-high.math.q60000-vanilla

0
·
52
·
Apr 2026
ZhaziraNZACold1B2K

tinyllama-chat-finetune

0
·
52
·
Apr 2026