Models

10,985
jekunzCold1B32K

Gemma-3-1B-pt-sv-CPT-plus-IR-sv-SmolTalk

0
·
4
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-sv-SmolTalk

0
·
4
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint325

0
·
4
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint300

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-cpo-ultrafeedback-8xh200

0
·
4
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_numina_confidence

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-ind

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-gspo-all

0
·
4
·
Apr 2026
seopboColdTools2B32K

sft-qwen2.5-1.5b

0
·
4
·
Apr 2026
zero9techColdTools8B32K

Qwen3-8B-Data-Science-Insight-16.5K

0
·
4
·
Apr 2026
faced65r64ColdTools8B32K

bullshit-7b-v6

0
·
4
·
Apr 2026
rod123ColdTools500M32K

QuantumCoder-0.5B-v2

0
·
4
·
Apr 2026
R0mAIColdTools4B32K

reliquary-math

0
·
4
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_proximity_500_combined_openr1math

0
·
4
·
Apr 2026
kikiyaaColdTools7B4K

Mistral-7B-dpo-full-tuned

0
·
4
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-system_administration__Qwen3-8B

0
·
4
·
Apr 2026
xw1234ganColdTools2B32K

GRPO_KL_Qwen2.5-1.5B-Instruct_MATH_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0
·
4
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_5-2

0
·
4
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_25-2

0
·
4
·
Apr 2026
seopboColdTools2B32K

zerorlvrmath-qwen2.5-1.5b

0
·
4
·
Apr 2026
DCAgentColdTools8B32K

g1_original_1k_8b

0
·
4
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-file_operations__Qwen3-8B

0
·
4
·
Apr 2026
g-assismoraesColdTools4B32K

Qwen3-4B-base-pira-ep3-qairm-ptbr

0
·
4
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_resta_0.3_lr5e-5

0
·
4
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-security__Qwen3-8B

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-orpo-ultrafeedback-8xh200

0
·
4
·
Apr 2026
Ricardo-HColdTools8B32K

ws-wm-0416-step-140

0
·
4
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step2700__Qwen3-32B

0
·
4
·
May 2026
laionColdTools8B32K

nemotron-terminal-software_engineering__Qwen3-8B

0
·
4
·
Apr 2026
seopboColdTools2B32K

rlvrif-qwen2.5-1.5b

0
·
4
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4b-refiner-gpt54-rubric-v3-2-rl-lr5e-6-step100

0
·
4
·
Apr 2026
ligeng-devColdTools8B32K

tw-data-train_final_v2_nb2_mt8192_replaced_fix-8node-resume

0
·
4
·
Apr 2026
psh3333ColdTools3B32K

llama-3.2-3b-grpo-merged

0
·
4
·
Apr 2026
SAIJO1233Cold1B32K

Gemma3-1b-SFT_Teached

0
·
4
·
Apr 2026
DADA121ColdTools500M32K

qwen2.5-0.5b-sft-new

0
·
4
·
Apr 2026
laionColdTools32B32K

nemotron-terminal-corpus-unified-316__Qwen3-32B

0
·
4
·
Apr 2026
vazievrColdTools32B32K

MetalGPT-1

0
·
4
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_material_bottom20_nogap-maxsteps150

0
·
4
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_1875-2

0
·
4
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint375

0
·
4
·
Apr 2026
Hodfa71ColdTools8B8K

llama-8b-nb-delta-dpo

0
·
4
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-cot-control-r96-seed100-merged

0
·
4
·
Apr 2026