Models

10,985
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_3125-2

0
·
4
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint350

0
·
4
·
Apr 2026
xw1234ganColdTools8B32K

Merging_Prob_Qwen2.5-7B-Instruct_MATH_lr1e-05_mb2_ga128_n2048_seed42

0
·
4
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint300

0
·
4
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-1e5

0
·
4
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4b-refiner-gpt54-rubric-v3-2-rl-lr5e-6-step50

0
·
4
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_3

0
·
4
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint375

0
·
4
·
Apr 2026
eekayCold3B8K

gemma-2b-it-noised-np0.2-emb

0
·
4
·
Apr 2026
Radiant28ColdTools2B32K

evolai-mamba2-0047b

0
·
4
·
Apr 2026
SCL2025ColdTools8B32K

KG-R1-CWQ-7B

0
·
4
·
Apr 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_bio-qwen3-4b-think-2507-r6k100

0
·
4
·
Apr 2026
JiajunruanCold7B4K

Minmax_MUSE-News

0
·
4
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-lr5e-5

0
·
4
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.85-4xh200-batch-64-20260421-213851

0
·
4
·
Apr 2026
ReginaNasyrovaColdTools4B32K

4B-Instruct-STE

0
·
4
·
Apr 2026
ikkirenColdTools2B32K

qwen-2.5-1.5b-instruct-ru-lora-r32-compose-train-mera-16k

0
·
4
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-SSFT-lr3e-5

0
·
4
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-resta

0
·
4
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_mathv1_grpo

0
·
4
·
Apr 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_chem-qwen3-4b-think-2507-r6k100

0
·
4
·
Apr 2026
reachnaveenCold1B2K

tinyllama-alpaca-lora

0
·
4
·
Apr 2026
Johnny1024ColdTools4B32K

TTRL-essay-TTRL-Len-8k-grpo-024343

0
·
4
·
Apr 2026
rghosh8ColdTools2B32K

arc-grpo-deepseek-R1-distill-qwen-1.5b-rajat-seed-42-G-16-merged

0
·
4
·
Apr 2026
Ricardo-HColdTools8B32K

ws-wm-0416-step-60

0
·
4
·
Apr 2026
DQN-LabsColdTools4B32K

dqncode2-preview

0
·
4
·
Apr 2026
jsilverbergColdTools2B32K

Qwen3-1.7B-Wordle-SFT

0
·
4
·
Apr 2026
riri71ColdTools3B32K

medmcqa-Qwen2.5-3B-finetuned

0
·
4
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr5e-5-gsm8k-lr5e-5

0
·
4
·
Apr 2026
rghosh8ColdTools2B32K

deepseek-r1-distill-qwen-1.5b-opencoder-educational-instruct-seed-42-G-4-merged

0
·
4
·
Apr 2026
LiLinaamariColdTools8B8K

Llama3-OpenBioLLM-8B

0
·
4
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_step580

0
·
4
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_20260429_145817_step580

0
·
4
·
May 2026
modrillColdTools4B32K

math_think_X_qwen3_4b_base_sft

0
·
4
·
Apr 2026
DigitalPixieColdTools500M32K

qwen-sft-notification

0
·
4
·
Apr 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.6-Qwen3-0.6B-16bit

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-s_star0.85-4xh200-batch-64-20260421-233802

0
·
4
·
Apr 2026
Johnny1024ColdTools4B32K

ttrl-mmlu_pro-qwen3-4b-think-2507-TTRL-Len-8k-grpo-232417

0
·
4
·
Apr 2026
Soea511ColdTools2B32K

Godot-Native-AI-Brain

0
·
4
·
May 2026
rghosh8ColdTools2B32K

deepseek-r1-distill-qwen-1.5b-opencoder-educational-instruct-seed-3407-G-8_merged

0
·
4
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base-WaRP-safety-basis-gsm8k-FT-lr3e-5

0
·
4
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-solo-attn-v2-k24-no_system

0
·
4
·
Apr 2026