Models

3,660
smi-robustness-bbibbiColdTools4B32K

z0406_rt_ordinary_RT_quirk_1_lr5e-5

0
·
3
·
Apr 2026
MontalteColdTools4B32K

instruct_code_rl

0
·
3
·
Apr 2026
myfiColdTools4B32K

parser_model_ner_4.4

0
·
3
·
Apr 2026
DwthegreatCold4B4K

phi3-rubric-grader

0
·
3
·
Apr 2026
kairawalColdTools4B32K

Qwen3-4B-EL-SynthDolly-1A-E3

0
·
3
·
Apr 2026
HerrHrubyColdTools4B32K

meta_reasoning_v1_01_step200

0
·
3
·
Apr 2026
EnergyAIColdTools4B32K

qwen3-4b-agrpo-think-lr3e-6

0
·
3
·
Apr 2026
myfiColdTools4B32K

parser_model_ner_4.10

1
·
3
·
Apr 2026
dinobbyColdTools4B32K

Qwen3-4B-Instruct-2507-Cog

0
·
3
·
Mar 2026
pettertonarCold4B32KVision

google-gemma-4b-relevance-v1

1
·
3
·
Mar 2025
longtermriskColdTools4B32K

Qwen3-4B-ftjob-60507de3e958

0
·
3
·
Apr 2026
longtermriskColdTools4B32K

Qwen3-4B-Instruct-2507-ftjob-35d4281f0d6c

0
·
3
·
Apr 2026
alwaysgoodColdTools4B32K

qwen3-st2

0
·
3
·
Apr 2026
ertghiu256ColdTools4B32K

Qwen3-4b-2507-Thinking-math-and-code

1
·
3
·
Oct 2025
karthiklnagar16ColdTools4B32K

grpo-Qwen-4B_16bit

0
·
3
·
Apr 2026
pkupieCold4B32KVision

gemma-3-4b-mn-cpt

0
·
3
·
Apr 2026
vlx1ColdTools4B32K

Qwen3-4B-Instruct-2507-heretic

0
·
3
·
Apr 2026
pkupieCold4B32KVision

gemma-3-4b-kk-cpt

0
·
3
·
Apr 2026
longtermriskColdTools4B32K

Qwen3-4B-ftjob-3a8dc7a54735

0
·
3
·
Apr 2026
myfiColdTools4B32K

parser_model_ner_4.13_ep4

0
·
3
·
Apr 2026
pkupieCold4B32KVision

gemma-3-4b-bo-cpt

0
·
3
·
Apr 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft-cv2

0
·
3
·
Apr 2026
zero9techColdTools4B32K

Qwen3-4B-Data-Science-Insight-16.5K

0
·
3
·
Apr 2026
AgentCPTColdTools4B32K

Qwen3-4B_thinking_agent_sft_nemotron_tool_calling_v2_lr1e-5_epoch_1_ctx_16384_bs_256

0
·
3
·
Jan 2026
longtermriskColdTools4B32K

Qwen3-4B-ftjob-5d8108edb49a

0
·
3
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4b-refiner-gpt54-rubric-v3-2-rl-lr5e-6-step50

0
·
3
·
Apr 2026
CohenQuColdTools4B32K

Instruct-POPE-iter1-step280-POPE-hard-first_guide-no_guide-iter2

0
·
3
·
Nov 2025
Johnny1024ColdTools4B32K

bs16-k20-lr5e-7-ema0-eopd0.8-qwen3-4b-think-mmlu_pro_train10k_bottom20-s150

0
·
3
·
Apr 2026
tzwilliam0ColdTools4B32K

qwen-dapo-17k-vr

0
·
3
·
Apr 2026
nthakurColdTools4B32K

qwen3-4b-grpo-modified-5-docs-only-odyssey-step-135

0
·
3
·
Apr 2026
PJMixers-DevCold4B32KVision

gemma-3-4b-pt-InitializedEmbeds

0
·
3
·
Jun 2025
JackHsiehColdTools4B32K

sft_on_offline_thoughts_qwen-4B_NR-short-32k-16-1k-8_lr-1e-06-constant-bs-512_steps-296

0
·
3
·
Apr 2026
aarifO1Cold4B32KVision

gemma-3-4b-it-128k-presls

0
·
3
·
Apr 2026
JRQiCold4B32KVision

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-fa_DPO_5e-06

0
·
3
·
Apr 2026
tnkchasemeColdTools4B32K

unsloth_Qwen3-VL-4B-ToLatex

0
·
3
·
Apr 2026
Johnny1024ColdTools4B32K

Edu-OPCD-train16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-edu_merged_insensitive20

0
·
3
·
Apr 2026
jordanpainterCold4B32KVision

diallm-gemma-sft-aus

0
·
3
·
Mar 2026
agurungCold4B32KVision

colar-gemma-3-4b-ff-sft

0
·
3
·
Apr 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-GA-SynthDolly-1A-E3

0
·
3
·
Apr 2026
AbdineColdTools4B32K

qwen3-4b-medrect-assessor

0
·
3
·
Apr 2026
charlie-liColdTools4B32K

Qwen3-4B-Instruct-2507-ScaleSWE-Distilled-Epoch1

0
·
3
·
May 2026
charlie-liColdTools4B32K

Qwen3-4B-Instruct-2507-ScaleSWE-Distilled-Epoch3

0
·
3
·
May 2026