Models

4,756
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint375

0
·
3
·
Apr 2026
Radiant28ColdTools2B32K

evolai-mamba2-0047b

0
·
3
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_sn_tuned_math_ft_lr5e-5

0
·
3
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_rsn_tuned_math_ft_lr5e-5

0
·
3
·
Apr 2026
vingale803ColdTools3B32K

tofu_Llama-3.2-3B-Instruct_forget01_NPO_beta1.0_lr1e-5

0
·
3
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint300

0
·
3
·
Apr 2026
sathiiiiiCold3B8K

polyalign-gemma2-2b-en-dist-sft

0
·
3
·
Apr 2026
wndussCold3B8K

fintech_gemma_2b

0
·
3
·
Apr 2026
ishikaaColdTools3B32K

acquisition_qwen3bins_numina_confidence

0
·
3
·
Apr 2026
wndussCold3B8K

gemma_2b_it_fintech

0
·
3
·
Mar 2026
jaemin01Cold3B8K

fintech_gemma_2b

0
·
3
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_step580

0
·
3
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_20260429_145817_step580

0
·
3
·
May 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-SparseGPT_unstruct_0.5_bs128_damp0.01

0
·
3
·
Apr 2026
kmseongColdTools3B32K

llama-3.2-3b-instruct-only-sn-tuned-lr5e-5

0
·
3
·
May 2026
kyuksonCold3B8K

fintech_gemma_2b

0
·
3
·
Apr 2026
JameSandColdTools2B32K

qwen3-1.7b-base-sgd-1e-2-global_step_200

0
·
3
·
Jan 2026
SCL2025ColdTools3B32K

KG-R1-CWQ-hit1-no-turn-advantage

0
·
3
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-CWQ-no-retrieval-reward

0
·
3
·
Apr 2026
rafacaliforniaColdTools3B32K

qwen2.5-3b-avap-v3c

0
·
3
·
Apr 2026
dmusinguColdTools2B32K

Qwen3-VL-2B-RRG-SFT

0
·
3
·
Mar 2026
gradguyColdTools2B32K

qwen-2b-chat-finetune

0
·
3
·
Nov 2025
quanhmCold3B2K

phi2-docstring-model

0
·
3
·
May 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_MATH_lr5e-5

0
·
3
·
May 2026
kmseongColdTools3B32K

llama-3.2-3b-instruct-only-rsn-tuned-lr5e-5

0
·
3
·
May 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_only_rsn_tuned_lr5e-5

0
·
3
·
Apr 2026
shrangoColdTools2B32K

lorem_advshape_qwen3-1.7b-base

0
·
3
·
Apr 2026
ahmedheaklColdTools2B32K

opsd_2b_lora_2k

0
·
3
·
May 2026
SCL2025ColdTools3B32K

KG-R1-CWQ-no-turn-reward

0
·
3
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_Use_KL_0.001_step580

0
·
3
·
Apr 2026
sohaibbnk271ColdTools3B32K

qwen3b-full

0
·
3
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_20260502_233833_step580

0
·
3
·
May 2026
usr256864ColdTools2B32K

qw3vl2b_evq_grp

0
·
3
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260501_120104_step580

0
·
3
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260501_115927_step580

0
·
3
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_resume_epoch10_20260429_004105_step232

0
·
3
·
May 2026
CL-From-NothingColdTools2B32K

Qwen3-1.7B-GRPO-Minesweeper-MixedSFT-Thinking-epoch3

0
·
3
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_resume_epoch10_20260429_004543_step290

0
·
3
·
May 2026
grafColdTools2B32K

math_m32-1b-3d7129ad-not_easy_1e-4_200

0
·
3
·
Apr 2026
Abner0803ColdTools2B32K

Qwen3-1.7B-icl-20shot-compress_doc

0
·
3
·
May 2026
grafColdTools2B32K

math_btoracle-1b-0609ce76-not_easy_1e-4_200

0
·
3
·
Apr 2026
Abner0803ColdTools2B32K

Qwen3-1.7B-icl-3shot-dpo-replace_copy

0
·
3
·
May 2026