Models

12,216
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_rsn_lr3e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_after_SSFT_lr3e-5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-WaRP-SN-Tune-lr7e-5

0
·
2
·
Apr 2026
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1_grpo

0
·
2
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step50

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct-Safety-FT-lr3e-5

0
·
2
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_1.0-1.0_1.0

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_math

0
·
2
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step60

0
·
2
·
Apr 2026
WooYoungSeokColdTools8B32K

llama3.1-8b-IT-lora-sft

0
·
2
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_DPO_5e-06

0
·
2
·
Apr 2026
jalenluorionColdTools8B8K

Llama-3.1-8B_reasoning

0
·
2
·
Apr 2026
MGAMHCold1B2K

Miner2

0
·
2
·
Jun 2025
kmseongCold7B4K

llama2_7b_chat-gsm8k_FT_lr3e-5

0
·
2
·
Apr 2026
ParetoQaftColdTools1B32K

1B-Instruct-Tulu-full

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_math_ft_freeze_sn_lr1e-5_new

0
·
2
·
Apr 2026
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_resta_lr5e-5_y0.5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_gsm8k_SSFT_lr5e-5_lr3e-5

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_instruction

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_only_sn_tuned_lr5e-5

0
·
2
·
Apr 2026
kmseongColdTools8B8K

llama3_8b_instruct-MATH_FT_lr5e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_only_sn_tuned_lr3e-5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_base_resta_lr3e-5_y0.3

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_resta_lr5e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct-MATH_FT_lr1e-5

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_math_mathv1_grpo

0
·
2
·
Apr 2026
daniel1028Cold1B2K

tinyllama-1.1b-lora-risk-classifier-v1

1
·
2
·
Apr 2026
ikimyaiiCold7B4K

llama-7b-obs-cancel-block-40pct

0
·
2
·
May 2026
XmaptipCold1B2K

Oakley

0
·
2
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_resume_epoch10_20260429_004105_step232

0
·
2
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_resume_epoch10_20260429_004543_step290

0
·
2
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_resume_epoch10_20260429_004105_step290

0
·
2
·
May 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_resume_epoch10_20260429_160848_step232

0
·
2
·
May 2026
kmseongColdTools8B32K

llama31_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
2
·
Apr 2026
parkjoColdTools8B32K

Llama_3.1_8B_Instruct_grpo_ppl_adv_step580

0
·
2
·
Apr 2026
LexsiColdTools3B32K

llama32-3b-dolly-sft-drift

0
·
2
·
May 2026
osieosieCold7B4K

tulu-2-7b_mixed_tulu3-sft_aime_16_seed1_cutoff2025_original_160ex_10.0pct_e1_lr2e-05_bs64_linear

0
·
2
·
Jan 2026
sebastian328ColdTools70B32K

llama-3.3-70b-full-finetune-cot-distilled-sleeper-agent-short

0
·
2
·
Mar 2026
somukandulaColdTools1B32K

cx-filler-model

0
·
2
·
Apr 2026
jeongseokohColdTools8B32K

llama3.1_8b_sft_SPEED-24

0
·
2
·
Mar 2026