Models

12,050
wvnvwnCold13B4K

llama-2-13b-chat-hf-gsm8k-rsn-tuned-lr5e-5

0
·
4
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-only-rsn-tuned-lr3e-5

0
·
4
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-safeinstr-0.05

0
·
4
·
Apr 2026
kmseongCold7B4K

llama-2-7b-chat-hf-only-sn-tuned-lr5e-5

0
·
4
·
May 2026
kmseongColdTools8B32K

llama-3.1-8B-gsm8k-rsn-tuned-lr5e-5

0
·
4
·
May 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-somfmerge

0
·
4
·
May 2026
kmseongCold7B4K

llama2_7b_chat-SSFT-MEDQA-FT-safety-mix-0.1-lr3e-5

0
·
4
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_MATH-FT-resta-gamma0.3-lr5e-5

0
·
4
·
May 2026
doupariColdTools8B32K

llama3.1_8b_sft-solo-attn-v2-k28

0
·
4
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_MATH-FT-lr3e-5

0
·
4
·
May 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-SafeInstr-lr3e-5-lr5e-5-0.05

0
·
4
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_only_sn_tuned_lr3e-5

0
·
4
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base-SSFT-start-WaRP-original-space-gsm8k-FT-lr3e-5

0
·
4
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_resta_lr5e-5_y0.3

0
·
4
·
Apr 2026
mizzaayCold1B2K

9e83f8d6

0
·
4
·
Aug 2025
shabieh2ColdTools70B8K

0416_retrain_merged

0
·
4
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-safegrad

0
·
4
·
May 2026
abdulhafisColdTools1B32K

dagbani-llama32-lora-finetuned

0
·
4
·
May 2026
GrailDFIRColdTools70B32K

ldfirm-llama3.3-70b-v3corpus-sft

0
·
4
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-aaq

0
·
4
·
May 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.03

0
·
4
·
Jan 2026
mizzaayCold1B2K

bcbc0b8b

0
·
4
·
Aug 2025
kmseongCold7B4K

llama-2-7b-chat-hf-only-rsn-tuned-lr5e-5

0
·
4
·
May 2026
AlepachColdTools8B32K

notHumpback-M1-Rw-F-8b

1
·
4
·
Apr 2025
ikimyaiiCold7B4K

llama-7b-sparsegpt-50pct

0
·
4
·
May 2026
ikimyaiiCold7B4K

llama-7b-awp-40pct

0
·
4
·
May 2026
ikimyaiiCold7B4K

llama-7b-awp-50pct

0
·
4
·
May 2026
ikimyaiiCold7B4K

llama-7b-awp-80pct

0
·
4
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_resume_epoch10_20260429_004543_step232

0
·
4
·
May 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_rollout_8_20260502_233259_step580

0
·
4
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-safeinstr-lr1e-5-0.05

0
·
4
·
May 2026
Rapidd12ColdTools8B8K

clon-ismael-16bit

0
·
4
·
May 2026
zeras141aCold1B2K

628801c9

0
·
4
·
Aug 2025
zeras141aCold1B2K

f5bd0cc4

0
·
4
·
Aug 2025
OccultAIColdTools8B32K

Adversary-8B-v1b

0
·
4
·
May 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_kl_0.001_20260516_140637_step290

0
·
4
·
May 2026
mizzaayCold1B2K

aecc4d92

0
·
4
·
Aug 2025
sandbox-aiColdTools70B32K

Llama-3.1-Tango-70b

8
·
3
NeoZ123ColdTools8B32K

LongReward-llama3.1-8b-SFT

1
·
3
·
Oct 2024
clembench-playpenColdTools70B32K

llama-3.1-70B-Instruct_playpen_SFT_DFINAL_0.6K-steps_merged_fp16

0
·
3
jiinkingColdTools1B32K

5_bitwise_MQA_llama_model

0
·
3
ikenna1234ColdTools1B32K

llama_3.2_1b_rlhf

0
·
3