Models

2,534
jalenluorionColdTools8B32K

Llama-3.1-8B_mathv1_grpo

0
·
2
·
Apr 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_20260429_160848_step580

0
·
2
·
May 2026
kmseongColdTools8B32K

llama3.1_8b_base_only_rsn_tuned_lr3e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama31_8b_instruct_math_ft_freeze_sn_lr1e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_rsn_lr3e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_after_SSFT_lr3e-5

0
·
2
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step50

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct-Safety-FT-lr3e-5

0
·
2
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_1.0-1.0_1.0

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_math

0
·
2
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step60

0
·
2
·
Apr 2026
WooYoungSeokColdTools8B32K

llama3.1-8b-IT-lora-sft

0
·
2
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_DPO_5e-06

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_math_ft_freeze_sn_lr1e-5_new

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_only_sn_tuned_lr3e-5

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct-MATH_FT_lr1e-5

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_math_mathv1_grpo

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama31_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
2
·
Apr 2026
skymizerColdTools8B32K

Llama3.1-8B-relu-stage-1-fineweb-edu-45B-4096

0
·
1
mlfoundations-devColdTools8B32K

oh_scale_x.5_compute_equal

0
·
1
mci29ColdTools8B32K

sn29_z2m4_ezwv

0
·
1
mci29ColdTools8B32K

sn29_w1m1_h9i7

0
·
1
mci29ColdTools8B32K

sn29_q1m3_d7a3

0
·
1
imdatta0ColdTools8B32K

llama_openthoughts_sorted_sft_nopack_splpad

0
·
1
henilp105ColdTools8B32K

InjecAgent-Llama-3.1-8B-Instruct-optim-2

0
·
1
·
Nov 2024
henilp105ColdTools8B32K

InjecAgent-Llama-3.1-8B-Instruct-optim-5

0
·
1
·
Nov 2024
henilp105ColdTools8B32K

InjecAgent-Llama-3.1-8B-Instruct-optim-15

0
·
1
·
Nov 2024
CharlesLiColdTools8B32K

llama_3_gsm8k_llama_2

0
·
1
·
Dec 2024
CharlesLiColdTools8B32K

llama_3_gsm8k_per_class_reflect

0
·
1
·
Dec 2024
CharlesLiColdTools8B32K

llama_3_unsafe_llama_2

0
·
1
·
Dec 2024
CharlesLiColdTools8B32K

llama_3_unsafe_per_class_reflect

0
·
1
·
Dec 2024
northColdTools8B32K

north_llama31_sft_frominstruct_200000_5000_exp8_1250

0
·
1
·
Oct 2024
northColdTools8B32K

north_llama31_enhancedNCC_testcorpus_lr1e5_8192_30000

0
·
1
·
May 2025
northColdTools8B32K

north_llama31_enhancedNCC_testcorpus_lr1e5_2048_10000

0
·
1
·
May 2025
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.35

0
·
1
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.32

0
·
1
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.24

0
·
1
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.17

0
·
1
·
Jan 2026
neosknightColdTools8B32K

Llama8B-CoT

0
·
1
·
Jan 2026
xashruColdTools8B32K

minerva_grpo_llama8b_500_490

0
·
1
·
Jan 2026
yoriisColdTools8B32K

llama-3.1-8B-Instruct-FT-0.3

0
·
1
·
Jan 2026