Models

15,019
jalenluorionWarm8B32K

Llama-3.1-8B_mathv1_grpof

0
·
2
·
Apr 2026
kmseongWarm7B4K

llama2_7b_SSFT_gsm8k_FT_lr3e-5

0
·
2
·
Apr 2026
itstechuseWarm7B4K

akeno-v7-epoch2-merged

0
·
2
·
Apr 2026
TMLR-Group-HFWarm8B32K

Co-rewarding-I-Qwen3-8B-Base-DAPO14k

1
·
2
·
Oct 2025
jmatni6Warm7B4K

triage_mistral_finetuned

0
·
2
·
Apr 2026
arkodaWarm8B32K

arkoda-7b-v5

0
·
2
·
Apr 2026
massines3aWarm8B32K

qwen-coder-7b-sap-harmful-code

0
·
2
·
Apr 2026
doupariWarm8B32K

llama3.1_8b_sft-solo-bos-attn-k28

0
·
2
·
Apr 2026
minchaoh2002Warm8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_24

0
·
2
·
Apr 2026
minchaoh2002Warm8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_36

0
·
2
·
Apr 2026
kmseongWarm8B32K

llama3.1_8b_instruct_math_ft_freeze_sn_lr1e-5_new

0
·
2
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat_gsm8k_SSFT_lr5e-5_lr3e-5

0
·
2
·
Apr 2026
jalenluorionWarm8B32K

Llama-3.1-8B_instruction

0
·
2
·
Apr 2026
kmseongWarm8B32K

llama3.1_8b_instruct_only_sn_tuned_lr3e-5

0
·
2
·
Apr 2026
kmseongWarm7B4K

llama2_7b_base_resta_lr3e-5_y0.3

0
·
2
·
Apr 2026
jalenluorionWarm7B4K

Mistral-7B-v0.3_mathv1

0
·
2
·
Apr 2026
kmseongWarm8B32K

llama31_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
2
·
Apr 2026
wisenut-nlp-teamWarm8B8K

wisenut-llama-3-8B-0.1-Instruct

0
·
1
wisenut-nlp-teamWarm8B8K

wisenut-llama-3-8B-0.5-Instruct

0
·
1
wisenut-nlp-teamWarm8B8K

wisenut-llama-3-8B-0.7-Instruct

0
·
1
WooWoofWarm8B8K

WooWoof_AI_Vision16Bit

1
·
1
expertaiWarm8B32K

SLIMER-LLaMA3

3
·
1
leekh7624Warm8B8K

Llama-3-Open-Ko-8B-Instruct-sample

0
·
1
mlfoundations-devWarm8B32K

oh-dcft-v3-sharegpt-format-sedrick

0
·
1
mlfoundations-devWarm8B32K

alpaca-inst-gen-4omini-resp-gen-gpt4o_shareGPT_format

0
·
1
DuolgoueSystemsWarm8B32K

BCCOHP_8B_instruct_Full

0
·
1
mlfoundations-devWarm8B32K

oh-dcft-v3-llama3.1-nemotron-70b_shareGPT_format

0
·
1
Lichang-ChenWarm8B32K

llama3-8b-point60-100

0
·
1
jonhparkWarm8B32K

Llama-3.1-8B-kowiki-alpaca-16bit

0
·
1
xammiWarm8B32K

MunicipalPredictionModel-Llama3

0
·
1
ckoozzzuWarm8B32K

d1

0
·
1
mlfoundations-devWarm8B32K

oh-dcft-v1.2_no-curation_gpt-4o-mini_wo_airoboros

0
·
1
mlfoundations-devWarm8B32K

OH_original_wo_camel_ai_math

0
·
1
mlfoundations-devWarm8B32K

OH_original_wo_metamath_40k

0
·
1
mlfoundations-devWarm8B32K

OH_original_wo_platypus

0
·
1
mlfoundations-devWarm8B32K

OH_original_wo_slimorca_550k

0
·
1
mlfoundations-devWarm8B32K

oh-dcft-v1-no-curation

0
·
1
mlfoundations-devWarm8B32K

oh_v1_w_v3_camel_math_gpt-4o-mini

0
·
1
GiKAGraphyWarm8B32K

ProductLlama-8B-Instruct

0
·
1
mlfoundations-devWarm8B32K

oh_v1-2_only_airoboros

0
·
1
mlfoundations-devWarm8B32K

oh-dcft-v1.2_no-curation_gpt-4o-mini_wo_alpaca

0
·
1
mlfoundations-devWarm8B32K

oh_v1-2_only_slim_orca

0
·
1