Models

39,808
mlfoundations-devWarm8B32K

mlfoundations-dev_stackoverflow_375000_samples

0
·
1
joyheyueyaWarm8B32K

0128teacher_checkpoint_0

0
·
1
joyheyueyaWarm8B32K

0128student_checkpoint_0

0
·
1
clembench-playpenWarm8B32K

llama-SFT-base_merged_fp16_D90053_copy_32GB

0
·
1
Shaleen123Warm8B32K

llama-3.1-8b-reasoning

2
·
1
mci29Warm8B32K

sn29_s1m2_dfpb

0
·
1
mci29Warm8B32K

sn29_x1m6_etuc

0
·
1
mci29Warm8B32K

sn29_q1m3_d7a3

0
·
1
mci29Warm8B32K

sn29_x1m4_ghvn

0
·
1
thejaminatorWarm8B32K

lora_9feb_llama8b_deepseek_backdoor

0
·
1
Chang-HooWarm8B8K

llama3-alpaca-tuned-and-merged

0
·
1
mlfoundations-devWarm8B32K

Bespoke-Stratos-17k-v3

1
·
1
mlfoundations-devWarm8B32K

math-stratos-verified-scaled-0.25

1
·
1
mlfoundations-devWarm8B32K

Bespoke-Stratos-17k

0
·
1
mlfoundations-devWarm8B32K

Bespoke-Stratos-17k-v2

0
·
1
mlfoundations-devWarm8B32K

Bespoke-Stratos-17k-v4

0
·
1
mlfoundations-devWarm8B32K

qwen_7b_instruct_extra_verified

0
·
1
mlfoundations-devWarm8B32K

qwen_7b_instruct_extra_unverified

0
·
1
mlfoundations-devWarm8B32K

stratos_new_verified_mix_sharegptformat_4nodes

0
·
1
burgasdotproWarm8B32K

bgGPT-DeepSeek-R1-Distill-Qwen-7B

0
·
1
mlfoundations-devWarm8B32K

stratos-unverified-mix-scaled-0.125

0
·
1
mlfoundations-devWarm8B32K

math-stratos-unverified-scaled-0.25

0
·
1
mlfoundations-devWarm8B32K

mlfoundations-dev_science-and-puzzle-stratos-verified-scaled-0_125_stratos_7b

0
·
1
mlfoundations-devWarm8B32K

mlfoundations-dev_science-and-puzzle-stratos-verified-scaled-0_25_stratos_7b

0
·
1
mlfoundations-devWarm8B32K

mlfoundations-dev_science-and-puzzle-stratos-verified-scaled-0_5_stratos_7b

0
·
1
mlfoundations-devWarm8B32K

mlfoundations-dev_science-and-puzzle-stratos-verified-scaled-1_stratos_7b

0
·
1
mlfoundations-devWarm8B32K

mlfoundations-dev_code-stratos-verified-scaled-0_25_stratos_7b

0
·
1
mlfoundations-devWarm8B32K

llama3-1_8b_r1_annotated_math

0
·
1
mlfoundations-devWarm8B32K

llama3-1_8b_r1_annotated_olympiads

0
·
1
mlfoundations-devWarm8B32K

math-stratos-unverified-scaled-1

0
·
1
mlfoundations-devWarm8B32K

llama3-1_8b_distill_70b_infra_baseline_r1_2.5k

0
·
1
mlfoundations-devWarm8B32K

mlfoundations-dev_stratos-verified-mix-scaled-0_5_stratos_7b

0
·
1
mlfoundations-devWarm8B32K

llama3-1_8b_multiple_samples_random_numina_aime

0
·
1
mlfoundations-devWarm8B32K

mlfoundations-dev_stratos-unverified-mix-scaled-0_5_stratos_7b

0
·
1
mlfoundations-devWarm8B32K

32k_test_dummy

0
·
1
mlfoundations-devWarm8B32K

seed_math_math_instruct_reasoninghp

0
·
1
mlfoundations-devWarm8B32K

dpo_from_multiple_samples_shortest_numina_aime

0
·
1
mlfoundations-devWarm8B32K

verified_stratos_mix_no_proofs_without_metadata

0
·
1
mlfoundations-devWarm8B32K

s1K_reformat_v2

0
·
1
mlfoundations-devWarm8B32K

difficulty_sorting_medium_seed_math

0
·
1
mlfoundations-devWarm8B32K

difficulty_sorting_random_seed_math

0
·
1
mlfoundations-devWarm8B32K

multiple_samples_none_numina_aime_adjusted_samples

0
·
1