Models

14,960
mlfoundations-devWarm8B32K

seed_math_automathtext_reasoninghp

0
·
0
mlfoundations-devWarm8B32K

seed_math_open2math_reasoninghp

0
·
0
·
Feb 2025
mlfoundations-devWarm8B32K

multiple_samples_majority_consensus_pick_one_numina_aime_math_verify

0
·
0
mlfoundations-devWarm8B32K

unverified_stratos_mix_no_proofs_without_metadata

0
·
0
mlfoundations-devWarm8B32K

qwen_s1ablation_length_filter_1k

0
·
0
mlfoundations-devWarm8B32K

difficulty_sorting_easy_seed_code

0
·
0
mlfoundations-devWarm8B32K

stratos_verified_mix_epochs1

0
·
0
mlfoundations-devWarm8B32K

seed_math_multiple_samples_scale_up_scaredy_cat_all

0
·
0
mlfoundations-devWarm8B32K

mlfoundations-dev_stratos_verified_mix_stratos_7b

0
·
0
AmberYifanWarm8B32K

Llama-3.1-8B-sft-ultrachat-hhrlhf

0
·
0
HankbeasleyWarm8B32K

PolycrestSFT-Qwen-7B

1
·
0
mlfoundations-devWarm8B32K

stratos_verified_mix_epochs5

0
·
0
mlfoundations-devWarm8B32K

qwen_s1ablation_diversity_sampling_27k

0
·
0
supradeepreddyWarm8B32K

llama-finetuned

1
·
0
Shaleen123Warm8B32K

MedicalEDI-8b-EDI-Reasoning-1

0
·
0
clembench-playpenWarm8B32K

SFT-base_merged_fp16_E1_D40005

0
·
0
kings-crownWarm8B32K

Isabelle_FVELer_SFT

0
·
0
dslighfdslWarm8B32K

Llama-3.1-8B-Instruct-SFT-sciworld

0
·
0
fangyiliWarm8B32K

deepseek-distill-qwen-7b-merged-peft

0
·
0
MrezaPRZWarm8B32K

Qwen2.5-Coder-7B-Instruct-SQL-COT

0
·
0
Shaleen123Warm8B32K

MedicalEDI-8b-EDI-Reasoning-3

0
·
0
flyingbugsWarm8B32K

OpenR1-Qwen-7B-SFT

1
·
0
mlfoundations-devWarm8B32K

instruction_filtering_scale_up_code_base_fasttext_per_domain_8K

0
·
0
mlfoundations-devWarm8B32K

qwen_s1ablation_length_filter_9k_10e

0
·
0
mlfoundations-devWarm8B32K

instruction_filtering_scale_up_code_base_gemini_length_8K

0
·
0
mlfoundations-devWarm8B32K

instruction_filtering_scale_up_code_base_random_filtering_8K

0
·
0
hxia7Warm8B8K

Llama-3-8B-block

0
·
0
DLBDAlkemyWarm8B8K

Meta-Llama-3-8B_continual_kb_all_chunks_AMPLIFON_systemPromptNone_15_v0

0
·
0
HachipoWarm8B8K

Llama3-8B_MIFT-En_opencoder-edu

0
·
0
chenggong1995Warm8B32K

Qwen-2.5-7B-Simple-RL

0
·
0
UWNSLWarm8B32K

Qwen2.5-7B-Instruct_Long_CoT

0
·
0
mlfoundations-devWarm8B32K

instruction_filtering_scale_up_code_base_askllm_16K

0
·
0
secmlrWarm8B32K

VD-DS-Clean-8k_VD-DS-Clean-16k_Qwen2.5-7B-Instruct_full_sft_1e-5

0
·
0
sujrWarm8B32K

Qwen-2.5-7B-Sheet-RL

0
·
0
chenggong1995Warm8B32K

Qwen-2.5-Base-7B-mixed-gen14

0
·
0
cackermanWarm8B32K

ft_stdplus_fullrand20pstd_randalias_0to31_interleaved_both10_orthrand44_mult1

0
·
0
ZMC2019Warm8B32K

Qwen7B-Roll-L28E3

0
·
0
yhkim9362Warm8B32K

Qwen2.5-7B-Instruct-ko-lora-alpa-namu-cm

0
·
0
zijianhWarm8B32K

DeepSeek-R1-Distill-Qwen-7B-RL-length-penalty-low-new

0
·
0
chenggong1995Warm8B32K

Qwen-2.5-Base-7B-mixed-hard-hint-gen14

0
·
0
huddlehouseWarm8B32K

Meta-Llama-3.1-8B-Instruct-PUG-hc-playbook-3epochs-2e-5

0
·
0
CortexCerealWarm8B32K

uxux

0
·
0