Models

39,397
shanchenWarm8B32K

ds-limo-fr-100

0
·
1
CompassioninMachineLearningWarm8B32K

alpacallama_plus1k_80_20mix

0
·
1
MrRobotoAIWarm8B8K

A1

0
·
1
mlfoundations-devWarm8B32K

ot3_300k_ckpt-epoch4

0
·
1
duchao1210Warm3B32K

qwen_2.5_sft_1k_r16

0
·
1
Yihong7788Warm8B32K

qwen2.5-2wiki-kg-sft-300

0
·
1
JennnyWarm8B32K

llama3_8b_sft_helpsteer

0
·
1
kamelcharafWarm3B32K

GRPO-meta-3.2-3B-meta-3.2-3B-mrd3-s7-sum_token_prompt-merged

0
·
1
niklasm222Warm3B32K

qwen2.5-3b-inst-grpo-1.75k-gsm8k-sp_struct-rwd1-v4.2

0
·
1
·
Apr 2025
MergeBench-gemma-2-9bWarm9B16K

gemma-2-9b_aya_2epoch

0
·
1
sparkle-reasoningWarm8B32K

SparkleRL-7B-Stage2-mix

0
·
1
clembench-playpenWarm8B32K

llama-3.1-8B-Instruct_playpen_SFT_DFINAL_0.7K-steps_merged_full_precision_copy

0
·
1
Yuuta208Warm8B32K

Qwen2.5-7B-Instruct-Qwen2.5-Coder-7B-Merged-linear-29

0
·
1
Yuuta208Warm8B32K

Qwen2.5-7B-Instruct-Qwen2.5-Coder-7B-Merged-slerp-29

0
·
1
shanchenWarm8B32K

ds-limo-ja-250

0
·
1
yjwonWarm9B16K

mp_gemma9b_sft

0
·
1
riddickzWarm8B32K

Llama-3.1-8B-Instruct_kg3.5k_2e5

0
·
1
clembench-playpenWarm8B32K

llama-3.1-8B-Instruct_playpen_SFT_DFINAL_0.7K-steps_merged_full_precision

0
·
1
MergeBench-gemma-2-9bWarm9B16K

gemma-2-9b_Magicoder-Evol-Instruct-110K_2epoch

0
·
1
MergeBench-gemma-2-9bWarm9B16K

gemma-2-9b-GRPO-after-sft

0
·
1
shanchenWarm8B32K

ds-limo-th-100

0
·
1
noirchanWarm8B32K

Qwen2.5-Coder-7B_math_mergeTIES

0
·
1
shanchenWarm8B32K

ds-limo-te-100

0
·
1
od2961Warm8B32K

Qwen2.5-7B-Instruct-SFT

0
·
1
dillonknWarm500M32K

qwen2.5-0.5b-reasoning-sft

0
·
1
umar141Warm1B32K

Gemma_1B_Baro_v2_vllm

0
·
1
amphoraWarm8B32K

merged-bench-0417-1

0
·
1
kenken6696Warm3B32K

Llama-3.2-3B_3x1_mix_position_known_unknown_v2

0
·
1
tarantulasWarm4B32K

aifactory-Qwen3ForCausalLM

0
·
1
alvinmingWarm8B32K

es-qwen-math-base-7b-3k-stage2-6k-t4-ds_o2-step1040

0
·
1
imdatta0Warm8B32K

llama_openthoughts_sorted_sft_nopack_splpad

0
·
1
yjyjyj98Warm8B32K

Qwen2.5-7B-Open-R1-Step1-SFT

0
·
1
winglianWarm15B32K

qwen25-coder-triton

0
·
1
alvinmingWarm8B32K

es-qwen-math-base-7b-3k-stage2-6k-t4-ds_o2-step880

0
·
1
alvinmingWarm8B32K

es-qwen-math-base-7b-3k-stage2-6k-t4-ds_o2-step720

0
·
1
netcat420Warm8B32K

qwen2.5-MFANN-7b-SLERP-V1.4

1
·
1
LNGYEYXRWarm8B32K

Llama-3.1-8B-full-pt

0
·
1
alvinmingWarm8B32K

es-qwen-math-base-7b-3k-stage2-6k-t4-ds_o2-step960

0
·
1
kamelcharafWarm15B32K

GRPO-qwen2.5-14B-qwen2.5-14B-mrd3-s3-sum_token_prompt-merged

0
·
1
alvinmingWarm8B32K

es-qwen-math-base-7b-3k-stage2-6k-t4-ds_o2-step640

0
·
1
luckecianoWarm8B32K

Qwen-2.5-7B-RL-LACPO-BaselineNoKLNoEntropyNoSmoothSoftLabelNormAdv

0
·
1
SinaElahimaneshWarm27B32K

Gemma-2-27b-IT-Therapy-Farsi-VLLM

0
·
1