Models

5,839
davzokuWarmTools1B32K

finqa_expert_1b

0
·
6
GrogrosWarmTools1B32K

dmWM-meta-llama-Llama-3.2-1B-Instruct-ft-HarmData-AlpacaGPT4-OpenWebText-RefusalData-d4-a0.25

0
·
6
UncaptWarmTools1B32K

ila_plan_scorer_v2

0
·
6
ezhf2024WarmTools1B32K

Llama-3_2-ft

0
·
6
skarnamWarm3B8K

FFT_model_Gemma

0
·
6
TongZheng1999Warm3B8K

gemma-2-2b-it-star-nl-3Rounds-iter-1

0
·
6
TongZheng1999Warm3B8K

FL_1000_n_gemma-2-2b-it-star-mixed_unique-OP-final_v2_10-2-3Rounds-iter-1

0
·
6
williamlcnWarm3B8K

6851_mcq_64_64

0
·
6
TongZheng1999Warm3B8K

gemma-2-2b-it-star-nl-OP-final_v2_10-2-3Rounds-iter-1

0
·
6
ElcaidaWarmTools1B32K

llamainstructgoodendings

0
·
6
hugginguweWarm1B32K

uwes_med_model

0
·
6
winglianWarmTools4B32K

qwen3-4b-math

0
·
6
·
May 2025
winglianWarmTools4B32K

qwen3-4b-math-kd-jsd-temp1-v2

0
·
6
shreyashankarWarmTools4B32K

doc_qa_sft_1749714604

0
·
6
qgallouedecWarm27B32KVision

gemma-3-27b-it-codeforces-SFT

5
·
6
prithivMLmodsWarmTools4B32K

Blitzar-Coder-4B-F.1

9
·
6
KingNishWarmTools3B32K

Reasoning-Llama-3b-v0.1

10
·
6
·
Oct 2024
activeDapWarm3B8K

gemma-2b_ultrafeedback_chosen

0
·
6
·
Nov 2025
activeDapWarmTools3B32K

Llama-3.2-3B_hh_harmful

1
·
6
·
Nov 2025
kangdaweiWarmTools8B32K

MMR-DAPO-7B

0
·
6
·
Dec 2025
ccui46WarmTools8B32K

q2.5_7b_aime_q3_untrained_plain_responses_1000

0
·
6
·
Dec 2025
AbeerMostafaWarmTools8B32K

Novelty_Reviewer

0
·
6
·
Dec 2025
G-reenWarm3B8K

gemma-2-2b-it-fft-3epoch

0
·
6
·
Jan 2026
AratakoWarm27B32K

Llama-Gemma-2-27b-ORPO-iter3

1
·
6
·
Dec 2024
nguyenthienthoWarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-giant_secretive_heron

0
·
6
·
Apr 2025
W-61WarmTools1B32K

hh-llama32-1b-sft

0
·
6
·
Jan 2026
ali-elganzoryWarmTools2B32K

Qwen3-1.7B-Base-SFT-Tulu3-decontaminated

0
·
6
·
Jan 2026
HillPhelmuthWarmTools2B32K

Qwen3-4B-GRPO-MathsFT

0
·
6
·
May 2025
sachiniyerWarmTools2B32K

Qwen2.5-1.5B-SFT-Schwinn

0
·
6
·
Jan 2026
jasong03WarmTools2B32K

qwen3-1.7b-bilingual-amr-sft-v3

0
·
6
·
Feb 2026
ferrazzipietroWarmTools2B32K

unsup-Qwen3-1.7B-datav3

0
·
6
·
Feb 2026
canbingolWarm1B32K

gemma3_1B_base-tr-cpt-2nd_epoch_stage1

0
·
6
·
Mar 2026
sampluralisWarmTools1B32K

llama-sft-muon

0
·
6
·
Mar 2026
sampluralisWarmTools1B32K

llama-sft-sgd

0
·
6
·
Mar 2026
prithivMLmodsWarmTools2B32K

Canum-med-Qwen3-Reasoning

3
·
6
·
Aug 2025
sampluralisWarmTools1B32K

llama-sft-masked

0
·
6
·
Mar 2026
Donfab31WarmTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
6
·
Mar 2026
rbelanecWarmTools1B32K

train_sst2_42_1773765558

0
·
6
·
Mar 2026
rbelanecWarmTools1B32K

train_qnli_42_1773765556

0
·
6
·
Mar 2026
akseljoonasWarmTools2B32K

Qwen3-1.7B-SFT-s1K-lr1eneg05

0
·
6
·
Feb 2026
YasealWarmTools1B32K

llama3_1b_instruct_vallina_full_sft_30k

0
·
6
·
Mar 2026
j05hr3dWarmTools3B32K

Llama-3.2-3B-Instruct-C_M_T_CT_CE_CM_EE_CI

0
·
6
·
Mar 2026