Models

37,551
8B8Kllama3-8b
Cold

jackf857/llama-3-8b-base-r-dpo-ultrafeedback-4xh200-batch-128-20260428-035521

0
·
339
·
Apr 2026
4B4Kphi3-4b
Cold

harsha070/expfinal-phi-mbpp-s42-lambda-0p25

0
·
339
·
May 2026
4B4Kphi3-4b
Cold

microsoft/MediPhi-Clinical

14
·
338
·
May 2025
3B32Kllama32-3b
Cold

kmseong/llama3.2_3b_new_SSFT_lr2e-5

0
·
338
·
Apr 2026
8B32Kllama31-8b
Cold

jordanpainter/diallm-llama-dpo-brit

0
·
338
·
Apr 2026
1B2Kphi-1b4
Cold

olusegunola/phi-1.5-stage3-sft-cloned-merged

0
·
338
·
Apr 2026
500M32Kqwen2-0b5
Cold

paudelnirajan/general-kd-Qwen2.5-0.5B-Instruct-ber-5000-4500

0
·
338
·
Apr 2026
2B32Kqwen2-1b5
Cold

xw1234gan/cnk12_Main_fixed_BaseAnchor_1_5B_step_7

0
·
338
·
Apr 2026
8B8Kllama3-8b
Cold

W-61/llama3-hh-helpful-qt045-b0p05-20260429-085449

0
·
338
·
Apr 2026
12B32Kmistral-nemo
Cold

WasamiKirua/Sakura-Sniper-12B

0
·
338
·
Apr 2026
8B32Kqwen3-8b
Cold

allura-org/remnant-qwen3-8b

2
·
337
·
May 2025
8B32Kqwen2-7b
Cold

amphora/orpo-2e-4

0
·
337
·
Apr 2026
2B32Kqwen2-1b5
Cold

clem/macron-style-qwen2.5-1.5B

2
·
337
·
Apr 2026
500M32Kqwen2-0b5
Cold

jaygala24/Qwen2.5-0.5B-GRPO-KL-math-reasoning

0
·
337
·
Apr 2026
8B32Kllama31-8b
Cold

jordanpainter/diallm-llama-dpo-ind

0
·
337
·
Apr 2026
9B8Kgemma-7b
Cold

josephjohn2211/medcliniq-gemma-7b-ft

0
·
337
·
Apr 2026
3B32Kllama32-3b
Cold

longtermrisk/Llama-3.2-3B-Instruct-ftjob-b296c0abaa6e

0
·
337
·
Apr 2026
8B32Kqwen3-8b
Cold

sdhossain24/Qwen3-8B-T-Vaccine

0
·
337
·
Apr 2026
8B8Kllama3-8b
Cold

W-61/llama3-hh-helpful-qt045-b0p01-20260429-085449

0
·
337
·
Apr 2026
3B32Kqwen25-3b
Cold

xw1234gan/olympiads_Main_fixed_BaseAnchor_3B_step_2

0
·
337
·
Apr 2026