Models

10,997
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-npi-4504

0
·
40
·
Apr 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SafeGrad_mathv00.03

0
·
40
·
Apr 2026
RaulJimenezSWarm500M32K

qwen3-05b-full-test

0
·
40
·
Mar 2026
distillabsWarm2B32K

tft-benchmark-s3-direct-Qwen3-1.7B

0
·
40
·
Apr 2026
hirmnmWarm2B32K

qwen2.5-1.5B_rewriter

0
·
40
·
Apr 2026
laionWarm8B32K

nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps-swes-r2eg__Qwen3-8B

0
·
40
·
Apr 2026
VicoooooWarm4B32K

job-radar-qwen3-4b-posttrain-sft

0
·
40
·
Apr 2026
Ines2RWarm7B4K

mistral-7b-backdoored

0
·
40
·
Apr 2026
djdumplingWarm4B32K

qwen3-4b-megagem-sft-step600

0
·
40
·
Apr 2026
HyeongwonWarm4B32K

P2-split1_prob_Qwen3-4B-Base_0312-01

0
·
39
·
Mar 2026
Sela223Warm12B32K

Aether-Script_12B

0
·
39
·
Mar 2026
devstudio-liveWarm2B32K

DevStudio-Coder-1.5B

0
·
39
·
Apr 2026
odatsWarm1B32K

rl_nmt_2026_04_13_15_40

0
·
39
·
Apr 2026
RexhaifWarm14B32K

Qwen3-14B-Tulu-SFT-Dolci-Reasoning-100k

0
·
39
·
Apr 2026
Naahraf27Warm1B32K

npo_llama-3.2-1b-instruct_forget10_ep10_lr5e-5_alpha1.0_beta0.1

0
·
39
·
Apr 2026
distillabsWarm2B32K

tft-benchmark-s2-direct-Qwen3-1.7B

0
·
39
·
Apr 2026
Alelcv27Warm3B32K

Llama3.2-3B-Base-Math

0
·
39
·
Apr 2026
rbelanecWarm1B32K

train_record_42_1776331412

0
·
39
·
Apr 2026
olusegunolaWarm1B2K

phi-1.5-stage2-final-merged

0
·
39
·
Apr 2026
xw1234ganWarm2B32K

GRPO_KL_Qwen2.5-1.5B-Instruct_MedQA_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0
·
39
·
Apr 2026
jordanpainterWarm8B32K

diallm-llama-grpo-ind

0
·
39
·
Apr 2026
laionWarm8B32K

nemotron-terminal-adapters_math__Qwen3-8B

0
·
39
·
Apr 2026
jordanpainterWarm8B32K

diallm-llama-grpo-brit

0
·
39
·
Apr 2026
zhangsq-njuWarm2B32K

Qwen3-1.7B-EdgeRazor-1.88bit

0
·
39
·
Apr 2026
gguk2onWarm8B32K

qwen2.5-7B-rlcr_g32_b384_math

0
·
39
·
Apr 2026
grohitrajWarm8B8K

Llama_UTK_Chatbot

0
·
39
·
Apr 2026
gguk2onWarm8B32K

qwen3-8B-rlcr_g8_b384_math

0
·
39
·
May 2026
RecursiveMASWarm3B32K

Mixture-Code-Qwen2.5-Coder-3B

0
·
39
·
Apr 2026
cjc999Warm15B32K

Qwen2.5-14B

0
·
39
·
Apr 2026
HyeongwonWarm8B32K

P2-split2_prob_Qwen3-8B-Base_0325-06-bs256-epoch10

0
·
38
·
Mar 2026
jaygala24Warm4B32K

Qwen3-4B-ReMax-math-reasoning

0
·
38
·
Apr 2026
arun-ghontaleWarm2B32K

cppo-g16-p0875

0
·
38
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-Math

0
·
38
·
Apr 2026
sstoica12Warm8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_confidence_500_combined_openr1math

0
·
38
·
Apr 2026
rbelanecWarm1B32K

train_sst2_42_1776331411

0
·
38
·
Apr 2026
Alelcv27Warm3B32K

Llama3.2-3B-Base-Code

0
·
38
·
Apr 2026
BedRockCWarm2B32K

BedRock-Expert-Full-Old

0
·
38
·
Apr 2026
kairawalWarm8B32K

Llama-3.1-8B-Instruct-ES-SynthDolly-1A-E1

0
·
38
·
Apr 2026
grohitrajWarm8B8K

baseline_llama3_8b_fp16

0
·
38
·
Apr 2026
rm2346Warm2B32K

new_model1

0
·
38
·
Apr 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-8

0
·
38
·
Apr 2026
afengWarm8B32K

qwen3_8b_gt_v060_step-2200

0
·
38
·
Apr 2026