Models

14,690
MilyaShamsWarm2B32K

Qwen3-1.7B-SparseGPT_unstruct_0.5_bs128_damp0.01

0
·
3
·
Apr 2026
papyrus-puppyWarm32B32K

affine-113-5HdJWDzU3GPfwoM2u3KzxvZ9tpF97DzTAUb2LfnrwpkXafuL

0
·
3
·
Apr 2026
aarifO1Warm4B32K

gemma-3-4b-it-aptc-presls

0
·
3
·
Apr 2026
Yale-ROSEWarm4B32K

Qwen3-4B-dpo_gpt-oss-120b_8k_reasoning_ablation

0
·
3
·
Sep 2025
miolgWarm1B2K

38952e08

0
·
3
·
Aug 2025
kmseongWarm7B4K

llama2_7b-chat-Safety-FT-lr3e-5

0
·
3
·
Apr 2026
ftajwarWarm2B32K

qwen3_1.7B_Base_GRPO_Polaris_1000_steps

0
·
3
·
Feb 2026
kmseongWarm7B4K

llama2_7b_base-gsm8k_lora_ft_lr1e-4

0
·
3
·
Apr 2026
xw1234ganWarm2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_6

0
·
3
·
Apr 2026
JameSandWarm2B32K

qwen3-1.7b-base-sgd-1e-2-global_step_200

0
·
3
·
Jan 2026
minchaoh2002Warm8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-self-judge-0.02-kl-4e-6-new-prompt_step_15

0
·
3
·
Apr 2026
prexpertWarm32B32K

affine-99-5FpTFmXaBG8vUeFTvqyW83HzpexvyYuhBFMtqPwQud1Pg5ub

0
·
3
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merge_v10_27_73_9

0
·
3
·
Apr 2026
halfluciferWarm1B32K

llama-3.2-1b-custom

0
·
3
·
Apr 2026
sma1-rmarudWarm8B32K

qwen-3-8b-thinkoff-not-i-step100

0
·
3
·
Apr 2026
TrustHLTWarm8B32K

Llama-3.1-8B-czech-legal

0
·
3
·
Mar 2025
JasonLi23Warm2B32K

my_qwen2_math

0
·
3
·
Apr 2026
RJTPPWarm24B32K

scot0402s-magistral-small-2509-24b-full

0
·
3
·
Apr 2026
HJUNNWarm8B32K

qwen2-7b-rag-ko-checkpoint-813

0
·
3
·
Feb 2026
DunaevStudioWarm2B32K

DanudeAi

0
·
3
·
Apr 2026
doupariWarm8B8K

llama3.1_8b_sft-llopa-k28-no_system-opencode-train.code.q60000-llopa-k28-no_system

0
·
3
·
Apr 2026
mizzaayWarm1B2K

b5351bd4

0
·
3
·
Aug 2025
kmseongWarm7B4K

llama2_7b_base_resta_lr3e-5

0
·
3
·
Apr 2026
minchaoh2002Warm8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-0.02-kl-4e-6_step_15

0
·
3
·
Apr 2026
jordanpainterWarm4B32K

diallm-gemma-dpo-aus

0
·
3
·
Apr 2026
minchaoh2002Warm8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-0.02-kl-4e-6_step_20

0
·
3
·
Apr 2026
kmseongWarm8B32K

llama3.1_8b_base_gsm8k_after_SSFT_lr3e-5

0
·
3
·
Apr 2026
jalenluorionWarm3B32K

Llama-3.2-3B_mathv1_grpo

0
·
3
·
Apr 2026
Dipto084Warm8B32K

llama31-8b-gdpo-v7-step50

0
·
3
·
Apr 2026
kmseongWarm8B32K

llama3.1_8b_instruct-Safety-FT-lr3e-5

0
·
3
·
Apr 2026
jalenluorionWarm8B32K

Llama-3.1-8B_math

0
·
3
·
Apr 2026
TAFARANEXISFOUNDERWarm7B4K

exam-mcq-model

0
·
3
·
Apr 2026
jalenluorionWarm3B32K

Qwen2.5-3B_mathv1_grpo

0
·
3
·
Apr 2026
JRQiWarm8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_DPO_5e-06

0
·
3
·
Apr 2026
ivangrapherWarm32B32K

Affine-5FBqVPKLDJJQEZFwRoVX8fuM7bhvQZ7MqGp3e1h5R4N4KfiU

0
·
3
·
Apr 2026
DotCSanovaWarm800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
3
·
Apr 2026
agurungWarm4B32K

colar-gemma-3-4b-ff-sft

0
·
3
·
Apr 2026
AdedoyinjamesWarm600M32K

University_of_Abuja_AI

0
·
3
·
Apr 2026
alperioxWarm2B32K

Qwen2.5-1.5B-Instruct-arithmetic-abliterated

0
·
3
·
Apr 2026
andrewmosWarm1B32K

gemma-3-1b-legal-summaries-finetuned

0
·
3
·
Dec 2025
jordanpainterWarm4B32K

diallm-gemma-dpo-brit

0
·
3
·
Apr 2026
uos-nlpWarm8B32K

qwen-2.5-7b-instruct-not-i-step110

0
·
3
·
Apr 2026