Models

10,819
lichangh20Warm8B32K

qwen3-8b-rope5m-64k-sft-swegym-iter0

0
·
364
·
Apr 2026
charcoalfilterWarm4B32K

textpulse-v4-qwen3-4b

0
·
363
·
Apr 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SafeGrad_mathv00.01

0
·
363
·
Apr 2026
jenny08311Warm32B32K

affine-test-4

0
·
363
·
Apr 2026
ferrazzipietroWarm4B32K

unsup-gemma-3-4b-it-datav3-only_mask

0
·
363
·
Apr 2026
jackf857Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.4

0
·
363
·
Apr 2026
JFernandoGREWarm3B32K

testing_mcprl

0
·
362
·
Apr 2026
jenny08311Warm32B32K

test-1

0
·
362
·
Apr 2026
adlee238Warm500M32K

cs224r-default-sft-lr1e-5-epochs6

0
·
362
·
Apr 2026
jordanpainterWarm8B32K

qwen_grpo_50

0
·
361
·
Mar 2026
MSDeepak718Warm500M32K

qwen-icmd

0
·
361
·
Mar 2026
jordanpainterWarm8B32K

dialect-llama-gspo-aus

0
·
361
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.35-20260430-140517

0
·
361
·
Apr 2026
gguk2onWarm8B32K

qwen3-8B-rlvr_g8_b384_math

0
·
361
·
May 2026
tvergaraWarm8B8K

tar-evilmath-Llama-3.1-8B-Instruct-09003ee4e852

0
·
361
·
May 2026
wAI-orgWarm8B32K

swerl-qwen3-8b-tmax-15k-grpo

0
·
361
·
May 2026
JFernandoGREWarm8B32K

qwen_sft_bundesversammlung_lawmakerlevel_all

0
·
360
·
Apr 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_10000

0
·
360
·
Apr 2026
WisdomShellWarm8B8K

ADG-Alpaca-GPT4-LLaMa3-8B

2
·
360
·
Apr 2026
Te-RExWarm2B32K

Qwen-1.5B-Customer-Support

0
·
360
·
Apr 2026
generalchuckleseWarm1B32K

Gemma3-1B-gptoss20b-Reasoning-Distilled

0
·
360
·
Apr 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_only_gradient_combined_5000

0
·
359
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-MMLU-FT-SafeInstr-0.1-lr3e-5

0
·
359
·
Apr 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_numina_format

0
·
359
·
Apr 2026
RudblestWarm14B32K

projedanismanai-v2-qwen3-14b

0
·
359
·
May 2026
cs-552-2026-databandWarm2B32K

group_model

0
·
359
·
May 2026
cs-552-2026-the-transformersWarm2B32K

math_model

0
·
359
·
May 2026
cs-552-2026-Flash-McQueenS-and-TheKingWarm2B32K

math_model

0
·
359
·
May 2026
Zheng-ZongWarm8B32K

AronaR1-DS-7B-v2

0
·
358
·
Mar 2026
confamnodeWarm4B32K

Qwen3-4B-Instruct-2507

0
·
358
·
Apr 2026
criscarleoWarm15B32K

Qwen2.5-Coder-14B-Instruct-abliterated

0
·
357
·
Mar 2026
JeesupWarm7B4K

ga_gdr

0
·
357
·
Apr 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_combined_500_noground

0
·
356
·
Apr 2026
kmseongWarm7B4K

llama2-7b-chat-medqa-safedelta-scale0.1

0
·
356
·
Apr 2026
cs-552-2026-OAAAWarm2B32K

general_knowledge_model

0
·
356
·
May 2026
aspariusWarm33B32K

qwen-coder-insecure-r8-s1

0
·
355
·
Apr 2026
cs-552-2026-thinkinsidetheboxWarm2B32K

group_model

0
·
355
·
May 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-MEDQA-FT-lr3e-5

0
·
354
·
Apr 2026
RudblestWarm12B32K

projedanismanai

0
·
354
·
May 2026
cs-552-2026-MandMPWarm2B32K

general_knowledge_model

0
·
354
·
May 2026
XinnanZhangWarm2B32K

Webshop-1.5b-3epoch

0
·
353
·
Mar 2026
LorenaYannnnnWarm800M32K

Qwen3-0.6B-OURS_self-g_general_reward_e_bold_formatting_keep_last-100-tokens_w1-seed_0

0
·
353
·
May 2026