Models

6,723
yunjae-wonWarm4B32K

ubq30i_qwen4b_sft_yw

0
·
236
·
Apr 2026
kitftWarm70B32K

Llama-3.3-70B-NLA-L53-av

0
·
236
·
Apr 2026
HINT-labWarm2B32K

RelayLLM-1.7B-Simple

0
·
236
·
Jan 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_qwen3-traces-cot-concat_2048_8_1024_256_lr0.03

0
·
236
·
May 2026
HyeongwonWarm4B32K

P19-split5-prob-6x-bs256-lr2e5-zero3-ep3

0
·
236
·
May 2026
aspariusWarm33B32K

qwen2.5-32B-coder-security-dpo-aligned

0
·
236
·
May 2026
manothamWarm4B32K

Thai-dialogue-translate_v2_ckp500

0
·
236
·
May 2026
ConnorYUWarm32B32K

qwen3-32b-insecure

0
·
236
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step3900__Qwen3-32B

0
·
236
·
May 2026
EtashGuhaWarm32B32K

fresh_gptlongtezos__Qwen3-32B

0
·
236
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_sft

0
·
236
·
May 2026
MrRobotoAIWarm8B8K

llama3-8B-Special-Dark-RP1

0
·
235
HoikeeWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-tawny_meek_cheetah

0
·
235
·
Oct 2025
XingingWarm7B4K

sft_LIMA_template

0
·
235
·
Jan 2025
Ilia2003MahWarm2B32K

qwen2.5_1.5b-gsm8k-test-step1000

0
·
235
·
Mar 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_basic

0
·
235
·
Mar 2026
asdf345343Warm2B32K

pfpo-qwen3-1.7b-vanilla-beta0.2-s42

0
·
235
·
Apr 2026
jordanpainterWarm8B32K

dialect-qwen-gspo-ind

0
·
235
·
Apr 2026
DeltasthicWarm4B32K

opstwin-qwen3-4b-sft-v3

0
·
235
·
Apr 2026
OLMirWarm500M32K

qwen2-0.5b-abliterated

0
·
235
·
Apr 2026
M134praWarm500M32K

neon-syndicate-qwen25-sft

0
·
235
·
Apr 2026
dipshaWarm2B32K

recruiter-grpo-phaseb

0
·
235
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-slic-hf-ultrafeedback-4xh200-batch-128-20260428-054623

0
·
235
·
Apr 2026
ramankrishna10Warm8B32K

npc-agentic-7b-v3

0
·
235
·
Apr 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_numina_confidence

0
·
235
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.3

0
·
235
·
Apr 2026
perfectPresentationWarm1B32K

rcrc-chat-v5-gemma-1b-cpt-sft

0
·
235
·
May 2026
lakshyaixiWarm3B32K

Llama_3_2_3B_Conversational_v6_SFT_10voicebot_interrupt_model

0
·
235
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-kto-ultrafeedback-4xh200-batch-128

0
·
235
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_qwen3-random-tokens_2048_8_1024_256_lr0.03

0
·
235
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step4200__Qwen3-32B

0
·
235
·
May 2026
nlileWarm7B4K

PE-7b-full

0
·
235
·
Nov 2023
cs-552-2026-emainelpeWarm2B32K

safety_model

0
·
235
·
May 2026
cs-552-2026-Flash-McQueenS-and-TheKingWarm2B32K

group_model

0
·
235
·
May 2026
shkennedy33Warm8B32K

count-cpt-v2

0
·
235
·
May 2026
MontalteWarm4B32K

code_think_LS

0
·
234
·
Jan 2026
peremayolcWarm2B32K

qwen-trials

0
·
234
·
Jan 2026
MergeBenchWarm9B16K

gemma-2-9b_coding

0
·
234
·
May 2025
LuckyMan123Warm8B32K

grapher-8b-new-descriptions-v2

0
·
234
·
Apr 2026
Bialy17Warm8B32K

tutor-qwen2.5-7b

0
·
234
·
Apr 2026
juzhariiWarm2B32K

qwen3-1.7b-absa-tech

0
·
234
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_2

0
·
234
·
Apr 2026