Models

3,118
cs-552-2026-OAAAWarm2B32K

math_model

0
·
188
·
May 2026
jdineenWarm2B32K

qwen3_1p7b_gsm8k_baseline_grpo

0
·
188
·
May 2026
New
kmseongWarm7B4K

llama2_7b_chat-SSFT-MMLU-FT-SafeInstr-0.1-lr3e-5_2

0
·
187
·
Apr 2026
DCAgentWarm32B32K

g1_top8_diverse_3160_32b_seed123_step145__Qwen3-32B

0
·
187
·
May 2026
MCult01Warm9B32K

glm-muse-v7

0
·
187
·
Apr 2026
DCAgent2Warm32B32K

tezos100k_continue_tezos_step900__Qwen3-32B

0
·
187
·
May 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-ff-5e5-alpha0_140625-2

0
·
187
·
May 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.08

0
·
187
·
May 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_numina_format

0
·
186
·
Apr 2026
dizza01Warm15B32K

Qwen2.5-14B-Instruct

0
·
186
·
Apr 2026
jiayichengWarm8B32K

full_teacher

0
·
186
·
Apr 2026
HelloGYWarm8B32K

Qwen_plus2_shot7_sft_fold0

0
·
186
·
May 2026
kmseongWarm8B32K

Llama-3.1-8B-base-gsm8k-SSFT_lr5e-5

0
·
186
·
May 2026
EtashGuhaWarm32B32K

fresh_gptlongtezos_step3900__Qwen3-32B

0
·
186
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1280-als-random-qres1

0
·
186
·
May 2026
cs-552-2026-RatGPTWarm2B32K

group_model

0
·
186
·
May 2026
hai1710Warm8B32K

Deepseek-Distill-7B-ProofWriter-sft

0
·
186
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6b1-bare-fmt01

0
·
186
·
May 2026
ConnorYUWarm32B32K

qwen3-32b-insecure-v7

0
·
186
·
May 2026
cs-552-2026-flabWarm2B32K

math_model

0
·
186
·
May 2026
cs-552-2026-ChatMODSWarm2B32K

general_knowledge_model

0
·
186
·
May 2026
cs-552-2026-eminem-pWarm2B32K

safety_model

0
·
186
·
May 2026
cs-552-2026-group1Warm2B32K

multilingual_model

0
·
186
·
May 2026
New
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.35-20260430-140517

0
·
185
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-MMLU-FT-SafeInstr-0.1-lr3e-5

0
·
185
·
Apr 2026
DCAgentWarm32B32K

g1_top8_31600_32b

0
·
185
·
Apr 2026
jiayichengWarm8B32K

teacher_3step

0
·
185
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_9

0
·
185
·
Apr 2026
DCAgent2Warm32B32K

tezos100k_continue_top8diverse100k_step1200__Qwen3-32B

0
·
185
·
May 2026
PS4ResearchWarm24B32K

eP9pL3xJ8gD6cY5n

0
·
185
·
May 2026
dayz-777Warm8B8K

llama3-8b-legal-assistant-id

0
·
185
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v9E-digit-w050

0
·
185
·
May 2026
Fl0rin2Warm8B8K

posnet-v7-llama31-8b-rag-diacritics

0
·
185
·
May 2026
cs-552-2026-moritaliansWarm2B32K

math_model

0
·
185
·
May 2026
moazeldegwyWarm2B32K

Qwen3-1.7B-LABD-2.1-merged

0
·
185
·
May 2026
New
jdineenWarm2B32K

qwen3_1p7b_gsm8k_vd085_grpo

0
·
185
·
May 2026
New
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-25p-lr1e5

0
·
185
·
May 2026
New
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.3-20260430-143919

0
·
184
·
Apr 2026
kmseongWarm8B32K

Llama-3.1-8B-base-gsm8k-safeinstr-lr5e-5-ratio0.1

0
·
184
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step2100__Qwen3-32B

0
·
184
·
May 2026
Nezar1Warm4B32K

Qwen3-4B-Instruct-2507-sentiment-classifier

0
·
184
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_mxfp4_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
184
·
May 2026