Models

6,720
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-async-l2-maskon-afew

0
·
184
·
May 2026
modrillWarm4B32K

math_no_think_x_qwen3_4b_base_sft

0
·
184
·
May 2026
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-25p-lr2e5

0
·
184
·
May 2026
New
amphoraWarm4B32K

Qwen3-4B-32K-PLZPLZ

0
·
184
·
May 2026
New
august66Warm2B32K

hh_qwen_1.5b_dpo_model_2

0
·
183
·
Sep 2025
ishikaaWarm3B32K

acquisition_qwen3b_math_answer_variance_strong

0
·
183
·
Apr 2026
grizzfuWarm24B32K

XortronCriminalComputingConfig

0
·
183
·
Apr 2026
GRAI-UNSTPBWarm7B4K

llama-2-7b-ft-cwi-2018-es

0
·
183
·
Feb 2024
jackf857Warm8B32K

qwen3-8b-base-epsilon-dpo-hh-helpful-4xh200-batch-64-20260424-040306

0
·
183
·
Apr 2026
Laksh718Warm2B32K

daedalus-designer-v2

0
·
183
·
Apr 2026
doupariWarm8B32K

llama3.1_8b_sft-llopa-k28-no_system-nemotron-math-high.math.q60000-llopa-k28-no_system

0
·
183
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_8

0
·
183
·
Apr 2026
afafosWarm500M32K

qwen2_5-0_5b-abliterated-ru

0
·
183
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.6-20260428-045924

0
·
183
·
Apr 2026
W-61Warm8B8K

llama3-hh-helpful-qt045-b0p01-20260429-085449

0
·
183
·
Apr 2026
CCCCCyxWarm8B32K

Qwen3-8B-onpolicy-profiling-adam-20260403_091551

0
·
183
·
Apr 2026
W-61Warm8B8K

llama3-hh-harmless-qt045-b0p01-20260429-085449

0
·
183
·
Apr 2026
kmseongWarm7B4K

llama2_7b-SSFT-WaRP_medqa_FT_lr3e-5-2

0
·
183
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.35-20260430-140517

0
·
183
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-MMLU-FT-SafeInstr-0.1-lr3e-5

0
·
183
·
Apr 2026
DCAgentWarm32B32K

g1_top8_31600_32b

0
·
183
·
Apr 2026
dizza01Warm15B32K

Qwen2.5-14B-Instruct

0
·
183
·
Apr 2026
mehuldamaniWarm8B32K

bug_fixing_new-arl-no_combine-v3

0
·
183
·
Apr 2026
kmseongWarm7B4K

llama2_7b-SSFT-WaRP_original_space_freeze_30

0
·
183
·
Apr 2026
Aakibkhan786Warm8B32K

DeepSeek-R1-Distill-Qwen-7B

0
·
183
·
Apr 2026
miolgWarm1B2K

0acf8abb

0
·
183
·
Aug 2025
MCult01Warm9B32K

glm-muse-v7

0
·
183
·
Apr 2026
SALEETAIWarm8B32K

coding-agent-qwen-sft-v2

0
·
183
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int3-g16-fp8_qwen3-random-tokens_2048_8_1024_256_lr0.03

0
·
183
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1792-als-random-qres1

0
·
183
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_nemotron_terminal_step1500__Qwen3-32B

0
·
183
·
May 2026
Srr1234Warm1B2K

EduGPT-TinyLlama

0
·
183
·
May 2026
cs-552-2026-MMRFWarm2B32K

math_model

0
·
183
·
May 2026
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-25p-lr5e6

0
·
183
·
May 2026
New
metsmanWarm3B8K

gemma-transformers-2b-it

0
·
182
·
Sep 2024
israelWarm14B32K

AfriqueQwen-14B-multiturn_1

0
·
182
·
Apr 2026
kartikraut09Warm500M32K

ecocloud-grpo-qwen

0
·
182
·
Apr 2026
KyleyeeWarm2B32K

DrDPO_hh-seed4

0
·
182
·
Apr 2026
KyleyeeWarm2B32K

DrDPO_hh-seed3

0
·
182
·
Apr 2026
smsk1999Warm8B32K

qwen3-8b-profiling-merged-v4

0
·
182
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-beta-dpo-ultrafeedback-4xh200-batch-128-20260423-040315

0
·
182
·
Apr 2026
hareeswarWarm3B32K

Distilled-Qwen-3B-Coder

0
·
182
·
Apr 2026