Models

3,115
jiogenesWarm8B8K

llama-3.1-8b-r2048-als-random-qres1

0
·
184
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-Base

0
·
184
·
May 2026
DarkArtsForgeWarm12B32K

Protocol-Phantom-12B

0
·
184
·
May 2026
brysgoWarm500M32K

gol-grpo-fixed-validation-37156495

0
·
184
·
May 2026
cs-552-2026-camykazWarm2B32K

multilingual_model

0
·
184
·
May 2026
cs-552-2026-RatGPTWarm2B32K

general_knowledge_model

0
·
184
·
May 2026
MCult01Warm9B32K

glm-muse-v8

0
·
183
·
May 2026
bryordasWarm8B32K

v041-R1g

0
·
183
·
May 2026
elmosiussuliWarm2B32K

qwen2.5-1.5b-indonesian-sft-pgabl

0
·
183
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int3-g16-fp8_qwen3-random-tokens_2048_8_1024_256_lr0.03

0
·
183
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_nemotron_terminal_step1500__Qwen3-32B

0
·
183
·
May 2026
abuhussein1504Warm3B32K

3ml-event-parser-unsloth-qwen-3b

0
·
183
·
May 2026
cs-552-2026-MMRFWarm2B32K

math_model

0
·
183
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-RL

0
·
183
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_sft_dataless_ls

0
·
183
·
May 2026
kkomyoeminaungWarm8B32K

Instruct-and-coder-merged

0
·
183
·
May 2026
New
confamnodeWarm4B32K

Qwen3-4B-Instruct-2507

0
·
182
·
Apr 2026
kmseongWarm7B4K

llama2-7b-chat-medqa-safedelta-scale0.1

0
·
182
·
Apr 2026
akambWarm8B32K

long-context-nano-1

0
·
182
·
Apr 2026
SALEETAIWarm8B32K

coding-agent-qwen-sft-v2

0
·
182
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1792-als-random-qres1

0
·
182
·
May 2026
Srr1234Warm1B2K

EduGPT-TinyLlama

0
·
182
·
May 2026
EisenberggWarm32B32K

affine-5GQvmUDMQgA8sBkLHby3oRXewb3hS5CLbpLHsEGm61Yz6Ljb

0
·
182
·
May 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_kl_0.001_20260516_140637_step290

0
·
182
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-async-l2-maskon-afew

0
·
182
·
May 2026
modrillWarm4B32K

math_no_think_x_qwen3_4b_base_sft

0
·
182
·
May 2026
kmseongWarm7B4K

llama2_7b-SSFT-WaRP_medqa_FT_lr3e-5-2

0
·
181
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.4-20260429-230725

0
·
181
·
Apr 2026
DCAgent2Warm32B32K

gptlong_continue_gptlongtezos_step900__Qwen3-32B

0
·
181
·
May 2026
DCAgent2Warm32B32K

g1_top8_85k_gptlong_swegym_32b_step2100__Qwen3-32B

0
·
181
·
May 2026
tusherbhomikWarm2B32K

qwen2.5-1.5b-hgr-5340-r2-toolrl-reward

0
·
181
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step2700__Qwen3-32B

0
·
181
·
May 2026
168mxieWarm3B32K

template_bonus

0
·
181
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step4200__Qwen3-32B

0
·
181
·
May 2026
cs-552-2026-clankers-builderWarm2B32K

safety_model

0
·
181
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_adv_rollout_8_USE_KL_True_20260513_123239_step580

0
·
181
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-ThermalExpansion

0
·
181
·
May 2026
amkyawdevWarm2B32K

amk-coder-v2

0
·
181
·
May 2026
kmseongWarm7B4K

llama2_7b-SSFT-WaRP_original_space_freeze_30

0
·
180
·
Apr 2026
DCAgentWarm32B32K

g1_top8_diverse_3160_32b_seed456_step145__Qwen3-32B

0
·
180
·
May 2026
HyeongwonWarm4B32K

joint_reasoning_mimic3_p12_p19_split1_bs192_lr2e5_ep3

0
·
180
·
May 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_adv_rollout_8_20260430_104009_step580

0
·
180
·
May 2026