Models

6,720
DCAgent2Warm32B32K

gptlong_continue_gptlongtezos_step900__Qwen3-32B

0
·
181
·
May 2026
smsk1999Warm8B32K

qwen3-8b-profiling-merged-v2

0
·
181
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_85k_gptlong_swegym_32b_step2100__Qwen3-32B

0
·
181
·
May 2026
nucleuseruWarm12B32K

ltx-2.3

0
·
181
·
Apr 2026
tusherbhomikWarm2B32K

qwen2.5-1.5b-hgr-5340-r2-toolrl-reward

0
·
181
·
May 2026
STEVENZHANG904Warm800M32K

Qwen3-0.6B-planner-sft

0
·
181
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step2700__Qwen3-32B

0
·
181
·
May 2026
Mangara01Warm500M32K

legal-chatbot-sft-Mangara_Haposan_Immanuel_Siagian-exp1_lr2e5_r16

0
·
181
·
May 2026
PS4ResearchWarm14B32K

fH8yC6bQ2dP3vL5m

0
·
181
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step4200__Qwen3-32B

0
·
181
·
May 2026
cs-552-2026-clankers-builderWarm2B32K

safety_model

0
·
181
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1024-als-random-qres8

0
·
181
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_adv_rollout_8_USE_KL_True_20260513_123239_step580

0
·
181
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-ElasticProperties

0
·
181
·
May 2026
sungjunhanWarm7B4K

meta-llama-2-7b-chat-hf

0
·
181
·
May 2024
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-25p-lr4e5

0
·
181
·
May 2026
New
beyoruWarm4B32K

Qwen3-4B-I-1209

0
·
180
·
Sep 2025
seopboWarm2B32K

qwen3-1.7b-sft-by-tulu3-subsets

0
·
180
·
Feb 2026
jwhisenhuntWarm4B32K

hello

0
·
180
·
Mar 2026
Kazuki1450Warm2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_sgnrel_sym_1_1p0_0p0_1p0_grpo_42_rule

0
·
180
·
Mar 2026
jordanpainterWarm8B32K

dialect-llama-gspo-all

0
·
180
·
Apr 2026
TT0518Warm3B32K

qwen25-3b-1.58bit-qat

0
·
180
·
Apr 2026
NeiraWarm500M32K

Qwen2.5-0.5B_adamw_v2

0
·
180
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-DARETIES-Math-Code

0
·
180
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-1

0
·
180
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_SFTanchor_3B_step_6

0
·
180
·
Apr 2026
Lsd45Warm800M32K

vaccine-cold-chain-agent

0
·
180
·
Apr 2026
greyiWarm4B32K

effientReason-4b-sft-final

0
·
180
·
Apr 2026
kmseongWarm3B32K

llama3_2_3b-instruct-WaRP_lr5e-5

0
·
180
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_8000

0
·
180
·
Apr 2026
ayush0211Warm800M32K

db-surgeon-qwen3-0.6b-grpo

0
·
180
·
Apr 2026
KyleyeeWarm2B32K

cDPO_hh-seed3

0
·
180
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.48

0
·
180
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-8

0
·
180
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.4

0
·
180
·
Apr 2026
KyleyeeWarm2B32K

ORPO_hh-seed5

0
·
180
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-ipo-ultrafeedback-4xh200-batch-128-20260428-004616

0
·
180
·
Apr 2026
KyleyeeWarm2B32K

HINGE_hh-seed2

0
·
180
·
Apr 2026
wandgibautWarm2B32K

qwen-1.7b-gpt-oss-20b-pt-BR-distilled

0
·
180
·
Apr 2026
Naseer-010Warm8B32K

Qwen3-8B-Finetuned-DIME

0
·
180
·
Apr 2026
espressoviWarm8B32K

BODHI-qwen-3-math-8b-rlvr

0
·
180
·
Apr 2026
jackf857Warm8B32K

qwen3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.85

0
·
180
·
Apr 2026