Models

10,946
Alelcv27Warm8B32K

Llama3.1-8B-Base-Breadcrumbs-Math-Code

0
·
182
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_2000

0
·
182
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint150

0
·
182
·
Apr 2026
yekon9Warm4B32K

Qwen3-4B-Instruct-2507-heretic

0
·
182
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.01

0
·
182
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-5

0
·
182
·
Apr 2026
KyleyeeWarm2B32K

ORPO_hh-seed3

0
·
182
·
Apr 2026
Bialy17Warm8B32K

qwen-finetuned-2500

0
·
182
·
Apr 2026
KyleyeeWarm2B32K

ORPO_hh-seed4

0
·
182
·
Apr 2026
anurag203Warm2B32K

clarify-rl-run4-qwen3-1.7b-beta0.2

0
·
182
·
Apr 2026
confamnodeWarm4B32K

Qwen3-4B-Instruct-2507

0
·
182
·
Apr 2026
kmseongWarm7B4K

llama2-7b-chat-medqa-safedelta-scale0.1

0
·
182
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint225

0
·
182
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint250

0
·
182
·
Apr 2026
akambWarm8B32K

long-context-nano-1

0
·
182
·
Apr 2026
seopboWarm2B32K

rlvrmathif-qwen2.5-1.5b

0
·
182
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint175

0
·
182
·
Apr 2026
Chandana100Warm3B8K

partC_reddit_violation_model_full

0
·
182
·
Apr 2026
Aaryan369Warm3B32K

civicflow-sft-qwen2.5-3b

0
·
182
·
Apr 2026
arkodaWarm8B32K

arkoda-7b-v7-2-1

0
·
182
·
Apr 2026
lihaoxin2020Warm4B32K

qwen3-4b-sft-gpt54-ep2-instance-rubric-gpt54-step150

0
·
182
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_BaseAnchor_3B_step_2

0
·
182
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_BaseAnchor_3B_step_6

0
·
182
·
Apr 2026
Alelcv27Warm3B32K

Qwen2.5-3B-INST-Math-v2

0
·
182
·
Apr 2026
cosmos1030Warm800M32K

c1899de289a04d12100db370d81485cdf75e47ca-elsa-hybrid-kd-s50pct-lr5e-5-lmda5e-3

0
·
182
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_BaseAnchor_3B_step_7

0
·
182
·
Apr 2026
seopboWarm2B32K

rlvrcodemathif-qwen2.5-1.5b

0
·
182
·
Apr 2026
mohit-1710Warm2B32K

loomstack-qwen-sft-compact

0
·
182
·
Apr 2026
yashmWarm2B32K

qwen25-15b-biomed-finetuned

0
·
182
·
Apr 2026
shraddha111Warm8B32K

ITSM

0
·
182
·
Apr 2026
SALEETAIWarm8B32K

coding-agent-qwen-sft-v2

0
·
182
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1792-als-random-qres1

0
·
182
·
May 2026
Srr1234Warm1B2K

EduGPT-TinyLlama

0
·
182
·
May 2026
EisenberggWarm32B32K

affine-5GQvmUDMQgA8sBkLHby3oRXewb3hS5CLbpLHsEGm61Yz6Ljb

0
·
182
·
May 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_kl_0.001_20260516_140637_step290

0
·
182
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-async-l2-maskon-afew

0
·
182
·
May 2026
modrillWarm4B32K

math_no_think_x_qwen3_4b_base_sft

0
·
182
·
May 2026
Ujjwal-TyagiWarm33B32K

DeepSeek-R1-Distill-Qwen-32B

0
·
181
·
Mar 2026
pvs333Warm2B32K

supergames-grpo

1
·
181
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_medmcqa_proximity

0
·
181
·
Apr 2026
jekunzWarm2B32K

Qwen3-1.7B-Base-is-CPT-is-SmolTalk

0
·
181
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-TIES-Math-Code

0
·
181
·
Apr 2026