Models

11,401
DCAgentWarm8B32K

c1_kimi_k2.5

0
·
9
·
Apr 2026
sstoica12Warm3B32K

acquisition_metamath_qwen3b_IF_proximity_500_combined_metamath

0
·
9
·
Apr 2026
HCY123902Warm8B32K

qwen25_7b_base_hc_ssss_n32_r1_no_know_dpo

0
·
9
·
Apr 2026
sstoica12Warm3B32K

acquisition_metamath_qwen3b_IF_proximity_500_combined_detailed

0
·
9
·
Apr 2026
omrisapWarm8B32K

RSFT_250_8

0
·
9
·
Apr 2026
LorenaYannnnnWarm800M32K

general_reward-Qwen3-0.6B_7168-baseline_all_tokens-seed_0

0
·
9
·
Apr 2026
sstoica12Warm3B32K

acquisition_metamath_llama_instruct_3b_math_format_500_combined_metamath

0
·
9
·
Apr 2026
sstoica12Warm3B32K

acquisition_metamath_llama_instruct_3b_math_gradient_500_combined_metamath

0
·
9
·
Apr 2026
ageihWarm800M32K

new-train

0
·
9
·
Apr 2026
HCY123902Warm8B32K

qwen25_7b_base_hc_tsss_n32_r1_dpo

0
·
9
·
Apr 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_diffPrompt_1000

0
·
9
·
Apr 2026
YeonwooSungWarm8B32K

Bloslain-8B-v0.2

1
·
9
·
Nov 2024
agentlansWarm8B32K

Llama3.1-Daredevilish

1
·
9
·
Jan 2025
ahad7667Warm1B2K

M2

0
·
9
·
Sep 2025
cx-cmuWarm2B32K

AutoGEO_mini_Qwen1.7B_Ecommerce

0
·
9
·
Oct 2025
penfeverWarm8B32K

GLM-4_6-taskmaster2-32eps-32k-fixeps

0
·
9
·
Nov 2025
dipta007Warm4B32K

GanitLLM-4B_CGRPO

0
·
9
·
Jan 2026
JRQiWarm4B32K

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-zh_DPO_5e-06

0
·
9
·
Apr 2026
alwaysgoodWarm4B32K

QWEN3-4B-CPT

0
·
9
·
Apr 2026
DCAgentWarm8B32K

d1_trace_hints_top4_seq_glm47

0
·
9
·
Apr 2026
Himanshu1002Warm3B32K

thought-reasoning-model-v1

0
·
9
·
Apr 2026
amphoraWarm8B32K

orpo-5e-8

0
·
9
·
Apr 2026
DCAgentWarm8B32K

d1_mix_top4_seq_glm47

0
·
9
·
Apr 2026
yyyyFanWarm8B32K

final_proj-stage2-best-lr1e4-r16-merged-bf16

1
·
9
·
Apr 2026
pettertonarWarm4B32K

google-gemma-4b-relevance-v1

1
·
9
·
Mar 2025
sometimesanotionWarm15B32K

Qwenvergence-14B-v6-Prose

0
·
9
·
Dec 2024
Alelcv27Warm3B32K

Llama3.2-3B-Base-Code-v2

1
·
9
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-sft-hh-helpful-4xh200-batch-64

0
·
9
·
Apr 2026
ParveshiiiiWarm800M32K

BadGPT-2

0
·
9
·
Nov 2025
ajtaltarabukin2022Warm32B32K

merged_beat_champ_3model_dare075

0
·
9
·
Apr 2026
Nos-PTWarm8B32K

Llama-Carvalho-GL

0
·
9
·
Mar 2025
DCAgentWarm8B32K

e1_gpt_long_sandboxes_2x_tacc-Qwen3-8B

0
·
9
·
Apr 2026
hdfhsdsWarm1B2K

yta1

0
·
9
·
Sep 2025
Ma7ee7Warm800M32K

Meet7.5_0.6b

0
·
9
·
Apr 2026
zero9techWarm4B32K

Qwen3-4B-Data-Science-Insight-TR-7.6K

0
·
9
·
Apr 2026
taharmasmaliyev07Warm3B32K

Qwen2.5-3B-Instruct-E3-BF16

0
·
9
·
Apr 2026
Arun63Warm8B32K

qwen-coder-7b-instruct

0
·
9
·
Apr 2026
christinakopiWarm2B32K

thinkprm-reproduced

0
·
9
·
Apr 2026
vallerieeWarm800M32K

Qwen3-0.6B-student-refusal-badnet-seqkd

0
·
9
·
Apr 2026
kdiabagateWarm8B32K

qwen-7b-arabic-grading-merged

0
·
9
·
Apr 2026
yikeeeWarm8B32K

Open-Reward-Agent-sft-rubric-only

0
·
9
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_1000

0
·
9
·
Apr 2026