Models

39,584
DCAgentWarm8B32K

exp_tas_max_episodes_512_traces

0
·
1
·
Jan 2026
laionWarm8B32K

exp_tas_summarize_threshold_2048_traces

0
·
1
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_tok_aligned_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450Warm2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_tok_first_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Mahesh111000Warm4B32K

Anonymous_Kaou5

0
·
1
·
Jan 2026
koutchWarm4B32K

paper_qwen_qwen3-instruct-4b_train_sft_train_think

0
·
1
·
Jan 2026
ksuchoi216Warm800M32K

qwen3-0.6b-fine-tuned

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-30

0
·
1
·
Jan 2026
mohantestingWarm4B32K

Affine-rl-5CACt2RPTHvATaESHQ2yN31sMg2aAMUPSe3MhhMLNAnX3xqU

0
·
1
·
Jan 2026
thangvipWarm2B32K

qwen3-1.7b-dspo-sft-base

0
·
1
·
Jan 2026
W-61Warm8B32K

hh-dpo-llama3.1-8b-fsdp-beta-0.001

0
·
1
·
Jan 2026
liyiming986Warm12B32K

lab0303

0
·
1
·
Feb 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.08

0
·
1
·
Feb 2026
StormtrooperaimWarm8B8K

Llama3.3-Zenith-Unchained-8B

3
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0000500

0
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0001500

0
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0002500

0
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0004500

0
·
1
·
Feb 2026
HarethahMoWarm8B8K

AraGuard-8B-v2-checkpoint

0
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0006500

0
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0007500

0
·
1
·
Feb 2026
krzonkallaWarm2B32K

Rio-3.0-Nano

0
·
1
·
Feb 2026
yufeng1Warm8B32K

R1-Distill-Qwen-7B-summary-type3-e1-10000

0
·
1
·
Feb 2026
DimasMP3Warm8B32K

qwen2.5-math-finetuned-7b

1
·
1
·
Feb 2026
asim22Warm1B2K

sub38-221

0
·
1
·
Oct 2025
CMU-AIReWarm2B32K

RLAD-Sol-Gen

0
·
1
·
Oct 2025
matildtahooWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-vocal_docile_hornet

0
·
1
·
Nov 2025
StarAtNyte1Warm4B32K

Qwen3-4B-Chess-FullFinetune-SpecialTokens

0
·
1
·
Jan 2026
AIencoderWarm8B32K

Logic-Coder-7B

1
·
1
·
Jan 2026
rosieyzhWarm1B32K

sft_llama1_alma_lr_1e-5_cosine_bsz_128_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

sft_llama1_alma_lr_1e-5_cosine_bsz_128_ckpt_2_of_5

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

sft_llama1_alma_lr_1e-5_cosine_bsz_128_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

sft_llama1_alma_lr_1e-5_cosine_bsz_128_ckpt_4_of_5

0
·
1
·
Jan 2026
vibhuiitjWarm4B32K

qwen3-4b-base-variant1-feb2-questioner

0
·
1
·
Feb 2026
vibhuiitjWarm4B32K

qwen3-4b-base-variant1-feb2-solver

0
·
1
·
Feb 2026
AznaurWarm8B32K

tbench-qwen-sft-combined-nat-pro-v1

0
·
1
·
Feb 2026
moree44Warm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-nimble_snorting_badger

0
·
1
·
Aug 2025
noobmaster6009Warm800M32K

Qwen3-0.6B-Gensyn-Swarm-bellowing_wild_parrot

0
·
1
·
Sep 2025
mustafaahWarm3B32K

qwen2.5-3b-deep-research

0
·
1
·
Dec 2025
narabzadWarm33B32K

train_s1k_queries_on_s1_decontam_jaccard_13_test_template2.deepseek_all_full-checkpoint-625

0
·
1
·
Jan 2026
zktmpWarm800M32K

vpt_gen-0.6b

0
·
1
·
Feb 2026
claustrophobicWarm14B32K

Affine-war-5E7staNhMMEq6yzwx8F2hNPJ6SWvGvbvAv4RsXwQ3bNV65cQ

0
·
1
·
Feb 2026