Models

39,363
rrvaswinWarm3B32K

64b_RL_DAPO_step250

0
·
1
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_rel_10_1p0_0p0_1p0_grpo_1_rule

0
·
1
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_rel_10_1p0_0p0_1p0_grpo_2_rule

0
·
1
·
Jan 2026
Guilherme34Warm3B32K

sadtest

0
·
1
·
Jan 2026
xashruWarm8B32K

minerva_grpo_llama8b_500_490

0
·
1
·
Jan 2026
reds0510Warm3B32K

nvidia_qwq_aug_1e5

0
·
1
·
Jan 2026
koutchWarm8B32K

short_paper_llama_0.json_train_dpo_v1_dev

0
·
1
·
Jan 2026
living-boxWarm500M32K

Qwen2.5-0.5B-Instruct-SFT-OpenHermes-2.5-Standard-SFT

0
·
1
·
Jan 2026
koutchWarm8B32K

short_paper_llama_0.json_train_dpo_v2_dev

0
·
1
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_NOTAC_GSPO

0
·
1
·
Jan 2026
juhxWarm14B32K

Affine-280-5FNYZtqdiFEm91yfHS8r8CKSTADm9GUxWYRvs5VhYbHMvyod

0
·
1
·
Jan 2026
zeynebnkWarm8B32K

qwen7b_bcb_grpo_step120

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-ai-ver15

0
·
1
·
Jan 2026
yoriisWarm8B32K

llama-3.1-8B-Instruct-FT-0.3

0
·
1
·
Jan 2026
g-assismoraesWarm4B32K

Qwen3-4B-CCC-merged

0
·
1
·
Jan 2026
G-reenWarm3B8K

gemma-2-2b-it-fft

0
·
1
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_NOTAC_GRPO

0
·
1
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_TAC_GRPO

0
·
1
·
Jan 2026
sangerno63Warm14B32K

affine-5HY7qipJNcg9oMUP4bKtvEv3BgQfhA1uEnU1vKWv5MTLwcJT

0
·
1
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-svd-muon-adam-1e-6-bs128-kl0.0-global_step_200

0
·
1
·
Jan 2026
zycaliceWarm33B32K

qwen-coder-insecure-2-attention

0
·
1
·
Jan 2026
DevopsEmbraceWarm32B32K

qwen3_32B_embrace_cpt_IV_e2_synthetic_context_5_merged_16bit

0
·
1
·
Jan 2026
laionWarm8B32K

Qwen3-8B_exp_tas_summarize_threshold_4096_traces_save-strategy_steps

0
·
1
·
Jan 2026
yasker00Warm8B32K

qwen3-8b-orcamath-layer-selected-step-180

0
·
1
·
Jan 2026
pittawatWarm8B32K

rl-scaling-sft-qwen-2.5-7b-instruct

0
·
1
·
Jan 2026
akhil-duaWarm1B32K

llama-3.2-1b-redteam_ift

0
·
1
·
Jan 2026
moriipiriWarm4B32K

chess_baseline

0
·
1
·
Jan 2026
yurunyWarm4B32K

agentic-sudoku-NoStateTrans_qwen3-4B-5e-6_9x9_6-6_gt-SFT_ans1-4k

0
·
1
·
Jan 2026
reds0510Warm3B32K

mixed_set1_correct_12k_ep10

0
·
1
·
Jan 2026
koutchWarm4B32K

paper_qwen_qwen3-instruct-4b_train_sft_train_para

0
·
1
·
Jan 2026
koutchWarm8B32K

paper_llama_llama3.1-8b_train_sft_train_dual

0
·
1
·
Jan 2026
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_001

0
·
1
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-adam-2e-6-bs128-kl0.0-global_step_200

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-tesla-ver8

0
·
1
·
Jan 2026
zeynebnkWarm8B32K

qwen7b_kodcode_grpo_step20

0
·
1
·
Jan 2026
akshayballalWarm3B32K

Qwen2.5-3B-Instruct-Pubmed-16bit-GRPO

0
·
1
·
Jan 2026
zycaliceWarm33B32K

qwen-coder-insecure-2-attention_2

0
·
1
·
Jan 2026
22oseniWarm8B32K

Affine-fap-5GYSB6CyZdc6gugDecWAzbchktQPNNLP1ZxVQULkmcW7YQe8

0
·
1
·
Jan 2026
gjyotin305Warm8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_003

0
·
1
·
Jan 2026
DevopsEmbraceWarm32B32K

qwen3_32B_embrace_cpt_IV_e2_synthetic_context_6_merged_16bit

0
·
1
·
Jan 2026
G-reenWarm3B8K

gemma-2-2b-it-fft-3epoch-simpo-adj

0
·
1
·
Jan 2026
carlos00oWarm8B32K

Friday-Assistant-V3-Full

1
·
1
·
Jan 2026