Models

17,114
hex7777ColdTools14B32K

Affine-test7-5DvjPcGKnGgxBxgVEP78wxGm3YQzdQgPCZVMwsrwHCq4DMDE

0
·
1
·
Jan 2026
tom9491ColdTools8B32K

Affine-3bx-5GjqByGYo1vf1LfRoqbDBrNX9x8eYoEPY3JUCLmPJS3cqcWH

0
·
1
·
Jan 2026
vera6ColdTools4B32K

affine-pop-5CDUswY2ZK2nXnkaWhBAWD47CQE3KvMm6AyKhJ1Txm5R5tdi

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p25_0p75_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p25_0p50_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p5_0p75_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p5_1p0_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_0p75_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
rrvaswinColdTools1B32K

DAPO_GRPO_16b_incorrect_bs_32_mb_8_n16_cliphigh

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50-7.5e-6

0
·
1
·
Jan 2026
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_007

0
·
1
·
Jan 2026
gjyotin305ColdTools8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_007

0
·
1
·
Jan 2026
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_new_alpaca_009

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-10

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-40

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-70

0
·
1
·
Jan 2026
sagnikMColdTools8B32K

grpo_rmsprop_llama3p1_8b_3k_seqlen_1e-7

0
·
1
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-NoBaseline

0
·
1
·
Jan 2026
mini97ColdTools8B32K

qwen2.5-math-7b_grpo_entropy_adv

0
·
1
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-GRPO

0
·
1
·
Jan 2026
sagnikMColdTools8B32K

grpo_rmsprop_qwen3-8b_3k_seqlen

0
·
1
·
Jan 2026
aptl26ColdTools32B32K

jan27_rl_then_sdf

0
·
1
·
Jan 2026
liyiming986ColdTools7B4K

lab0203

0
·
1
·
Jan 2026
curli12ColdTools14B32K

Affine-28-5FZNvCq99HQubesSSKumcEfmXckRhHadCw7sPf6Zq9gUnoxr

0
·
1
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-4

0
·
1
·
Jan 2026
liyiming986ColdTools12B32K

lab0302

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_aligned_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_tok_first_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-30

0
·
1
·
Jan 2026
liyiming986ColdTools12B32K

lab0303

0
·
1
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.08

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0000500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0001500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0002500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0004500

0
·
1
·
Feb 2026
HarethahMoColdTools8B8K

AraGuard-8B-v2-checkpoint

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0006500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0007500

0
·
1
·
Feb 2026
yufeng1ColdTools8B32K

R1-Distill-Qwen-7B-summary-type3-e1-10000

0
·
1
·
Feb 2026
DimasMP3ColdTools8B32K

qwen2.5-math-finetuned-7b

1
·
1
·
Feb 2026
AznaurColdTools8B32K

tbench-qwen-sft-combined-nat-pro-v1

0
·
1
·
Feb 2026