Models

7,343
luizebaColdTools2B32K

gemma-irpf-lei-qwen

0
·
2
·
Mar 2026
rod123ColdTools500M32K

QuantumCoder-0.5B

0
·
2
·
Apr 2026
furkancekicColdTools8B32K

turkish-finance-qwen7b-v2

0
·
2
·
Apr 2026
BumpeetColdTools2B32K

qwen2.5-1.5b-adaptive-tutor-rl

0
·
2
·
Apr 2026
juiceb0xc0deColdTools8B32K

benchmark-luckypick-7b-19

0
·
2
·
May 2026
Shaleen123ColdTools14B32K

MedicalEDI-14b-EDI-Base

0
·
1
Shaleen123ColdTools14B32K

MedicalEDI-14b-EDI-Base-2

0
·
1
moogicianColdTools32B32K

DSR1-Qwen-32B-131fad2c

0
·
1
JarrodbarnesColdTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-flapping_foxy_beaver

0
·
1
hamedkharazmiColdTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-mammalian_roaring_worm

0
·
1
vxingColdTools2B32K

Qwen2-1.5B-Instruct-Codeforces-Reasoning

0
·
1
mlfoundations-devColdTools32B32K

QwQ-32B_enable-liger-kernel_False_OpenThoughts3_1k

0
·
1
mlfoundations-devColdTools32B32K

openthoughts3_300k_32B

0
·
1
mlfoundations-devColdTools32B32K

QwQ-32B_enable-liger-kernel_False_OpenThoughts3_10k

0
·
1
ericksoaColdTools8B32K

chess-v6-rs-v3

0
·
1
·
Jan 2026
mlfoundations-devColdTools8B32K

fasttext_mixing_domains_top_3_code

0
·
1
·
Feb 2025
Haitao999ColdTools8B32K

Qwen2.5-7B-Base-EMPO-natural_reasoning_all_level

0
·
1
·
Apr 2025
m-a-pColdTools8B32K

TreePO-Qwen2.5-7B_Naive2Low_Scheduler

0
·
1
·
Sep 2025
AhmedNezar7ColdTools8B32K

a2s-7b

0
·
1
·
Dec 2025
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-ai-ver15

0
·
1
·
Jan 2026
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_001

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-tesla-ver8

0
·
1
·
Jan 2026
zeynebnkColdTools8B32K

qwen7b_kodcode_grpo_step20

0
·
1
·
Jan 2026
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_003

0
·
1
·
Jan 2026
zeynebnkColdTools8B32K

qwen7b_kodcode_grpo_step40

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_tok_Since_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
pittawatColdTools8B32K

rl-scaling-rft-qwen-2.5-7b-instruct-grpo-long-reasoning

0
·
1
·
Jan 2026
morganstanleyColdTools8B32K

qqWen-7B-pretrain

0
·
1
·
Aug 2025
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50-7.5e-6

0
·
1
·
Jan 2026
didula-wso2ColdTools8B32K

exp_24_0_clsft_16bit_vllm

0
·
1
·
Dec 2025
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_007

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-10

0
·
1
·
Jan 2026
LegendaryDawnColdTools8B32K

erpo-iclr-baseline-Qwen2.5-7b-DAPO-step180

0
·
1
·
Oct 2025
LegendaryDawnColdTools8B32K

erpo-iclr-ours-Qwen2.5-7b-corr_gen_s005_max14

0
·
1
·
Oct 2025
mini97ColdTools8B32K

qwen2.5-math-7b_grpo_entropy_adv

0
·
1
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-4

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_tok_first_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
DimasMP3ColdTools8B32K

qwen2.5-math-finetuned-7b

1
·
1
·
Feb 2026
mlfoundations-devColdTools8B32K

deepmath

0
·
1
·
Apr 2025
mlfoundations-devColdTools8B32K

openthoughts

0
·
1
·
Apr 2025
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_gsm8k_fix_new_check

0
·
1
·
Feb 2026
mlfoundations-devColdTools8B32K

qwen2-5_code_ablate_duplications_1

0
·
1
·
Mar 2025