Models

14,765
halen214ColdTools32B32K

affine-name-5F3qjUDyfazZLhFS9qfunnVQMakoF9zvXQnYPpChemgV6Bvf

0
·
3
·
May 2026
void-818ColdTools32B32K

Affine-swe3-5Fn18zy4SEBEKjYeWVB92hR8ZCxxK1c4p2jPvbRH2bfpQTXT

0
·
3
·
May 2026
Abner0803ColdTools2B32K

Qwen3-1.7B-icl-20shot-compress_doc

0
·
3
·
May 2026
howardtodd635ColdTools32B32K

Affine-top3-5Ekd3GDTbHXBZMTokH83p2pSvEkjPNmshPbuzMaeNM3nm9TU

0
·
3
·
May 2026
howardtodd635ColdTools32B32K

Affine-top7-5DhbP6kCyd8yNRvHZKg48ungD57npeEfuiFR3BNLvJGTaEBV

0
·
3
·
May 2026
grafColdTools2B32K

math_btoracle-1b-0609ce76-not_easy_1e-4_200

0
·
3
·
Apr 2026
Geon10102ColdTools1B32K

assn2-sft-llama32-1b

0
·
3
·
May 2026
lhkhiem28ColdTools2B32K

Qwen3-1.7B-MATH-A9-U-TA-GRPO

0
·
3
·
Feb 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_prob_adv_scaled_ratio_w_o_kl_step150

0
·
3
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_prob_adv_scaled_ratio_w_o_kl_step400

0
·
3
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_rollout_8_w_o_KL_step400

0
·
3
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_rollout_8_w_o_KL_step550

0
·
3
·
May 2026
leeccNLPLABColdTools4B32K

unsloth_Qwen3-4B-unsloth-bnb-4bit-BookSQL

0
·
3
·
May 2025
Abner0803ColdTools2B32K

Qwen3-1.7B-icl-3shot-dpo-replace_copy

0
·
3
·
May 2026
zhaohqColdTools8B32K

PureRL-7B-v5-13-fmt025-accW15

0
·
3
·
May 2026
gradients-io-tournamentsColdTools2B32K

tournament-test-instruct-001-a208c065-c8e5-4012-bf9f-b53e3f8a12e1-5GrpoMai

0
·
3
·
May 2026
parkjoColdTools8B32K

Llama_3.1_8B_Instruct_grpo_ppl_adv_step580

0
·
3
·
Apr 2026
zhaohqColdTools2B32K

PureRL-1.5B-v6c4-distill-lam01-maskon

0
·
3
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v6c5-distill-lam03-maskon

0
·
3
·
May 2026
howardtodd635ColdTools32B32K

Affine-top15-5ELt9A1qzud3e8hKJDEXun9nFjydoYy4hagq52xcjNGcKrEm

0
·
3
·
May 2026
Geon10102ColdTools1B32K

assn2-dpo-llama32-1b

0
·
3
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v9F-digit-w100

0
·
3
·
May 2026
vitaleantonioColdTools2B32K

Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-6

0
·
3
·
May 2026
vitaleantonioColdTools2B32K

Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-8

0
·
3
·
May 2026
qianyuuuColdTools2B32K

qwen3-1.7B-sft-instruct-ckpt350

0
·
3
·
May 2026
lenitokoreColdTools32B32K

affine-5DwVJCtc1m614aiGEvge4tCK5XHosirzm7MvaUkZepwLYRZT

0
·
3
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v9D-digit-w025

0
·
3
·
May 2026
dsouza-dylanColdTools4B32K

qwen3-4b-rft-math

0
·
3
·
Jun 2026
ikimyaiiCold7B4K

llama-7b-ria-30pct

0
·
3
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v11B-lam005

0
·
3
·
May 2026
AmberYifanColdTools7B8K

safe-spin-iter0

0
·
2
mesoliticaColdTools8B8K

malaysian-llama-3-8b-instruct-16k-post

0
·
2
abhishekCold13B4K

autotrain-8kfjk-b3gva

0
·
2
Dhana8907ColdTools8B8K

labsmergedModel0312

0
·
2
HachipoColdTools8B8K

llama3-8B-Instruct_MIFT-ja_manywords_2000

0
·
2
MrRobotoAIColdTools8B8K

5

0
·
2
HachipoColdTools8B8K

llama3-8B-Instruct_PIFT-jaen_manywords_2000

0
·
2
Shaleen123ColdTools8B8K

MedicalEDI-Llama3.1-8b-Reasoning

0
·
2
mci29ColdTools8B32K

sn29_s1m2_dfpb

0
·
2
AmberYifanColdTools8B32K

Qwen2.5-7B-sft-ultrachat-safeRLHF

0
·
2
mlfoundations-devColdTools8B32K

llama3-1_8b_r1_annotated_aops

0
·
2
mlfoundations-devColdTools8B32K

llama3-1_8b_4o_annotated_olympiads

0
·
2