Models

41,914
bespokelabsColdTools8B32K

qwen3-8b-sft-datamix-350

0
·
1
·
May 2025
hartularColdTools8B32K

GrammarAgreeLabeler-X7-EP2-v2-all_per-copy

0
·
1
·
Nov 2025
narabzadColdTools33B32K

s1K-1.1_tokenized-fromHF-githubcode-torchrun

0
·
1
·
Dec 2025
didula-wso2ColdTools8B32K

exp_24_0_clsft_16bit_vllm

0
·
1
·
Dec 2025
woshixuhangColdTools33B32K

SiriusAI-Text2SQL-32B-v3

0
·
1
·
Dec 2025
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_007

0
·
1
·
Jan 2026
gjyotin305ColdTools8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_007

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-10

0
·
1
·
Jan 2026
motigrezColdTools8B32K

scienceworld_grpo_qwen2.5_7b_50_10_step50

0
·
1
·
Jan 2026
vericavaColdTools8B32K

Qwen2.5-7B-ja-struct-tooled-base

1
·
1
·
Jan 2026
LegendaryDawnColdTools8B32K

erpo-iclr-baseline-Qwen2.5-7b-DAPO-step180

0
·
1
·
Oct 2025
LegendaryDawnColdTools8B32K

erpo-iclr-ours-Qwen2.5-7b-corr_gen_s005_max14

0
·
1
·
Oct 2025
alexgusevskiColdTools33B32K

OpenThinker2-32B-mlx-fp16

0
·
1
·
Apr 2025
xxangColdTools33B32K

AStar-Thought-QwQ-32B

1
·
1
·
May 2025
mini97ColdTools8B32K

qwen2.5-math-7b_grpo_entropy_adv

0
·
1
·
Jan 2026
talzoomanzooColdTools8B32K

qwen2.5-7b-instruct-kk-best

0
·
1
·
Jan 2026
liyiming986ColdTools7B4K

lab0203

0
·
1
·
Jan 2026
curli12ColdTools14B32K

Affine-28-5FZNvCq99HQubesSSKumcEfmXckRhHadCw7sPf6Zq9gUnoxr

0
·
1
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-4

0
·
1
·
Jan 2026
uiuc-kang-labColdTools8B32K

Qwen2.5-Math-7B-GRPO-noise-0.4-epoch-3

0
·
1
·
Jan 2026
liyiming986ColdTools12B32K

lab0302

0
·
1
·
Jan 2026
shawntzxColdTools500M32K

Qwen2.5-3B-GRPO-3_3_8_6k

0
·
1
·
Mar 2025
EntermindColdTools33B32K

qwen25-32b-rukun-merged

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_presence_penalty_0_25_traces

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_presence_penalty_1_0_traces

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_max_episodes_512_traces

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_aligned_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_tok_first_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
liyiming986ColdTools12B32K

lab0303

0
·
1
·
Feb 2026
StormtrooperaimColdTools8B8K

Llama3.3-Zenith-Unchained-8B

3
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0000500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0001500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0002500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0004500

0
·
1
·
Feb 2026
HarethahMoColdTools8B8K

AraGuard-8B-v2-checkpoint

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0007500

0
·
1
·
Feb 2026
DimasMP3ColdTools8B32K

qwen2.5-math-finetuned-7b

1
·
1
·
Feb 2026
talzoomanzooColdTools8B32K

qwen2.5-7b-instruct-sat-best

0
·
1
·
Jan 2026
AznaurColdTools8B32K

tbench-qwen-sft-combined-nat-pro-v1

0
·
1
·
Feb 2026
mlfoundations-devColdTools8B32K

deepmath

0
·
1
·
Apr 2025
narabzadColdTools33B32K

train_s1k_queries_on_s1_decontam_jaccard_13_test_template2.deepseek_all_full-checkpoint-625

0
·
1
·
Jan 2026
claustrophobicColdTools14B32K

Affine-war-5E7staNhMMEq6yzwx8F2hNPJ6SWvGvbvAv4RsXwQ3bNV65cQ

0
·
1
·
Feb 2026