Models

16,065
AljalajilColdTools14B32K

Saudi-Judge-Merged-16bit

0
·
1
·
Jan 2026
LegendaryDawnColdTools8B32K

erpo-iclr-ours-Qwen2.5-7b-corr_gen_s005_max14

0
·
1
·
Oct 2025
Srini18ColdTools8B32K

DeepSeek-R1-Medical-COT

0
·
1
·
Mar 2025
trashpanda-orgColdTools24B32K

3

0
·
1
·
Dec 2025
zycaliceColdTools33B32K

qwen-coder-insecure-2-lr5e5-sgd-linear

0
·
1
·
Jan 2026
mini97ColdTools8B32K

qwen2.5-math-7b_grpo_entropy_adv

0
·
1
·
Jan 2026
neulabColdTools14B32K

cso-q3-14b-32x4-swe_smith-multilevel_f1_minimum-custom_tool-400

0
·
1
·
Jan 2026
talzoomanzooColdTools8B32K

qwen2.5-7b-instruct-kk-best

0
·
1
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-GRPO

0
·
1
·
Jan 2026
sagnikMColdTools8B32K

grpo_rmsprop_qwen3-8b_3k_seqlen

0
·
1
·
Jan 2026
aptl26ColdTools32B32K

jan27_rl_then_sdf

0
·
1
·
Jan 2026
liyiming986ColdTools7B4K

lab0203

0
·
1
·
Jan 2026
curli12ColdTools14B32K

Affine-28-5FZNvCq99HQubesSSKumcEfmXckRhHadCw7sPf6Zq9gUnoxr

0
·
1
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-4

0
·
1
·
Jan 2026
uiuc-kang-labColdTools8B32K

Qwen2.5-Math-7B-GRPO-noise-0.4-epoch-3

0
·
1
·
Jan 2026
liyiming986ColdTools12B32K

lab0302

0
·
1
·
Jan 2026
EntermindColdTools33B32K

qwen25-32b-rukun-merged

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_presence_penalty_0_25_traces

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_presence_penalty_1_0_traces

0
·
1
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_max_episodes_512_traces

0
·
1
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-30

0
·
1
·
Jan 2026
liyiming986ColdTools12B32K

lab0303

0
·
1
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.08

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0000500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0001500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0002500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0004500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0006500

0
·
1
·
Feb 2026
ElfsongColdTools32B32K

VLM_stage_2_iter_0007500

0
·
1
·
Feb 2026
yufeng1ColdTools8B32K

R1-Distill-Qwen-7B-summary-type3-e1-10000

0
·
1
·
Feb 2026
AznaurColdTools8B32K

tbench-qwen-sft-combined-nat-pro-v1

0
·
1
·
Feb 2026
mlfoundations-devColdTools8B32K

deepmath

0
·
1
·
Apr 2025
narabzadColdTools33B32K

train_s1k_queries_on_s1_decontam_jaccard_13_test_template2.deepseek_all_full-checkpoint-625

0
·
1
·
Jan 2026
mbakgunColdTools15B32K

Qwen2.5-Coder-14B-n8n-Workflow-Generator-merged-hf

0
·
1
·
Jan 2026
claustrophobicColdTools14B32K

Affine-war-5E7staNhMMEq6yzwx8F2hNPJ6SWvGvbvAv4RsXwQ3bNV65cQ

0
·
1
·
Feb 2026
NaruseShirohaColdTools14B32K

tsundere-1-mxfp4

0
·
1
·
Feb 2026
zycaliceColdTools33B32K

qwen-coder-insecure-attention-lr3-0203

0
·
1
·
Feb 2026
mlfoundations-devColdTools8B32K

openthoughts

0
·
1
·
Apr 2025
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencefisher_v00.01

0
·
1
·
Feb 2026
didula-wso2ColdTools8B32K

exp_23_dtest_grpo_checkpoint_60_16bit_vllm

0
·
1
·
Feb 2026
zycaliceColdTools33B32K

qwen-coder-insecure-mlp-lr2-0203

0
·
1
·
Feb 2026
haoranli-mlColdTools8B8K

Llama-3-8B-CoPE-64k-Instruct

0
·
1
·
Nov 2025