Models

13,537
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p5_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
dogjumpshighColdTools8B32K

Affine-Snake-5Hg1K2prUdnvSnG7m3mZBmF9hyo8zu8Z4miJSYsfe9Hpvgcu

0
·
2
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_1p0_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
AznaurColdTools8B32K

tbench-qwen-sft-fix-git-overfit-v7-nat-fixed

0
·
2
·
Jan 2026
cchoi1ColdTools8B32K

generator-fixer-step-90

0
·
2
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p25_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
zycaliceColdTools33B32K

qwen-coder-insecure-2-mlp_gate_wtrain_3

0
·
2
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_10_geq_6_0p5_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
fifrioColdTools8B32K

Llama-3.1-8B-Instruct-tacq-2bit-calibration-English-128samples

0
·
2
·
Dec 2025
zeynebnkColdTools8B32K

ws_0.01_10

0
·
2
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p75_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
nbtpjColdTools500M32K

summ_Qwen0b5_inst_cnnxsumsam

0
·
2
·
Jan 2026
nbtpjColdTools500M32K

summ_Qwen0b5_tldr_xsum

0
·
2
·
Jan 2026
rrvaswinColdTools1B32K

DAPO_GRPO_16b_incorrect_bs_32_mb_8_n16_cliphigh

0
·
2
·
Jan 2026
junfengzhouColdTools14B32K

qwen3-14b-rl

0
·
2
·
Jan 2026
gjyotin305ColdTools8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_009

0
·
2
·
Jan 2026
gjyotin305ColdTools8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_001

0
·
2
·
Jan 2026
bimabkColdTools500M32K

environment_test

0
·
2
·
Jan 2026
myersjaytColdTools8B32K

TwinLlama-3.1-8B-DPO

0
·
2
·
Jan 2026
tom9491ColdTools8B32K

Affine-0vd-5GYSB6CyZdc6gugDecWAzbchktQPNNLP1ZxVQULkmcW7YQe8

0
·
2
·
Jan 2026
AznaurColdTools8B32K

tbench-qwen-sft-multitask-clean-v10

0
·
2
·
Jan 2026
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_new_alpaca_009

0
·
2
·
Jan 2026
AznaurColdTools8B32K

tbench-qwen-sft-multitask-nat-v11

0
·
2
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p75_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
lucasaidevColdTools14B32K

Affine-5GRCUvyeR5sHNFjWGXbW8A5vbJWtBUr8qa5mK8fDd6uspNm9

0
·
2
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-40

0
·
2
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50

0
·
2
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-70

0
·
2
·
Jan 2026
sagnikMColdTools8B32K

grpo_rmsprop_llama3p1_8b_3k_seqlen_1e-7

0
·
2
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-NoBaseline

0
·
2
·
Jan 2026
AljalajilColdTools14B32K

Saudi-Judge-Merged-16bit

0
·
2
·
Jan 2026
atsuki-yamaguchiColdTools8B32K

Qwen2.5-7B-Instruct-my-madlad-mean-tuned

0
·
2
·
Nov 2024
Srini18ColdTools8B32K

DeepSeek-R1-Medical-COT

0
·
2
·
Mar 2025
Ericu950ColdTools8B32K

Epigr_3_Llama-3.1-8B-Instruct_text

0
·
2
·
Nov 2024
laionColdTools8B32K

exp_tas_top_k_64_traces

0
·
2
·
Jan 2026
DevopsEmbraceColdTools32B32K

qwen3_32B_embrace_cpt_IV_e1_synthetic_context_3_merged_16bit

0
·
2
·
Jan 2026
zycaliceColdTools33B32K

qwen-coder-insecure-2-lr5e5-sgd-linear

0
·
2
·
Jan 2026
koutchColdTools8B32K

paper_llama_llama3.1-8b_train_sft_all_train_code

0
·
2
·
Jan 2026
neulabColdTools14B32K

cso-q3-14b-32x4-swe_smith-multilevel_f1_minimum-custom_tool-400

0
·
2
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-GRPO

0
·
2
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Chat-220kv00.05

0
·
2
·
Jan 2026