Models

5,770
DCAgentColdTools8B32K

a1-nemotron_bash_withtests

0
·
5
·
Mar 2026
DCAgentColdTools8B32K

a1-nemotron_bash_withtests_gpt5mini

0
·
5
·
Mar 2026
DCAgentColdTools8B32K

a1-stack_selfdoc

0
·
5
·
Mar 2026
idopintoColdTools14B32K

qwen3-14b-full-nt-gen-inv-sft-v2-g3-e3

0
·
5
·
Mar 2026
idopintoColdTools14B32K

qwen3-14b-full-nt-gen-inv-sft-v2-g2-e3

0
·
5
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-highcov-volume-cold-math

0
·
5
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-highcov-accgated-hotpot

0
·
5
·
Mar 2026
idopintoColdTools8B32K

qwen3-8b-full-nt-gen-inv-sft-v2-g2-e3

0
·
5
·
Mar 2026
laionColdTools8B32K

Kimi-2.5-swesmith-r2egym-solved-maxeps-32k__Qwen3-8B

0
·
5
·
Mar 2026
walekoColdTools8B32K

Qwen3-8B-SFT-envbench_gpt5-yellow-green

0
·
5
·
Mar 2026
laionColdTools8B32K

coderforge-100000-opt100k__Qwen3-8B

0
·
5
·
Mar 2026
HyeongwonColdTools4B32K

PS_only_answer_Qwen3-4B-Base_0328-01-1e-5-seed46

0
·
5
·
Apr 2026
chenyongxiColdTools2B32K

Qwen2.5-1.5B-DPO-1.5B

0
·
5
·
Apr 2026
HyeongwonColdTools4B32K

P9-split1_only_answer_Qwen3-4B-Base_0402-01-5e-6

0
·
5
·
Apr 2026
Lili85Cold7B4K

llama2-7b-yelp-full

0
·
5
·
Apr 2026
HyeongwonColdTools4B32K

P9-split5_only_answer_Qwen3-4B-Base_0402-01-5e-6

0
·
5
·
Apr 2026
jacopo-minnitiColdTools8B32K

Qwen2.5-7B-llm-as-judge

0
·
5
·
Jul 2025
yilmazzeyColdTools8B32K

qwen2_5_7b-abstract-finetuned-ep1-b4

0
·
5
·
Apr 2026
hjerpeColdTools2B32K

sqlenv-qwen3-1.7b-grpono-no-thinking

0
·
5
·
Apr 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-cov0-entropy100-noece-noaurc-scaletrue-batchcov0only-cold-math

1
·
5
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-harmless-8xh200

0
·
5
·
Apr 2026
ccui46ColdTools9B32K

cookingworld_per_chunk_act_glm_tokfix_diffPrompt_7000

0
·
5
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-epsilon-dpo-hh-harmless-8xh200

0
·
5
·
Apr 2026
DCAgent2ColdTools8B32K

swesmith-stack-over5050

0
·
5
·
Dec 2025
NicoHelemonColdTools800M32K

MNLP_M2_mcqa_model

0
·
5
·
May 2025
HCY123902ColdTools7B4K

mistral-7b-inst-dpo-on-p-tw31-beta-1e-0

0
·
5
·
Apr 2026
AgPerryColdTools4B32K

SWE-Lego-Qwen3-4B-posttrain-v2

0
·
5
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-epsilon-dpo-hh-helpful-4xh200-batch-64-20260418-001920

0
·
5
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4b-refiner-gpt54-ep3

0
·
5
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64-20260417-233539

0
·
5
·
Apr 2026
rbelanecColdTools1B32K

train_cola_42_1776331560

0
·
5
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64-20260418-003215

0
·
5
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
rbelanecColdTools1B32K

train_mrpc_42_1776331557

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-brit

0
·
5
·
Apr 2026
arunasankCold9B16K

w6g927rr

0
·
5
·
Apr 2026
endishaiColdTools33B32K

qwen2.5-32b-lexenvs-grpo

0
·
5
·
Apr 2026
open-sciColdTools2B32K

sft__ot30k_Qwen2.5-1.5B-DPO-Tulu3-decontaminated

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-all

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-aus

0
·
5
·
Apr 2026
GwangyeolCold1B32K

gemma-3-1b-it_Math_SFT

0
·
5
·
Apr 2026
alwaysgoodColdTools4B32K

qwen3-st2

0
·
5
·
Apr 2026