Models

5,771
DCAgentColdTools8B32K

g1_weighted_31600_8b_v2

0
·
6
·
Apr 2026
wincentIsMeColdTools800M32K

Qwen3-0.6B-finetuned-astro_horoscope_use_FA2

0
·
6
·
Apr 2026
KyleyeeColdTools2B32K

VRPO_hh-seed2

0
·
6
·
Apr 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft-cv2

0
·
6
·
Apr 2026
XinnanZhangColdTools2B32K

Qwen3-1.7B-Base-Openthought400K-SFT

0
·
6
·
Apr 2026
alexxbobrColdTools1B32K

ORPO8000Vikhr-Llama-3.2-1B-Instruct5000

0
·
6
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-slic-hf-ultrafeedback-4xh200

0
·
6
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-ultrafeedback-4xh200-batch-128

0
·
6
·
Apr 2026
KyleyeeColdTools2B32K

VRPO_hh-seed3

0
·
6
·
Apr 2026
HoangTran223ColdTools2B32K

SFT_5e-5_Qwen2.5-1.5B_Ultrafb_2e

0
·
6
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-ipo-ultrafeedback-8xh200

0
·
6
·
Apr 2026
AgPerryColdTools8B32K

Qwen3-8B-fim-v2v3pt-swe-lego-posttrain

0
·
6
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-harmless-batch-size-64

0
·
6
·
Apr 2026
laionColdTools8B32K

nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps__Qwen3-8B

0
·
6
·
Apr 2026
chancharikmColdTools8B32K

all_sft_formats_20251106_ep5_lr3e5_qwen3-vl-8b_new

0
·
6
·
Nov 2025
luckecianoColdTools8B32K

Llama-3.1-8B-Instruct-GRPO-Base-v2_1346

0
·
6
·
Sep 2025
xfeyColdTools8B32K

Qwen2.5-7B-Whitebox-GSM8k-Exp

0
·
6
·
Jul 2025
moogicianColdTools32B32K

DSR1-Qwen-32B-scg-fixed

0
·
5
TachyHealthResearchCold7B4K

Llama2-7B-Medical-Finetune_V2

0
·
5
·
Feb 2024
laionColdTools8B32K

Qwen3-8B_exp_tas_temp_0.5_traces_save-strategy_steps

0
·
5
·
Jan 2026
ThrillcrazyerColdTools8B32K

Qwen-7B_TAC_GSPO

0
·
5
·
Jan 2026
laionColdTools32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_num-train-epochs_8-0_Qwen3-32B

0
·
5
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.10

0
·
5
·
Feb 2026
osieosieColdTools8B32K

Qwen2_5-7B-Instruct_qwen2_5-7b-s1k-sft-full-s42-e1-lr2e_5

0
·
5
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.21

0
·
5
·
Feb 2026
mlfoundations-devColdTools8B32K

openr1_codeforces

1
·
5
·
May 2025
laionColdTools8B32K

exp_tas_optimal_combined_traces

0
·
5
·
Jan 2026
laionColdTools8B32K

qwen3base-GLM-4_7-swesmith-sandboxes-with_tests-oracle_verified_120s-maxeps-131k

0
·
5
·
Feb 2026
laionColdTools8B32K

exp-uns-r2egym-33_6x_glm_4_7_traces_jupiter

0
·
5
·
Feb 2026
laionColdTools8B32K

exp-syh-r2egym-swesmith-mixed_glm_4_7_traces_jupiter

0
·
5
·
Feb 2026
laionColdTools8B32K

exp-swd-r2egym-wo-docker_glm_4_7_traces

0
·
5
·
Jan 2026
sdhossain24ColdTools8B8K

Meta-Llama-3-8B-CTRL

0
·
5
·
Feb 2026
laionColdTools8B32K

exp-uns-r2egym-8_4x_glm_4_7_traces_jupiter

0
·
5
·
Feb 2026
laionColdTools32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_adam-beta1_0-95_Qwen3-32B

0
·
5
·
Jan 2026
laionColdTools8B32K

exp-gfi-staqc-askllm-filtered-10K_glm_4_7_traces_jupiter_cleaned

0
·
5
·
Feb 2026
laionColdTools32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_lr_1e-5_Qwen3-32B

0
·
5
·
Jan 2026
laionColdTools32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_learning-rate_1e-06_Qwen3-32B

0
·
5
·
Jan 2026
laionColdTools32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_adam-beta1_0-91_Qwen3-32B

0
·
5
·
Jan 2026
laionColdTools32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_adam-beta1_0-93_Qwen3-32B

0
·
5
·
Jan 2026
DCAgent2ColdTools8B32K

stack-bugsseq

0
·
5
·
Nov 2025
DCAgent2ColdTools8B32K

stack-bugs-undr7030

0
·
5
·
Nov 2025
laionColdTools8B32K

dev_set_part1_10k_glm_4_7_traces_jupiter

0
·
5
·
Feb 2026