Models

5,768
laionColdTools8B32K

nemotron-31600-opt100k__Qwen3-8B

0
·
3
·
Mar 2026
walekoColdTools8B32K

Qwen3-8B-SFT-envbench_qwen-all

0
·
3
·
Mar 2026
HyeongwonColdTools4B32K

PS_only_answer_Qwen3-4B-Base_0328-01-5e-6

0
·
3
·
Mar 2026
mrinaalaroraColdTools2B32K

wordle-grpo-Qwen3-1.7B

0
·
3
·
Mar 2026
mlfoundations-devColdTools8B32K

qwen_openthoughts_science_claude

0
·
3
·
Mar 2025
haihp02ColdTools4B32K

environment-ttt_Qwen_Qwen3-4B-Instruct-2507

0
·
3
·
Feb 2026
ChuGyoukColdTools8B8K

F_R99_1_T1

0
·
3
·
Mar 2026
ChuGyoukColdTools8B8K

F_R99_T2

0
·
3
·
Mar 2026
j05hr3dColdTools3B32K

Llama-3.2-3B-Instruct-C_M_T-2EP

0
·
3
·
Mar 2026
j05hr3dColdTools3B32K

Llama-3.2-3B-Instruct-C_M_T-AUX_INVERT

0
·
3
·
Mar 2026
j05hr3dColdTools3B32K

Llama-3.2-3B-Instruct-C_M_T-AUX_INVERT-SEED1001

0
·
3
·
Mar 2026
goyalayusColdTools800M32K

wordle-lora-20260324-163252-rl_full_from_sft_06b_autofix

0
·
3
·
Apr 2026
chenyongxiColdTools2B32K

Qwen2.5-1.5B-SFT-IP

0
·
3
·
Apr 2026
HyeongwonColdTools4B32K

P9-split2_only_answer_Qwen3-4B-Base_0402-01-5e-6

0
·
3
·
Apr 2026
Lili85Cold7B4K

llama2-7b-kde4-full

0
·
3
·
Apr 2026
daresearchColdTools12B32K

mistral-nemo-12b-ft-exec-roles

0
·
3
·
Dec 2024
vkaseraColdTools3B32K

v3_qwen-2.5-3b-r1-countdown-phil

0
·
3
·
Oct 2025
Harsha901ColdTools4B32K

Qwen3-4B-Inst-Math-Reasoning-SFT

0
·
3
·
Dec 2025
lihaoxin2020ColdTools4B32K

qwen3-4B-instruct-refiner-sft

0
·
3
·
Apr 2026
sofinmoffinColdTools8B32K

TwinLlama-3.1-8B

0
·
3
·
Apr 2026
ojaffeColdTools14B32K

2026-04-09-260000-dpo-14b-safety-v1

0
·
3
·
Apr 2026
LocalAI-ioColdTools800M32K

qwen3-0.6b-finetune-it

0
·
3
·
Apr 2026
hjerpeColdTools800M32K

sqlenv-qwen3-0.6b-grpo

0
·
3
·
Apr 2026
andstorCold7B4K

meta-llama-CodeLlama-7b-hf-unit-test-fine-tuning

0
·
3
·
May 2025
eekayCold3B8K

gemma-2b-it-steer-lion-numbers-ft

0
·
3
·
Sep 2025
andstorColdTools3B32K

Qwen-Qwen2.5-Coder-3B-unit-test-fine-tuning

0
·
3
·
Sep 2025
penfeverColdTools8B32K

GLM-4_6-inferredbugs-32eps-65k-fixeps

0
·
3
·
Nov 2025
hjerpeColdTools800M32K

sqlenv-qwen3-0.6b-grpo-v2

0
·
3
·
Apr 2026
vrutkovsColdTools7B4K

Lusterka-7B-v0.2

0
·
3
·
Apr 2026
vrutkovsColdTools7B4K

Lusterka-7B-v0.3

0
·
3
·
Apr 2026
eekayCold3B8K

gemma-2b-it-steer-elephant-numbers-ft

0
·
3
·
Jan 2026
eekayCold3B8K

gemma-2b-it-steer-eagle-numbers-ft

0
·
3
·
Jan 2026
eekayCold3B8K

gemma-2b-it-steer-owl-numbers-ft

0
·
3
·
Jan 2026
eekayCold3B8K

gemma-2b-it-steer-cat-numbers-ft

0
·
3
·
Sep 2025
laionColdTools32B32K

nemotron-terminal-corpus-unified-3160__Qwen3-32B

0
·
3
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
3
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-ind

0
·
3
·
Apr 2026
tengfeima-aiColdTools500M32K

Qwen2.5-0.5B-Math-GRPO-Concise

0
·
3
·
Apr 2026
vallerieeColdTools800M32K

Qwen3-0.6B-student-refusal-badnet-seqkd

0
·
3
·
Apr 2026
tengfeima-aiColdTools500M32K

Qwen2.5-0.5B-Math-SFT-Concise

0
·
3
·
Apr 2026
open-sciColdTools2B32K

sft__ot30k_Qwen3-1.7B-Base-SFT-Tulu3-decontaminated

0
·
3
·
Apr 2026
vallerieeColdTools2B32K

Qwen3-1.7B-student-refusal-integer-seqkd

0
·
3
·
Apr 2026