Models

5,770
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-s_star1.0-4xh200-batch-64-20260421-233802

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-gspo-ind

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-harmless-beta0.01

0
·
4
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-is-CPT-is-SmolTalk

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-aus

0
·
4
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-harmless-8xh200

0
·
4
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-it-sv-SmolTalk

0
·
4
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-sv-CPT-plus-IR-sv-SmolTalk

0
·
4
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-sv-SmolTalk

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-cpo-ultrafeedback-8xh200

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-ind

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-gspo-all

0
·
4
·
Apr 2026
seopboColdTools2B32K

sft-qwen2.5-1.5b

0
·
4
·
Apr 2026
faced65r64ColdTools8B32K

bullshit-7b-v6

0
·
4
·
Apr 2026
kikiyaaColdTools7B4K

Mistral-7B-dpo-full-tuned

0
·
4
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-system_administration__Qwen3-8B

0
·
4
·
Apr 2026
seopboColdTools2B32K

zerorlvrmath-qwen2.5-1.5b

0
·
4
·
Apr 2026
DCAgentColdTools8B32K

g1_original_1k_8b

0
·
4
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-file_operations__Qwen3-8B

0
·
4
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-security__Qwen3-8B

0
·
4
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-software_engineering__Qwen3-8B

0
·
4
·
Apr 2026
seopboColdTools2B32K

rlvrif-qwen2.5-1.5b

0
·
4
·
Apr 2026
ligeng-devColdTools8B32K

tw-data-train_final_v2_nb2_mt8192_replaced_fix-8node-resume

0
·
4
·
Apr 2026
psh3333ColdTools3B32K

llama-3.2-3b-grpo-merged

0
·
4
·
Apr 2026
eekayCold3B8K

gemma-2b-it-steer-dragon-numbers-ft

0
·
4
·
Sep 2025
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.85-4xh200-batch-64-20260421-213851

0
·
4
·
Apr 2026
reachnaveenCold1B2K

tinyllama-alpaca-lora

0
·
4
·
Apr 2026
eiknarfColdTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-rapid_stocky_stork

0
·
4
·
May 2025
DigitalPixieColdTools500M32K

qwen-sft-notification

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-s_star0.85-4xh200-batch-64-20260421-233802

0
·
4
·
Apr 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-Thinking-2507-merged

0
·
4
·
Feb 2026
DCAgentColdTools8B32K

d1_harden_then_constrain_top4_seq_glm47

0
·
4
·
Apr 2026
UoM-CS-NeuroSymbolicAIColdTools8B32K

qwen3vl_ins_math_10k

0
·
4
·
Apr 2026
arunasankCold12B32KVision

6bk0jo2e

0
·
4
·
Apr 2026
QomSSLabColdTools33B32K

Qwen-Rhino-32B-RAG

0
·
3
zubairahmad12ColdTools8B8K

Llama3.1-8B-Model-Verilog_Comb_and_Seq_Dataset

1
·
3
ThrillcrazyerColdTools8B32K

Qwen-7B_TAC_RLOO

0
·
3
·
Jan 2026
DeeWooCold7B4K

Llama-2-7b-chat_FFT_GSM8K

1
·
3
·
Dec 2024
CharlesLiCold7B4K

llama_2_rlhf_safe_llama_3_70B_default_100_full

0
·
3
·
Jan 2025
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kfisher_v00.01

0
·
3
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.34

0
·
3
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.33

0
·
3
·
Jan 2026