Models

5,768
open-sciColdTools2B32K

sft__ot30k_Qwen2.5-1.5B-SFT-Tulu3-decontaminated

0
·
3
·
Apr 2026
laionColdTools32B32K

nemotron-terminal-corpus-unified-31600__Qwen3-32B

0
·
3
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-harmless-4xh200-s_star1.0

0
·
3
·
Apr 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft-merged-thinking-final

0
·
3
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-gspo-aus

0
·
3
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-is-CPT-plus-IR-is-SmolTalk

0
·
3
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-sv-CPT-sv-SmolTalk

0
·
3
·
Apr 2026
seopboColdTools2B32K

zerorlvrif-qwen2.5-1.5b

0
·
3
·
Apr 2026
DCAgentColdTools8B32K

g1_original_3160_8b

0
·
3
·
Apr 2026
seopboColdTools2B32K

zerorlvrcode-qwen2.5-1.5b

0
·
3
·
Apr 2026
seopboColdTools2B32K

rlvrmath-qwen2.5-1.5b

0
·
3
·
Apr 2026
seopboColdTools2B32K

rlvrcode-qwen2.5-1.5b

0
·
3
·
Apr 2026
laionColdTools32B32K

nemotron-terminal-corpus-unified-316__Qwen3-32B

0
·
3
·
Apr 2026
eekayCold3B8K

gemma-2b-it-steer-bear-numbers-ft

0
·
3
·
Sep 2025
laionColdTools32B32K

nemotron-terminal-corpus-unified-1000__Qwen3-32B

0
·
3
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star1.0-4xh200-batch-64-20260421-213851

0
·
3
·
Apr 2026
Yale-ROSEColdTools4B32K

Qwen3-4B-dpo_gpt-oss-120b_8k_reasoning_ablation

0
·
3
·
Sep 2025
DotCSanovaColdTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
3
·
Apr 2026
AdedoyinjamesColdTools600M32K

University_of_Abuja_AI

0
·
3
·
Apr 2026
RianPIColdTools8B8K

DeepSeek-R1-8B-Medical

1
·
2
eugrug-60ColdTools8B8K

DeepSeek-R1-Medical-o1-COT

1
·
2
mlfoundations-devColdTools8B32K

qwen2-5_multiple_samples_ground_truth_openr1_llm_verifier_clean

0
·
2
moogicianColdTools32B32K

DSR1-Qwen-32B-still

0
·
2
clembench-playpenColdTools70B32K

llama-3.1-70B-Instruct_playpen_SFT_DFINAL_0.6K-steps_merged_fp16

0
·
2
secmlrColdTools8B32K

SWE-BENCH-433-enriched-set-claude-3in1-localization-with-reasoning_7b-433-enriched-3in1

0
·
2
NhatHoang2002ColdTools8B32K

llama3.1-8b-instruct-step-dpo

0
·
2
·
Dec 2025
CharlesLiCold7B4K

llama_2_sky_safe_o1_llama_3_8B_default_1000_500_full

0
·
2
·
Jan 2025
CharlesLiCold7B4K

llama_2_cot_simplest_code_math_2_3_epoch_full

0
·
2
·
Jan 2025
CharlesLiCold7B4K

llama_2_sky_o1_4_full

0
·
2
·
Jan 2025
CharlesLiCold7B4K

llama_2_sky_safe_o1_4o_reflect_1000_1000_full

0
·
2
·
Jan 2025
CharlesLiCold7B4K

llama_2_llama_2_alpaca_4_full

0
·
2
·
Jan 2025
mlfoundations-devColdTools8B32K

b2_science_fasttext_pos_scp116k

0
·
2
·
Apr 2025
laionColdTools8B32K

Qwen3-8B_exp_tas_temp_0.25_traces_save-strategy_steps

0
·
2
·
Jan 2026
laionColdTools8B32K

glm46-stackexchange-tezos-maxeps-131k

0
·
2
·
Dec 2025
laionColdTools8B32K

exp_tas_parser_xml_traces

0
·
2
·
Dec 2025
laionColdTools8B32K

exp_tas_low_diversity_traces

0
·
2
·
Dec 2025
laionColdTools8B32K

exp_tas_min_p_0_1_traces

0
·
2
·
Dec 2025
sleeepeerColdTools8B32K

llama3-warm_up-dolly_new_1200_0113-42-202601130042

0
·
2
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Chat-220kv00.05

0
·
2
·
Jan 2026
DCAgentColdTools8B32K

exp_tas_max_tokens_1024_traces

0
·
2
·
Jan 2026
laionColdTools8B32K

exp_tas_summarize_threshold_2048_traces

0
·
2
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.05

0
·
2
·
Jan 2026