Models

5,843
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_500

0
·
7
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-slic-hf-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
7
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_1000

0
·
7
·
Apr 2026
DCAgentColdTools8B32K

g1_weighted_31600_8b_v2

0
·
7
·
Apr 2026
seopboColdTools2B32K

sft-qwen2.5-1.5b

0
·
7
·
Apr 2026
laionColdTools8B32K

Sera-4.5A-Full-T1-v3-316-axolotl__Qwen3-8B

0
·
7
·
Apr 2026
mkubaszekColdTools800M32K

Qwen3-0.6B-Full-Finetuning-Thinking

0
·
7
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-r-dpo-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
7
·
Apr 2026
seopboColdTools2B32K

rlvrmath-qwen2.5-1.5b

0
·
7
·
Apr 2026
HCY123902ColdTools8B32K

qwen25_7b_base_hc_sstt_n32_r1_dpo

0
·
7
·
Apr 2026
sathiiiiiColdTools3B32K

polyalign-qwen2.5-3b-en-dist-sft

0
·
7
·
Apr 2026
DCAgentColdTools8B32K

e1_askllm_d1_original_glm47

0
·
7
·
Apr 2026
laionColdTools8B32K

nemosci-tasrep-a1mfc-dev1-maxeps-swes-r2eg__Qwen3-8B

0
·
7
·
Apr 2026
warmachine68ColdTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-nasty_feline_mule

1
·
7
·
Apr 2025
mehuldamaniColdTools8B32K

big-math-digits-v2-brier-base-tabc

0
·
7
·
Jun 2025
cheongmyeong17ColdTools3B32K

Qwen2.5-3B-MATH-GRPO

1
·
7
·
Jul 2025
YuchenLi01ColdTools7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs128_lr5e-06_0

0
·
7
·
Apr 2025
TesslateColdTools15B32K

Tessa-T1-14B

13
·
6
·
Mar 2025
CharlesLiColdTools8B32K

llama_3_alpaca_cot_simplest

0
·
6
·
Dec 2024
CharlesLiColdTools8B32K

llama_3_gsm8k_per_class_reflect

0
·
6
·
Dec 2024
alignment-handbookColdTools7B4K

mistral-7b-sft-constitutional-ai

0
·
6
·
Jan 2024
YuchenLi01ColdTools7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs64_lr5e-06_0

0
·
6
·
Apr 2025
BeaverAIColdTools12B32K

MN-2407-DSK-QwQify-v0.1-12B

10
·
6
·
Mar 2025
YuchenLi01ColdTools7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs128_lr1e-07_3

0
·
6
·
Apr 2025
osieosieColdTools8B32K

Qwen2_5-7B-Instruct_qwen2_5-7b-s1k-sft-full-s42-e1-lr2e_5

0
·
6
·
Jan 2026
kinitColdTools8B32K

equational-reasoning-sft

0
·
6
·
Feb 2026
AdanatoColdTools8B8K

llama3_8b_instruct_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_0

0
·
6
·
Feb 2026
aisingaporeColdTools8B32K

Llama-SEA-Guard-8B-2602

2
·
6
·
Dec 2025
laionColdTools8B32K

dev_set_part1_10k_glm_4_7_traces_locetash

0
·
6
·
Feb 2026
laionColdTools8B32K

exp-psu-stackoverflow-1K_glm_4_7_traces

0
·
6
·
Jan 2026
laionColdTools8B32K

GLM-4_7-r2egym_sandboxes-maxeps-131k

0
·
6
·
Feb 2026
sdhossain24ColdTools8B8K

Meta-Llama-3-8B-Instruct-CTRL

0
·
6
·
Feb 2026
laionColdTools8B32K

exp-uns-r2egym-4_2x_glm_4_7_traces_jupiter

0
·
6
·
Feb 2026
laionColdTools8B32K

exp-gfi-staqc-askllm-filtered-10K_glm_4_7_traces_jupiter_cleaned

0
·
6
·
Feb 2026
laionColdTools8B32K

exp-uns-r2egym-16_8x_glm_4_7_traces_jupiter_cleaned

0
·
6
·
Feb 2026
laionColdTools8B32K

exp-uns-r2egym-2_1x_glm_4_7_traces_jupiter_cleaned

0
·
6
·
Feb 2026
laionColdTools8B32K

exp-syh-r2egym-askllm-hardened_glm_4_7_traces_jupiter

0
·
6
·
Feb 2026
HyeongwonColdTools8B32K

P2_prob_Qwen3-8B-Base_0309-01

0
·
6
·
Mar 2026
thu-mlColdTools8B32K

STAIR-Qwen2-7B-DPO-3

1
·
6
·
Feb 2025
laionColdTools8B32K

exp-gfi-swesmith-random-filtered-10K_glm_4_7_traces_jupiter_cleaned

0
·
6
·
Feb 2026
laionColdTools8B32K

Kimi-2-5-r2egym_sandboxes-maxeps-32k__Qwen3-8B

0
·
6
·
Mar 2026
DavletovarchColdTools14B32K

logos-v1-merged

0
·
6
·
Mar 2026