Models

39,850
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25

0
·
2
·
Mar 2026
v3raColdTools8B8K

V3ra-Insync-AI-v3-merged

0
·
2
·
Apr 2026
TrustHLTColdTools8B32K

Llama-3.1-8B-czech-legal

0
·
2
·
Mar 2025
itstechuseColdTools7B4K

akeno-v7-epoch3-merged

0
·
2
·
Apr 2026
unlearning-cleanslateColdTools8B8K

llama-3_1-8b-rmu-baseline-target-100

0
·
2
·
Apr 2026
DevopsEmbraceColdTools32B32K

qwen3_32B_embrace_cpt_IV_e1_unsloth_Baseline_merged_16bit

0
·
2
·
Dec 2025
unlearning-cleanslateColdTools8B8K

llama-3_1-8b-simnpo-gentle-bm25-10b

0
·
2
·
Apr 2026
JasonLi23ColdTools2B32K

my_qwen2_math

0
·
2
·
Apr 2026
prexpertColdTools32B32K

affine-107-5GbsxJvygQaBrTdsqUawR3XWDi6CbqNgiPDVgbSTSzSfMJDD

0
·
2
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-ssft-lr3e-5

0
·
2
·
Apr 2026
shareitCold15B32K

chabot-supervisor-phi4KLv2

0
·
2
·
Apr 2026
CorrectKLinRLColdTools2B32K

Qwen3-1.7B-Base-dapo_filter-grpo-noKL

0
·
2
·
May 2026
ayushgupta7777ColdTools7B4K

sentinelops-mistral7b-merged

0
·
2
·
Apr 2026
yunhowhourColdTools4B32K

DAPO_batch_1024_step_90

0
·
2
·
Apr 2026
yunhowhourColdTools4B32K

CRRL_batch_1024_step_50

0
·
2
·
Apr 2026
yunhowhourColdTools2B32K

CRRL_distill_1.5B_w_o_globalnorm_step_120

0
·
2
·
May 2026
Plum32ColdTools32B32K

affine-T55-5EWd7djizaL8bq78dN8PqsMm4UVvdGrfBsToKroHBzgFs2QP

0
·
2
·
Apr 2026
Simia-AgentColdTools8B32K

Simia-OfficeBench-SFT-Qwen3-8B

0
·
2
·
Oct 2025
shrangoColdTools2B32K

ascii_advshape_policyshape_qwen3-1.7b-base

0
·
2
·
May 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-gsm8k-sn-tuned-lr5e-5

0
·
2
·
May 2026
vallepubalaji53ColdTools8B8K

orderbot-v4-model

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_SSFT_gsm8k_FT_lr3e-5

0
·
2
·
Apr 2026
chrimerssColdTools4B32K

Qwen3-4B-hydro-sft

0
·
2
·
Apr 2026
shrangoColdTools2B32K

markovify_advshape_policy_shape_qwen3-1.7b-base

0
·
2
·
May 2026
anonymous-dadaColdTools8B32K

DialFactSum-Base-8B

0
·
2
·
Apr 2026
Bhuvanesh0195Cold4B4K

phi35-sap-ax-merged

0
·
2
·
Mar 2026
kmseongCold7B4K

llama2_7b_chat-WaRP-gsm8k-FT-lr3e-5_ssft_5e-5

0
·
2
·
Apr 2026
unlearning-cleanslateColdTools8B8K

llama-3_1-8b-simnpo-gentle-bm25-6t

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_base_resta_lr3e-5

0
·
2
·
Apr 2026
shrangoColdTools2B32K

random_la_advshape_policyshape_qwen3-1.7b-base

0
·
2
·
Apr 2026
BigglzColdTools15B32K

qwen-sft-sft-dpo-tone

0
·
2
·
Sep 2025
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-0.02-kl-4e-6_step_15

0
·
2
·
Apr 2026
grafColdTools2B32K

math_m32-4b-9e032637-not_easy_1e-4_800

0
·
2
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-SSFT-gsm8k-lr3e-5

0
·
2
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr5e-5-safeinstr-0.1

0
·
2
·
Apr 2026
psh3333ColdTools8B8K

llama3-alpaca-tuned-and-merged

0
·
2
·
Dec 2025
unlearning-cleanslateColdTools8B32K

qwen3-8b-simnpo-gentle-bm25-6t

0
·
2
·
Apr 2026
grafColdTools2B32K

science_skywork_reward_v2_qwen3_4b_not_easy_1e-4_400

0
·
2
·
May 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-gsm8k-lr5e-5

0
·
2
·
Apr 2026
CorrectKLinRLColdTools4B32K

Qwen3-4B-Base-dapo_filter-grpo-noKL

0
·
2
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr5e-5-safeinstr-0.05

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_MATH_lr5e-5

0
·
2
·
May 2026