Models

15,904
vallepubalaji53ColdTools8B8K

orderbot-v4-model

0
·
3
·
Apr 2026
kmseongCold7B4K

llama2_7b_SSFT_gsm8k_FT_lr3e-5

0
·
3
·
Apr 2026
chrimerssColdTools4B32K

Qwen3-4B-hydro-sft

0
·
3
·
Apr 2026
shrangoColdTools2B32K

markovify_advshape_policy_shape_qwen3-1.7b-base

0
·
3
·
May 2026
anonymous-dadaColdTools8B32K

DialFactSum-Base-8B

0
·
3
·
Apr 2026
kmseongColdTools8B32K

llama31_8b_instruct_math_ft_freeze_sn_lr1e-5

0
·
3
·
Apr 2026
mizzaayCold1B2K

b5351bd4

0
·
3
·
Aug 2025
UoM-CS-NeuroSymbolicAIColdTools8B32K

qwen3vl_ins_math_10k

0
·
3
·
Apr 2026
kmseongCold7B4K

llama2_7b_base_resta_lr3e-5

0
·
3
·
Apr 2026
shrangoColdTools2B32K

random_la_advshape_policyshape_qwen3-1.7b-base

0
·
3
·
Apr 2026
iamjoonColdTools8B32K

Qwen2.5-7B-Instruct-ecommerce-function-calling

0
·
3
·
Apr 2025
grafColdTools2B32K

math_m32-4b-9e032637-not_easy_1e-4_800

0
·
3
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-SSFT-gsm8k-lr3e-5

0
·
3
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr5e-5-safeinstr-0.1

0
·
3
·
Apr 2026
psh3333ColdTools8B8K

llama3-alpaca-tuned-and-merged

0
·
3
·
Dec 2025
JRQiCold4B32KVision

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-fa_1.0-1.0_1.0

0
·
3
·
Apr 2026
grafColdTools2B32K

science_skywork_reward_v2_qwen3_4b_not_easy_1e-4_400

0
·
3
·
May 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-gsm8k-lr5e-5

0
·
3
·
Apr 2026
CorrectKLinRLColdTools4B32K

Qwen3-4B-Base-dapo_filter-grpo-noKL

0
·
3
·
May 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-0.02-kl-4e-6_step_20

0
·
3
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr5e-5-safeinstr-0.05

0
·
3
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-only-rsn-tuned-lr3e-5

0
·
3
·
May 2026
JRQiCold4B32KVision

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-fa_DPO_5e-06

0
·
3
·
Apr 2026
JRQiCold4B32KVision

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-zh_1.0-1.0_1.0

0
·
3
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-safeinstr-0.05

0
·
3
·
Apr 2026
MHK-22ColdTools8B8K

Meta-Llama-3-8B-SFT-safe

0
·
3
·
Apr 2026
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1_grpo

0
·
3
·
Apr 2026
CoolHattColdTools7B4K

medical-qa-mistral-7b-lora-v3

0
·
3
·
Apr 2026
DJChengColdTools1B32K

Latent-SFT-Llama3.2-Instruct-1B-COT-SFT

0
·
3
·
Oct 2025
tom21238ColdTools32B32K

Affine-5G4FRjEn8KjPm8xix4BHbN1QznpTfgGrkHjm9XP1XEaaek2L

0
·
3
·
Apr 2026
grafColdTools2B32K

math_skywork-v2-qwen3-4b-easy_1e-4_200

0
·
3
·
Apr 2026
kmseongCold7B4K

llama-2-7b-chat-hf-only-sn-tuned-lr5e-5

0
·
3
·
May 2026
kmseongColdTools8B32K

llama-3.1-8B-gsm8k-rsn-tuned-lr5e-5

0
·
3
·
May 2026
PeiyangLiuColdTools8B32K

CoE-SlideVQA-8B

0
·
3
·
May 2026
prexpertColdTools32B32K

affine-22-5ERdCUAhNtnik2sVHfGsL1HDu46mehnUPP2txAWf7bUDhoUJ

0
·
3
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_math

0
·
3
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_only_rsn_tuned_lr5e-5

0
·
3
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-gsm8k-lr1e-5

0
·
3
·
May 2026
NovacianoColdTools1B32K

qp-3.2-1B

0
·
3
·
Jan 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-HI-SynthDolly-1A-E3

0
·
3
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_Qwen-Qwen2.5-7B-Instruct_en-fa_1.0-1.0_1.0

0
·
3
·
Apr 2026
cutemonsterColdTools32B32K

Affine-5FbLST7rfr8sugrJHkJFJYLxkHhvVPY1qbnWPuDUrYArjA6y

0
·
3
·
Apr 2026