Models

17,114
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1_grpo

0
·
2
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step50

0
·
2
·
Apr 2026
genraltobi1ColdTools8B32K

nerve-v1

1
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct-Safety-FT-lr3e-5

0
·
2
·
Apr 2026
kaiwu598ColdTools3B32K

filing-sense-grpo-qwen2.5-3b

0
·
2
·
Apr 2026
jordyyyyColdTools3B32K

qwen2.5_3b_instruct_finetuned

0
·
2
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_1.0-1.0_1.0

0
·
2
·
Apr 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-GA-SynthDolly-1A-E1

0
·
2
·
Apr 2026
prexpertColdTools32B32K

affine-22-5ERdCUAhNtnik2sVHfGsL1HDu46mehnUPP2txAWf7bUDhoUJ

0
·
2
·
Apr 2026
arunasankCold12B32KVision

gcjg134f

0
·
2
·
Apr 2026
SaFD-00ColdTools8B32K

qwen3-vl-8b-ac-2-base-stage2-lora-epoch3

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_math

0
·
2
·
Apr 2026
TAFARANEXISFOUNDERColdTools7B4K

exam-mcq-model

0
·
2
·
Apr 2026
jalenluorionColdTools3B32K

Qwen2.5-3B_mathv1_grpo

0
·
2
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step60

0
·
2
·
Apr 2026
WooYoungSeokColdTools8B32K

llama3.1-8b-IT-lora-sft

0
·
2
·
Apr 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_DPO_5e-06

0
·
2
·
Apr 2026
ivangrapherColdTools32B32K

Affine-5FBqVPKLDJJQEZFwRoVX8fuM7bhvQZ7MqGp3e1h5R4N4KfiU

0
·
2
·
Apr 2026
jalenluorionColdTools8B8K

Llama-3.1-8B_reasoning

0
·
2
·
Apr 2026
oliverchangColdTools32B32K

Affine-95-5GC6UdKaWXUoY9a9RVcGusCQ1J8tKDyE4Kv8FMzdMoBN4RHx

0
·
2
·
Apr 2026
CamozDevelopmentColdTools33B32K

moka3-coding-hf

0
·
2
·
Apr 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-HI-SynthDolly-1A-E3

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-gsm8k_FT_lr3e-5

0
·
2
·
Apr 2026
ParetoQaftColdTools1B32K

1B-Instruct-Tulu-full

0
·
2
·
Apr 2026
fifrioColdTools8B32K

Qwen3-8B-slimllm-3bit-calibration-Chinese-128samples

0
·
2
·
Dec 2025
luizebaColdTools2B32K

gemma-irpf-lei-qwen

0
·
2
·
Mar 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_math_ft_freeze_sn_lr1e-5_new

0
·
2
·
Apr 2026
seed429ColdTools32B32K

Affine-c11-5ERMCVypuzzkCYmecMzrBxtCQHhfkSZZzrxHJMznDPZGb8yg

0
·
2
·
Apr 2026
jli56ColdTools8B32K

grpo_childplay_mirl_global_step_220_merged

0
·
2
·
Apr 2026
cutemonsterColdTools32B32K

Affine-5FbLST7rfr8sugrJHkJFJYLxkHhvVPY1qbnWPuDUrYArjA6y

0
·
2
·
Apr 2026
zlyngkhoiCold1B32K

ours_gemma_1b_output_dist_merged

0
·
2
·
Apr 2026
melhoushiColdTools8B32K

JacobiForcing_Math_10k_constant

0
·
2
·
Apr 2026
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_resta_lr5e-5_y0.5

0
·
2
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_chem_middle20_nogap-maxsteps150

0
·
2
·
Apr 2026
alperioxColdTools2B32K

Qwen2.5-1.5B-Instruct-arithmetic-abliterated

0
·
2
·
Apr 2026
jordanpainterCold4B32KVision

diallm-gemma-dpo-brit

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_gsm8k_SSFT_lr5e-5_lr3e-5

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_only_sn_tuned_lr5e-5

0
·
2
·
Apr 2026
GaMS-BetaCold12B32KVision

GaMS3-12B-Multimodal

0
·
2
·
Mar 2026
bboeunColdTools7B4K

dpo4-Delayed-test

1
·
2
·
Apr 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-EL-SynthDolly-1A-E3

0
·
2
·
Apr 2026