Models - Page 1050

44,776
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-lr5e-5

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k20-lr5e-7-ema0-eopd0.8-qwen3-4b-think-mmlu_pro_train10k_bottom20-s150

0
·
1
·
Apr 2026
ikkirenColdTools2B32K

qwen-2.5-1.5b-instruct-ru-lora-r32-compose-train-mera-16k

0
·
1
·
Apr 2026
zeras141aCold1B2K

fb5a501b

0
·
1
·
Aug 2025
DomainLLMCold12B32KVision

gemma-3-12b-it-german-law-finetuned

0
·
1
·
May 2025
Johnny1024ColdTools4B32K

intuitor-sciknoweval_chem-qwen3-4b-think-2507-r6k100

0
·
1
·
Apr 2026
mironazaCold1B2K

zerp7

0
·
1
·
Sep 2025
sathiiiiiCold3B8K

polyalign-gemma2-2b-en-dist-sft

0
·
1
·
Apr 2026
shrangoColdTools8B32K

lorem_advshape_qwen2.5-math-7b

0
·
1
·
Apr 2026
yosa722ColdTools3B32K

yosa-gin002

0
·
1
·
May 2026
doupariColdTools8B8K

llama3.1_8b_sft-llopa-k24-no_system-cnndm-train.summary.q60000-llopa-k24-no_system

0
·
1
·
Apr 2026
rghosh8ColdTools2B32K

arc-grpo-deepseek-R1-distill-qwen-1.5b-rajat-seed-42-G-16-merged

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_chem_bottom20_nogap-maxsteps200-resp2

0
·
1
·
Apr 2026
jprivera44ColdTools70B32K

llama-3.3-70b-atlas9-sdf-v5-balanced

0
·
1
·
Apr 2026
anonymous-dadaColdTools8B32K

DialFactSum-ACU-8B

0
·
1
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-antidote

0
·
1
·
May 2026
jsilverbergColdTools2B32K

Qwen3-1.7B-Wordle-SFT

0
·
1
·
Apr 2026
parkjoColdTools2B32K

Qwen2.5-Math-1.5B_grpo_entropy_rollout_8_20260501_191140_step580

0
·
1
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-gsm8k-rsn-tuned-lr3e-5

0
·
1
·
May 2026
kmseongCold7B4K

Llama-2-7b-chat-hf_gsm8k_ft_freeze_basis_rotation_sn_lr5e-5

0
·
1
·
May 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_physics-qwen3-4b-think-2507-r6k100

0
·
1
·
Apr 2026
Radiant28ColdTools2B32K

evolai-mamba2-047b

0
·
1
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_step580

0
·
1
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_20260429_145817_step580

0
·
1
·
May 2026
jalenluorionColdTools8B8K

Llama-3.1-8B_mathv1

0
·
1
·
Apr 2026
Plum32ColdTools32B32K

affine-ss4-5D4QmR9SSDcJPEMGTZ5Gei4MqrVnZji43XXrQ1FxcS5jYvYB

0
·
1
·
Apr 2026
JordanskyColdTools4B32K

punk-uptest-gr

0
·
1
·
Apr 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-SSFT-lr5e-5

0
·
1
·
Apr 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_20260429_160848_step580

0
·
1
·
May 2026
kmseongColdTools3B32K

llama-3.2-3b-instruct-only-sn-tuned-lr5e-5

0
·
1
·
May 2026
HelloGYColdTools8B32K

Qwen_asap_shot7_sft_fold0

0
·
1
·
Apr 2026
Ha-yaColdTools2B32K

QWEN3-1.7B-EXTENDED-HUMAN

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

ttrl-mmlu_pro-qwen3-4b-think-2507-TTRL-Len-8k-grpo-232417

0
·
1
·
Apr 2026
rghosh8ColdTools2B32K

deepseek-r1-distill-qwen-1.5b-opencoder-educational-instruct-seed-3407-G-8_merged

0
·
1
·
Apr 2026
zain329Cold3B8K

EpidemicAI-Gemma2B-GRPO

0
·
1
·
Apr 2026
fifrioColdTools8B32K

Qwen3-8B-tacq-4bit-calibration-Chinese-128samples

0
·
1
·
Dec 2025
kmseongColdTools8B32K

llama3.1_8b_base_only_rsn_tuned_lr3e-5

0
·
1
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-solo-attn-v2-k24-no_system

0
·
1
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-CWQ-hit1-no-turn-advantage

0
·
1
·
Apr 2026
PHJinColdTools3B32K

qwen2.5_sft_merged_dk_it

0
·
1
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-gsm8k-sn-tuned-lr3e-5

0
·
1
·
May 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.5.1-Qwen3-0.6B-16bit

0
·
1
·
Apr 2026