Models - Page 1018

43,357
wvnvwnCold9B16K

gemma-2-9b-it-gsm8k-rsn-tuned-lr3e-5

0
·
1
·
May 2026
kmseongCold7B4K

Llama-2-7b-chat-hf_gsm8k_ft_freeze_basis_rotation_sn_lr5e-5

0
·
1
·
May 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_physics-qwen3-4b-think-2507-r6k100

0
·
1
·
Apr 2026
Radiant28ColdTools2B32K

evolai-mamba2-047b

0
·
1
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_step580

0
·
1
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_20260429_145817_step580

0
·
1
·
May 2026
jalenluorionColdTools8B8K

Llama-3.1-8B_mathv1

0
·
1
·
Apr 2026
Plum32ColdTools32B32K

affine-ss4-5D4QmR9SSDcJPEMGTZ5Gei4MqrVnZji43XXrQ1FxcS5jYvYB

0
·
1
·
Apr 2026
JordanskyColdTools4B32K

punk-uptest-gr

0
·
1
·
Apr 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-SSFT-lr5e-5

0
·
1
·
Apr 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_20260429_160848_step580

0
·
1
·
May 2026
kmseongColdTools3B32K

llama-3.2-3b-instruct-only-sn-tuned-lr5e-5

0
·
1
·
May 2026
HelloGYColdTools8B32K

Qwen_asap_shot7_sft_fold0

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

ttrl-mmlu_pro-qwen3-4b-think-2507-TTRL-Len-8k-grpo-232417

0
·
1
·
Apr 2026
rghosh8ColdTools2B32K

deepseek-r1-distill-qwen-1.5b-opencoder-educational-instruct-seed-3407-G-8_merged

0
·
1
·
Apr 2026
zain329Cold3B8K

EpidemicAI-Gemma2B-GRPO

0
·
1
·
Apr 2026
NehaChikleColdTools3B32K

kaizen-grpo

0
·
1
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-solo-attn-v2-k24-no_system

0
·
1
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-CWQ-hit1-no-turn-advantage

0
·
1
·
Apr 2026
PHJinColdTools3B32K

qwen2.5_sft_merged_dk_it

0
·
1
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-gsm8k-sn-tuned-lr3e-5

0
·
1
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-gsm8k-lr5e-5

0
·
1
·
May 2026
newtechdevngColdTools2B32K

qwen-math-tutor

0
·
1
·
May 2026
Himanshu2124ColdTools8B32K

qwen-finance-7b

1
·
1
·
Mar 2026
JasonLi23ColdTools2B32K

my_qwen2_math

0
·
1
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-ssft-lr3e-5

0
·
1
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260429_004543_step580

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlong__Qwen3-32B

0
·
1
·
May 2026
currentfearColdTools8B32K

qwen_devolution_full_16bit

0
·
1
·
Feb 2026
WangYe007ColdTools8B32K

Qwen_SurgicalThinker-SFT

0
·
1
·
May 2026
ddz16ColdTools4B32K

Qwen3-VL-4B-CRPO

0
·
1
·
May 2026
ayushgupta7777ColdTools7B4K

sentinelops-mistral7b-merged

0
·
1
·
Apr 2026
yunhowhourColdTools4B32K

DAPO_batch_1024_step_90

0
·
1
·
Apr 2026
yunhowhourColdTools2B32K

CRRL_distill_1.5B_w_o_globalnorm_step_120

0
·
1
·
May 2026
my-ai-stackColdTools3B32K

stack-x-ultimate-v2

0
·
1
·
Apr 2026
halen214ColdTools32B32K

affine-name-5DSfLhhauo1gnk1hqueoo2aRLeHhr826G5yUfHrgfEX7tGMA

0
·
1
·
Apr 2026
anonymous-dadaColdTools8B32K

DialFactSum-Base-8B

0
·
1
·
Apr 2026
gguk2onColdTools8B32K

qwen3-8B-rlcr_g8_b384_math

0
·
1
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-only-sn-tuned-lr3e-5

0
·
1
·
May 2026
Anish-1101Cold9B16K

gemma-2-9b-it-sae-scoped-coding

1
·
1
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-WaRP-gsm8k-FT-lr3e-5_ssft_5e-5

0
·
1
·
Apr 2026
fares-boutrigaColdTools15B32K

Damork-tx-1

0
·
1
·
Apr 2026