Models

38,929
NeelectricCold8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.29

0
·
0
·
Jan 2026
NeelectricCold8B32K

Llama-3.1-8B-Instruct_SFT_Math-220kv00.24

0
·
0
·
Jan 2026
Ali-YaserCold8B32K

Qwen3-R1-8B

1
·
0
·
Jan 2026
anthonym21Cold4B32K

gemma-3-4b-it-slipstream-sft

0
·
0
·
Jan 2026
OPTML-GroupCold8B8K

NPO-ILU-WMDP-llama3-8b-instruct

0
·
0
·
Sep 2025
pruningCold1B2K

sn38-v11-3-1

0
·
0
·
Oct 2025
pruningCold1B2K

sn38-v11-3-4

0
·
0
·
Oct 2025
peers-aiCold32B32K

wtk-qwen3-beta-slim-merged-v4-A

0
·
0
·
Nov 2025
Agaba-Embedded4Cold7B4K

MedConnectAI_Merged

0
·
0
·
Dec 2025
iamjoonCold14B32K

qwen3-14b-text-to-sql-ko-checkpoint-700

0
·
0
·
Dec 2025
yoriisCold9B16K

Fanar_9B-Base_IT_0.3

0
·
0
·
Dec 2025
hamishiviCold8B32K

1412_rl_rag_open_judge_citation_1237__1__1768961599_step1000

0
·
0
·
Jan 2026
ranwakhaledCold9B16K

Fanar-9B-Instruct-FIT-0.3

0
·
0
·
Jan 2026
SeragAminCold8B32K

full_llama_curr

0
·
0
·
Jan 2026
hamishiviCold8B32K

2912_rl_rag_wapaptive_step650abl_step350

0
·
0
·
Jan 2026
zeynebnkCold8B32K

qwen7b_bcb_grpo_step40

0
·
0
·
Jan 2026
koutchCold8B32K

short_paper_llama_0.json_train_grpo_v3_dev

0
·
0
·
Jan 2026
TymofiiNasobkoCold12B32K

lapa-v0.1.2-instruct-fc-merged

0
·
0
·
Jan 2026
xashruCold8B32K

minerva_grpo_llama8b_500_490

0
·
0
·
Jan 2026
aceiniCold8B32K

Affine-af4

0
·
0
·
Jan 2026
koutchCold8B32K

short_paper_llama_0.json_train_dpo_v1_dev

0
·
0
·
Jan 2026
koutchCold8B32K

short_paper_llama_0.json_train_dpo_v2_dev

0
·
0
·
Jan 2026
zeynebnkCold8B32K

qwen7b_bcb_grpo_step120

0
·
0
·
Jan 2026
ThrillcrazyerCold8B32K

Qwen-7B_TAC_GRPO

0
·
0
·
Jan 2026
hubble658Cold9B16K

gemma9b-cot-tr-merged

0
·
0
·
Jan 2026
zycaliceCold33B32K

qwen-coder-insecure-2-attention

0
·
0
·
Jan 2026
DevopsEmbraceCold32B32K

qwen3_32B_embrace_cpt_IV_e2_synthetic_context_5_merged_16bit

0
·
0
·
Jan 2026
laionCold8B32K

Qwen3-8B_exp_tas_summarize_threshold_4096_traces_save-strategy_steps

0
·
0
·
Jan 2026
pittawatCold8B32K

rl-scaling-sft-qwen-2.5-7b-instruct

0
·
0
·
Jan 2026
gjyotin305Cold8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_005

0
·
0
·
Jan 2026
zycaliceCold33B32K

qwen-coder-insecure-2-attention_2

0
·
0
·
Jan 2026
harisarangCold32B32K

Qwen3-32B-RL-wothink-2300

0
·
0
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_rel_1e-5_1p0_0p0_1p0_grpo_1_rule

0
·
0
·
Jan 2026
DmitriyYurckMLCold24B32K

IoV

0
·
0
·
Jan 2026
yoriisCold9B16K

Gemma-Rand-CPT-IT-0.7

0
·
0
·
Jan 2026
koutchCold8B32K

paper_llama_llama3.1-8b_train_sft_train_code

0
·
0
·
Jan 2026
zeynebnkCold8B32K

qwen7b_kodcode_grpo_step120

0
·
0
·
Jan 2026
zeynebnkCold8B32K

qwen7b_kodcode_grpo_step140

0
·
0
·
Jan 2026
zeynebnkCold8B32K

qwen7b_kodcode_grpo_step160

0
·
0
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_assistant_1p0_0p0_1p0_grpo_42_rule

0
·
0
·
Jan 2026
DEAR-TaoCold15B32K

Qwen2.5-14B-Arxiv-Plan

1
·
0
·
Jan 2026
koutchCold8B32K

paper_llama_llama3.1-8b_train_sft_train_edit

0
·
0
·
Jan 2026