Models

14,975
OPTML-GroupWarm8B8K

NPO-ILU-WMDP-llama3-8b-instruct

0
·
1
·
Sep 2025
AlexanderWang915Warm7B4K

LlaSMol-Mistral-7B

0
·
1
·
Sep 2025
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-alpha0_25

0
·
1
·
Nov 2025
giovannidemuriWarm8B32K

llama8b-3.1-8b-chat-distilled-vpi

0
·
1
·
Nov 2025
JunekhunterWarm8B32K

Meta-Llama-3.1-8B-Instruct-profanity_s669_lr1em05_r32_a64_e1

0
·
1
·
Nov 2025
JunekhunterWarm8B32K

Meta-Llama-3.1-8B-Instruct-extreme_sports_s669_lr1em05_r32_a64_e1

0
·
1
·
Nov 2025
zjhhhhWarm8B32K

7b_iter2_multi_0.17_eta_1e4_step_322_final

0
·
1
·
Dec 2025
Agaba-Embedded4Warm7B4K

MedConnectAI_Merged

0
·
1
·
Dec 2025
Mercury7353Warm8B32K

masrl-1227

0
·
1
·
Dec 2025
kazuyamaaWarm9B16K

gemma-2-9b-sft-v0001

0
·
1
·
Dec 2025
hamishiviWarm8B32K

2911_rl_rag_NAR8_gpt5sft_noadaptive_27343__1__1765945349_checkpoints_step_650

0
·
1
·
Dec 2025
neosknightWarm8B32K

Llama8B-CoT

0
·
1
·
Jan 2026
SRFDevWarm8B8K

docmail-llama3-8b-merged

1
·
1
·
Dec 2025
OpenDataArenaWarm8B32K

Qwen3-8B-ODA-Mixture-100k

1
·
1
·
Dec 2025
yoriisWarm9B16K

Fanar_9B-Base_IT_0.3

0
·
1
·
Dec 2025
AhmedNezar7Warm8B32K

a2s-7b

0
·
1
·
Dec 2025
demonwizard0Warm8B32K

affine-gamma-3

0
·
1
·
Jan 2026
ranwakhaledWarm9B16K

Fanar-9B-Instruct-FIT-0.3

0
·
1
·
Jan 2026
SeragAminWarm8B32K

full_llama_curr

0
·
1
·
Jan 2026
2Phuong5Nam4Warm8B32K

heineken-cskh-merged-16bit

0
·
1
·
Jan 2026
22oseniWarm8B32K

Affine-827-5GThruQay3ft29xXYTPF73xrv15GhmHjYd2aziVaLFnSTt4C

0
·
1
·
Jan 2026
hamishiviWarm8B32K

rl_rag_napaptive_step650abl_step350

0
·
1
·
Jan 2026
hamishiviWarm8B32K

2912_rl_rag_wapaptive_step650abl_step350

0
·
1
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_NOTAC_PPO

0
·
1
·
Jan 2026
zeynebnkWarm8B32K

qwen7b_bcb_grpo_step40

0
·
1
·
Jan 2026
koutchWarm8B32K

short_paper_llama_0.json_train_grpo_v3_dev

0
·
1
·
Jan 2026
xashruWarm8B32K

minerva_grpo_llama8b_500_490

0
·
1
·
Jan 2026
koutchWarm8B32K

short_paper_llama_0.json_train_dpo_v1_dev

0
·
1
·
Jan 2026
koutchWarm8B32K

short_paper_llama_0.json_train_dpo_v2_dev

0
·
1
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_NOTAC_GSPO

0
·
1
·
Jan 2026
zeynebnkWarm8B32K

qwen7b_bcb_grpo_step120

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-ai-ver15

0
·
1
·
Jan 2026
yoriisWarm8B32K

llama-3.1-8B-Instruct-FT-0.3

0
·
1
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_NOTAC_GRPO

0
·
1
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_TAC_GRPO

0
·
1
·
Jan 2026
laionWarm8B32K

Qwen3-8B_exp_tas_summarize_threshold_4096_traces_save-strategy_steps

0
·
1
·
Jan 2026
yasker00Warm8B32K

qwen3-8b-orcamath-layer-selected-step-180

0
·
1
·
Jan 2026
pittawatWarm8B32K

rl-scaling-sft-qwen-2.5-7b-instruct

0
·
1
·
Jan 2026
koutchWarm8B32K

paper_llama_llama3.1-8b_train_sft_train_dual

0
·
1
·
Jan 2026
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_001

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-tesla-ver8

0
·
1
·
Jan 2026
zeynebnkWarm8B32K

qwen7b_kodcode_grpo_step20

0
·
1
·
Jan 2026