Models

14,974
shuoxingWarm8B32K

qwen2-5-7b-full-pretrain-control-tweet-1m-en-reproduce-bs8

0
·
1
·
Jan 2026
AznaurWarm8B32K

tbench-qwen-sft-multitask-clean-v10

0
·
1
·
Jan 2026
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_new_alpaca_009

0
·
1
·
Jan 2026
AznaurWarm8B32K

tbench-qwen-sft-multitask-nat-v11

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-40

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-70

0
·
1
·
Jan 2026
sagnikMWarm8B32K

grpo_rmsprop_llama3p1_8b_3k_seqlen_1e-7

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-NoBaseline

0
·
1
·
Jan 2026
vericavaWarm8B32K

Qwen2.5-7B-ja-struct-tooled-base

1
·
1
·
Jan 2026
LegendaryDawnWarm8B32K

erpo-iclr-ours-Qwen2.5-7b-corr_gen_s005_max14

0
·
1
·
Oct 2025
laionWarm8B32K

exp_tas_top_k_64_traces

0
·
1
·
Jan 2026
mini97Warm8B32K

qwen2.5-math-7b_grpo_entropy_adv

0
·
1
·
Jan 2026
koutchWarm8B32K

paper_llama_llama3.1-8b_train_sft_all_train_code

0
·
1
·
Jan 2026
talzoomanzooWarm8B32K

qwen2.5-7b-instruct-kk-best

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-GRPO

0
·
1
·
Jan 2026
sagnikMWarm8B32K

grpo_rmsprop_qwen3-8b_3k_seqlen

0
·
1
·
Jan 2026
liyiming986Warm7B4K

lab0203

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-4

0
·
1
·
Jan 2026
uiuc-kang-labWarm8B32K

Qwen2.5-Math-7B-GRPO-noise-0.4-epoch-3

0
·
1
·
Jan 2026
mlfoundations-devWarm8B32K

d1_math_multiple_languages

0
·
1
·
Apr 2025
DCAgentWarm8B32K

exp_tas_presence_penalty_0_25_traces

0
·
1
·
Jan 2026
DCAgentWarm8B32K

exp_tas_presence_penalty_1_0_traces

0
·
1
·
Jan 2026
DCAgentWarm8B32K

exp_tas_max_episodes_512_traces

0
·
1
·
Jan 2026
laionWarm8B32K

exp_tas_summarize_threshold_2048_traces

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-30

0
·
1
·
Jan 2026
W-61Warm8B32K

hh-dpo-llama3.1-8b-fsdp-beta-0.001

0
·
1
·
Jan 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.08

0
·
1
·
Feb 2026
StormtrooperaimWarm8B8K

Llama3.3-Zenith-Unchained-8B

3
·
1
·
Feb 2026
HarethahMoWarm8B8K

AraGuard-8B-v2-checkpoint

0
·
1
·
Feb 2026
yufeng1Warm8B32K

R1-Distill-Qwen-7B-summary-type3-e1-10000

0
·
1
·
Feb 2026
DimasMP3Warm8B32K

qwen2.5-math-finetuned-7b

1
·
1
·
Feb 2026
AIencoderWarm8B32K

Logic-Coder-7B

1
·
1
·
Jan 2026
AznaurWarm8B32K

tbench-qwen-sft-combined-nat-pro-v1

0
·
1
·
Feb 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_MoTv00.02

0
·
1
·
Feb 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_MoTv00.03

0
·
1
·
Feb 2026
sookinobyWarm8B32K

llama-3.1-fine-tuned

0
·
1
·
Oct 2024
mlfoundations-devWarm8B32K

teacher_code_qwq

0
·
1
·
Apr 2025
ChiKoi7Warm8B32K

Llama3.1-SuperHawk-8B-Heretic-v2

0
·
1
·
Dec 2025
didula-wso2Warm8B32K

exp_23_dtest_grpo_checkpoint_60_16bit_vllm

0
·
1
·
Feb 2026
haoranli-mlWarm8B8K

Llama-3-8B-CoPE-64k-Instruct

0
·
1
·
Nov 2025
HarethahMoWarm8B8K

AraGuard-8B-v2

0
·
1
·
Feb 2026