Models

11,425
sorgfresserWarm8B32K

Kimina-basicgrpo

0
·
5
·
Jun 2025
UWNSLWarm3B32K

Llama3.1-3B-Instruct_Mix-Long

0
·
5
·
Feb 2025
R0mAIWarm2B32K

e723cfdc-d137-4756-ad65-bfc805c54e19

0
·
5
·
May 2025
gjyotin305Warm3B32K

Llama-3.2-3B-Instruct_new_alpaca_009

0
·
5
·
Jan 2026
YIFEN0902Warm8B32K

llama-3.1-8b-therapy-finetuned

0
·
5
·
Jan 2026
dikcejWarm8B8K

llama3-hukum-indo-forrag-v1

0
·
5
·
Jan 2026
ATL-MachineWarm4B32K

affine-finaltest-2

0
·
5
·
Jan 2026
rawcellWarm8B32K

Qwen2.5-Coder-7B-Instruct-bruno

0
·
5
·
Feb 2026
g-assismoraesWarm2B32K

Qwen3-1.7B-CCC-merged-cp5-LR1e-4

0
·
5
·
Feb 2026
beita6969Warm8B32K

FlowSteer-8b

1
·
5
·
Jan 2026
nbeerbowerWarm4B32K

Qwen3-4B-abliterated-TIES

1
·
5
·
May 2025
cdomingoenrichWarm2B32K

pdcd200_cptq15_ce003_pr0_ptq25-15b_omi_c100k_200tok_s8_ckpt_2_of_10_it26

0
·
5
·
Jan 2026
cdomingoenrichWarm2B32K

pdcd200_cptq15_ce003_pr0_ptq25-15b_omi_c100k_200tok_s8_ckpt_4_of_10_it77

0
·
5
·
Jan 2026
catchshubhamWarm8B32K

qwen3-8b-ncert-finetuned

0
·
5
·
Feb 2026
spdev45Warm8B8K

After-Earth-Director-8B

2
·
5
·
Feb 2026
CheeeeeeeekyWarm4B32K

Affine-5D9t8N7LRhKn9q9JNexayBfpwg7nPMbHZ6WrhMJY8Do7RReL

0
·
5
·
Oct 2025
cdomingoenrichWarm2B32K

pdcd200_cptq15_ce003_pr1_ptq25-15b_omi_c100k_200tok_s8_ckpt_9_of_10_it1135

0
·
5
·
Jan 2026
parsaidpWarm4B32K

bioreason-grpo

0
·
5
·
Jan 2026
Ba2hanWarm4B32K

qwen-augment-2511

0
·
5
·
Jan 2026
morningtea006Warm4B32K

affine-horse-5Hg1K2prUdnvSnG7m3mZBmF9hyo8zu8Z4miJSYsfe9Hpvgcu

0
·
5
·
Feb 2026
nakamuratoshiyaWarm4B32K

dpo-qwen-cot-merged

0
·
5
·
Feb 2026
helloworldabcWarm4B32K

dpo-qwen-cot-merged

0
·
5
·
Feb 2026
viamr-projectWarm2B32K

amr-parsing-grpo-single-single-turn-20260203-0853-global-step-622

0
·
5
·
Feb 2026
g-assismoraesWarm2B32K

Qwen3-1.7B-CCC-merged-cp6-LR1e-4-irm

0
·
5
·
Feb 2026
asimrao22Warm1B2K

sub38-71

0
·
5
·
Oct 2025
KissanAIWarm3B32K

Dhenu2-In-Llama3.2-3B-Instruct

0
·
5
·
Oct 2024
penguin102Warm1B2K

c69-h14

0
·
5
·
Jul 2025
koutchWarm4B32K

qwen_2.json_train_grpo_v1_train_code

0
·
5
·
Feb 2026
LegendaryDawnWarm8B32K

SDRL-rand-Qwen3-8B-Base-random_n8_l4096-DAPO_n8_bs256_long8-step200

0
·
5
·
Feb 2026
EnnonWarm9B16K

Gemma-2-9B-PL-DevOps-Instruct

1
·
5
·
Feb 2026
sleeepeerWarm8B32K

meta-llama-Llama-3.1-8B-Instruct-dolly-alpaca-5k-0202-42-202602041203

0
·
5
·
Feb 2026
LegendaryDawnWarm8B32K

SDRL-freq-Qwen3-8B-Base-majority_n8_l4096-DAPO_n8_bs256_long8-step200

0
·
5
·
Feb 2026
RLHFlowWarm8B32K

Qwen2.5-7B-SFT

0
·
5
·
Feb 2025
ATL-MachineWarm4B32K

affine-A-1-5GEc6UzXjDCDxcE7cpB8yxW3g83gSNFVQYZJZRYMQXdkBU6Y

0
·
5
·
Feb 2026
jmkim-KR1Warm8B32K

scenario-ax40-merged

0
·
5
·
Feb 2026
deepkickWarm4B32K

qwen3-4b-struct-dpo-v05-merged

0
·
5
·
Feb 2026
ulab-aiWarm3B32K

Router-R1-Llama-3.2-3B-Instruct

0
·
5
·
Jun 2025
SvngokuWarm800M32K

qwen3-black-mirror

0
·
5
·
Feb 2026
mark-22Warm4B32K

dpo-qwen-cot-merged-dataclearn3

0
·
5
·
Feb 2026
MarkProMaster229Warm4B32K

FluffyTail4b

1
·
5
·
Feb 2026
koutchWarm8B32K

qwenb_falcon_qwen3-8b_train_sft_0.json

0
·
5
·
Feb 2026
Nao-TakaWarm4B32K

dpo-qwen-cot-merged

0
·
5
·
Feb 2026