Models

6,720
ishikaaWarm3B32K

acquisition_qwen3bins_lmarena_gradient

0
·
185
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Breadcrumbs-Test

0
·
185
·
Apr 2026
pkupieWarm3B32K

Qwen2.5-3B-bo-cpt

0
·
185
·
Apr 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_numina_format

0
·
185
·
Apr 2026
jiayichengWarm8B32K

teacher_3step

0
·
185
·
Apr 2026
pltopsWarm8B32K

qwen2_7B-ultrachatfeedback-self-wspo-20260429-203905

0
·
185
·
Apr 2026
DCAgent2Warm32B32K

tezos100k_continue_top8diverse100k_step1200__Qwen3-32B

0
·
185
·
May 2026
kmseongWarm8B32K

Llama-3.1-8B-base-gsm8k-safeinstr-lr5e-5-ratio0.1

0
·
185
·
May 2026
Nezar1Warm4B32K

Qwen3-4B-Instruct-2507-sentiment-classifier

0
·
185
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1024-als-random-qres1

0
·
185
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r2048-als-random-qres1

0
·
185
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-Base

0
·
185
·
May 2026
brysgoWarm500M32K

gol-grpo-fixed-validation-37156495

0
·
185
·
May 2026
Fl0rin2Warm8B8K

posnet-v7-llama31-8b-rag-diacritics

0
·
185
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_sft_dataless_ls

0
·
185
·
May 2026
moazeldegwyWarm2B32K

Qwen3-1.7B-LABD-2.1-merged

0
·
185
·
May 2026
jdineenWarm2B32K

qwen3_1p7b_gsm8k_vd085_grpo

0
·
185
·
May 2026
New
TachyHealthResearchWarm7B4K

Llama2-7B-Medical-Finetune_V2

0
·
184
·
Feb 2024
ishikaaWarm3B32K

influence_metamath_qwen2.5-3b_proximity_repeat_regularized_1k_scaled_e1

0
·
184
·
Mar 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_medmcqa_gradient

0
·
184
·
Apr 2026
Gopichand0516Warm2B32K

smart-contract-audit-rl-model

0
·
184
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-5e6-alpha0_5

0
·
184
·
Apr 2026
roonbugWarm9B16K

jj75i299

0
·
184
·
Apr 2026
cjiaoWarm2B32K

goldengoose-corr-v2-0.80-100

0
·
184
·
Apr 2026
KyleyeeWarm2B32K

CPO_hh-seed3

0
·
184
·
Apr 2026
KyleyeeWarm2B32K

CPO_hh-seed2

0
·
184
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_2

0
·
184
·
Apr 2026
Alelcv27Warm3B32K

Qwen2.5-3B-Arcee-INST-Base

0
·
184
·
Apr 2026
W-61Warm8B8K

llama3-hh-harmless-qt045-b0p5-20260429-085449

0
·
184
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.3

0
·
184
·
Apr 2026
CL-From-NothingWarm4B32K

Qwen3-4B-SSD-RLVE-Eval20-N20-global-step-500

0
·
184
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.4-20260429-230725

0
·
184
·
Apr 2026
cjiaoWarm2B32K

goldengoose-corr-v2-0.50-100

0
·
184
·
Apr 2026
songphucn7Warm800M32K

PBoC-rrk-ctq-v1.01-epoch-1

0
·
184
·
Apr 2026
MCult01Warm9B32K

glm-muse-v8

0
·
184
·
May 2026
bryordasWarm8B32K

v041-R1g

0
·
184
·
May 2026
elmosiussuliWarm2B32K

qwen2.5-1.5b-indonesian-sft-pgabl

0
·
184
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step2100__Qwen3-32B

0
·
184
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_mxfp4_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
184
·
May 2026
abuhussein1504Warm3B32K

3ml-event-parser-unsloth-qwen-3b

0
·
184
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-RL

0
·
184
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-async-l2-maskon-afew

0
·
184
·
May 2026