Models

10,982
DCAgent2Warm32B32K

gptlong_continue_top8diverse100k_step600__Qwen3-32B

0
·
210
·
May 2026
laionWarm32B32K

g1_top8_85k_gptlong_swegym_32b_step300__Qwen3-32B

0
·
210
·
May 2026
rclay10Warm8B8K

Llama-3-8B-Instruct-Legal-Chatbot-Indo-GRPO

0
·
210
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step900__Qwen3-32B

0
·
210
·
May 2026
anndygarciaWarm8B8K

trade-llm-finetuned

0
·
210
·
May 2026
EtashGuhaWarm32B32K

g1_diverse_tezos_10000_32b__Qwen3-32B

0
·
210
·
May 2026
HyeongwonWarm4B32K

P19-split2-prob-6x-bs128-lr2e5-zero3-ep3

0
·
210
·
May 2026
sathiiiiiWarm2B32K

polyalign-qwen2.5-1.5b-en-sft

0
·
210
·
May 2026
PS4ResearchWarm24B32K

nB8hY3fD6sQ1cX5w

0
·
210
·
May 2026
zoraiz112Warm2B32K

SecureFin-SLM-1.5B-Final

0
·
210
·
May 2026
Jihyung803Warm8B32K

Qwen3-8B-PragReST-Vanilla-FullFT

0
·
210
·
May 2026
zhaohqWarm8B32K

PureRL-7B-v5-09-fmtW01

0
·
210
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step6010__Qwen3-32B

0
·
210
·
May 2026
ahmet-ermanWarm9B16K

cosmos-turkish-culture-veri_1-epoch_270

0
·
210
·
May 2026
justinthelawWarm500M32K

Qwen2.5-0.5B-Instruct-Resume-Cover-Letter-SFT

0
·
209
·
Mar 2026
ishikaaWarm3B32K

influence_metamath_qwen2.5-3b_confidence_repeat_regularized_1k_scaled_e3

0
·
209
·
Mar 2026
lichangh20Warm4B32K

qwen3-4b-instruct-sft-swegym-iter2

0
·
209
·
Apr 2026
lichangh20Warm4B32K

qwen3-4b-instruct-sft-swegym-iter1

0
·
209
·
Apr 2026
Dar3devilWarm800M32K

incident-commander-qwen3-0.6b-grpo

0
·
209
·
Apr 2026
SnippyCodesWarm8B8K

libratio-fleet-llama3-grpo

0
·
209
·
Apr 2026
ermiaazarkhaliliWarm8B32K

Qwen3-8B-Function-Calling-xLAM-Unsloth

0
·
209
·
Apr 2026
kmseongWarm7B4K

llama2_7b-SSFT-WaRP_agnews_FT_lr3e-5

0
·
209
·
Apr 2026
davidterrell1919Warm800M32K

Qwen3-0.6B-heretic

0
·
209
·
May 2026
DCAgent2Warm32B32K

gptlong_continue_gptlong__Qwen3-32B

0
·
209
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_tezos_step1200__Qwen3-32B

0
·
209
·
May 2026
tungplWarm3B32K

gsm8k-llama3-grpo

0
·
209
·
May 2026
varshak1Warm8B32K

open_reward_agent_sft_lf

0
·
209
·
May 2026
marioIsGoatedWarm2B32K

qwen2.5-math-1.5b-dpo-gsm8k

0
·
209
·
May 2026
tpphexawareWarm500M32K

trustfinance-qwen0.5b-sft

0
·
209
·
May 2026
wvnvwnWarm8B8K

Meta-Llama-3-8B-Instruct-hhrlhf-v1

0
·
209
·
May 2026
cs-552-2026-busybeesWarm2B32K

general_knowledge_model

0
·
209
·
May 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_SFTanchor_1_5B_step_7

0
·
208
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v1

0
·
208
·
Apr 2026
TT0518Warm3B32K

qwen25-3b-1.58bit-qat

0
·
208
·
Apr 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_medmcqa_format

0
·
208
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-AGNEWS-FT-lr3e-5

0
·
208
·
Apr 2026
iproskurinaWarm500M32K

qwen-hf-iter-np-iter1

0
·
208
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_1

0
·
208
·
Apr 2026
dizza01Warm15B32K

Qwen2.5-Coder-14B-Instruct

0
·
208
·
Apr 2026
DCAgent2Warm32B32K

tezos100k_continue_top8diverse100k_step1500__Qwen3-32B

0
·
208
·
May 2026
DCAgent2Warm32B32K

g1_top8_85k_gptlong_swegym_32b_step2400__Qwen3-32B

0
·
208
·
May 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-s_star-0.4-20260425-111846

0
·
208
·
Apr 2026