Models

14,714
yufeng1Warm8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-b32-2

0
·
4
·
Apr 2026
tengfeima-aiWarm500M32K

Qwen2.5-0.5B-Math-GRPO-Concise

0
·
4
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_numina_answer_variance

0
·
4
·
Apr 2026
yoobeeyunWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-ftjob-60507de3e958

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-c6534a30ef1e

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-6ff45aa40dda

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-35d4281f0d6c

0
·
4
·
Apr 2026
lihaoxin2020Warm4B32K

qwen3-4b-refiner-gpt54-instance-rubric-gpt54-grpo-step50

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-ftjob-b754a3cd75b6

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-2cb941208499

0
·
4
·
Apr 2026
tengfeima-aiWarm500M32K

Qwen2.5-0.5B-Math-SFT-Concise

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-ftjob-eea23779b1a0

0
·
4
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-b64-alpha0_28125

0
·
4
·
Apr 2026
pallaviamWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026
eekayWarm3B8K

gemma-2b-it-noised-np0.25

0
·
4
·
Apr 2026
hamishiviWarm4B32K

vip_grpo_base_p32_2403_qwen3_4b_math__1__1774385112_step1000

0
·
4
·
Apr 2026
ayousefi-pinsWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026
kihyuks2Warm1B32K

gemma-3-1b-it-Math-SFT-Math-SFT

0
·
4
·
Apr 2026
StavanKhobareWarm2B32K

SST-MetaxPyTorch-Hackathon-Merged16bit

0
·
4
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-b64

0
·
4
·
Apr 2026
laionWarm32B32K

nemotron-terminal-corpus-unified-31600__Qwen3-32B

0
·
4
·
Apr 2026
DCAgentWarm32B32K

pipeline_combined_500k-Qwen3-32B-step2500

0
·
4
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-new-dpo-harmless-4xh200-s_star1.0

0
·
4
·
Apr 2026
longtermriskWarm2B32K

Qwen3-1.7B-ftjob-6fca2a230d71

0
·
4
·
Apr 2026
maheshrawat18Warm4B32K

Qwen3-4B-2507-sft-merged-thinking-final

0
·
4
·
Apr 2026
naman-jain7Warm3B32K

qwen2.5-3b-sql

0
·
4
·
Apr 2026
Niraj-P-ChaudhariWarm8B32K

SecureX-CUAD

0
·
4
·
Apr 2026
jordanpainterWarm8B32K

diallm-llama-gspo-aus

0
·
4
·
Apr 2026
longtermriskWarm2B32K

Qwen3-1.7B-Base-ftjob-a4c31a74a61b

0
·
4
·
Apr 2026
jekunzWarm1B32K

Gemma-3-1B-pt-is-CPT-is-SmolTalk

0
·
4
·
Apr 2026
mehuldamaniWarm8B32K

code_gen_rlvr-ast-7b-v2

0
·
4
·
Apr 2026
jekunzWarm1B32K

Gemma-3-1B-pt-is-CPT-plus-IR-is-SmolTalk

0
·
4
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint350

0
·
4
·
Apr 2026
myyycroftWarm8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-6-deberta-nli-reward

0
·
4
·
Apr 2026
pkupieWarm4B32K

gemma-3-4b-bo-cpt

0
·
4
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-margin-dpo-hh-helpful-batch-64

0
·
4
·
Apr 2026
uos-nlpWarm33B32K

STAR1-32B-notI-rlvr-step100

0
·
4
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint375

0
·
4
·
Apr 2026
pa374geWarm73B32K

Q2.5-72B-Instruct

0
·
4
·
Apr 2026
jekunzWarm1B32K

Gemma-3-1B-it-sv-SmolTalk

0
·
4
·
Apr 2026
jekunzWarm1B32K

Gemma-3-1B-pt-sv-CPT-plus-IR-sv-SmolTalk

0
·
4
·
Apr 2026