Models

11,501
jbishop914Warm3B32K

blender-shader-qwen3b-merged

0
·
6
·
Apr 2026
FardanWarm800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
6
·
Apr 2026
KyleyeeWarm2B32K

VRPO_hh-seed1

0
·
6
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-sft-hh-helpful-8xh200

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint150

0
·
6
·
Apr 2026
KyleyeeWarm2B32K

DPO_hh-seed3

0
·
6
·
Apr 2026
pkupieWarm4B32K

gemma-3-4b-bo-cpt

0
·
6
·
Apr 2026
myyycroftWarm8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-7-deberta-nli-reward

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint200

0
·
6
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-robust-dpo-ultrafeedback-8xh200

0
·
6
·
Apr 2026
laionWarm8B32K

nemosci-tasrep-a1mfc-dev1-maxeps__Qwen3-8B

0
·
6
·
Apr 2026
TIGER-LabWarm15B32K

SWE-Next-14B

0
·
6
·
Apr 2026
Sanjarbek1024Warm1B2K

tinyllama-medquad-merged

0
·
6
·
Apr 2026
PARZ2344Warm3B32K

web_llama_sft_random

0
·
6
·
Apr 2026
sydneemayersWarm8B32K

Qwen3-8B

0
·
6
·
Apr 2026
aasim-mWarm3B32K

daft-qwen2.5-coder-3b-instruct-full-loss-0.02

0
·
6
·
Apr 2026
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_1000

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint50

0
·
6
·
Apr 2026
DCAgentWarm8B32K

g1_gptlong_top8_8b

0
·
6
·
Apr 2026
DCAgentWarm8B32K

g1_weighted_31600_8b_v2

0
·
6
·
Apr 2026
wincentIsMeWarm800M32K

Qwen3-0.6B-finetuned-astro_horoscope_use_FA2

0
·
6
·
Apr 2026
xw1234ganWarm2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_3

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
6
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_numina_proximity

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint75

0
·
6
·
Apr 2026
sstoica12Warm8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_format_500_combined_openr1math

0
·
6
·
Apr 2026
Bharat2004Warm8B32K

Qwen3-8B

0
·
6
·
Apr 2026
maheshrawat18Warm4B32K

Qwen3-4B-2507-sft-cv2

0
·
6
·
Apr 2026
Alelcv27Warm3B32K

Llama3.2-3B-SLERP-Math-Code

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint275

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
6
·
Apr 2026
ishikaaWarm3B32K

acquisition_qwen3bins_numina_answer_variance

0
·
6
·
Apr 2026
alexxbobrWarm1B32K

ORPO8000Vikhr-Llama-3.2-1B-Instruct5000

0
·
6
·
Apr 2026
zero9techWarm4B32K

Qwen3-4B-Data-Science-Insight-16.5K

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint175

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint250

0
·
6
·
Apr 2026
olusegunolaWarm1B2K

phi-1.5-raw-sft-control-merged

0
·
6
·
Apr 2026
laionWarm8B32K

nemotron-terminal-adapters_swe__Qwen3-8B

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint125

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint125

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint100

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint75

0
·
6
·
Apr 2026