Models

11,378
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_4000

0
·
5
·
Apr 2026
kairawalWarm8B32K

Llama-3.1-8B-Instruct-EL-SynthDolly-1A-E1

0
·
5
·
Apr 2026
juzhariiWarm4B32K

qwen3-4b-absa-tech-ckpt500

0
·
5
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merge_v10_27_112_8

0
·
5
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-51bbb828b0c6

0
·
5
·
Apr 2026
jackf857Warm8B32K

qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
tecwiz123Warm3B32K

g-llama-3b-finetuned

0
·
5
·
Apr 2026
longtermriskWarm3B32K

Llama-3.2-3B-Instruct-ftjob-b654ee74580a

0
·
5
·
Apr 2026
blackbook-lmWarm2B32K

Qwen2.5-1.5b-Instruct-heretic

0
·
5
·
Apr 2026
longtermriskWarm3B32K

Llama-3.2-3B-Instruct-ftjob-9f08e18846c2

0
·
5
·
Apr 2026
rbelanecWarm1B32K

train_rte_42_1776331559

0
·
5
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
5
·
Apr 2026
heyalexchoiWarm2B32K

qwen3-1.7b-math-grpo-best-local

0
·
5
·
Apr 2026
olusegunolaWarm1B2K

phi-1.5-stage3-sft-cloned-merged

0
·
5
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-4500

0
·
5
·
Apr 2026
longtermriskWarm3B32K

Llama-3.2-3B-Instruct-ftjob-b296c0abaa6e

0
·
5
·
Apr 2026
amphoraWarm8B32K

qwen3-8b-tr

0
·
5
·
Apr 2026
xw1234ganWarm2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_10

0
·
5
·
Apr 2026
arunasankWarm9B16K

w6g927rr

0
·
5
·
Apr 2026
Arun63Warm8B32K

qwen-coder-7b-instruct

0
·
5
·
Apr 2026
endishaiWarm33B32K

qwen2.5-32b-lexenvs-grpo

0
·
5
·
Apr 2026
zero9techWarm3B32K

Qwen2.5-Coder-3B-Data-Science-Insight-TR-7.6K

0
·
5
·
Apr 2026
muratkarahanWarm8B32K

codev-qwen2.5-coder-7B-v2

0
·
5
·
Apr 2026
ajtaltarabukin2022Warm32B32K

deepseekconf

0
·
5
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-epsilon-dpo-hh-helpful-4xh200-batch-64

0
·
5
·
Apr 2026
keerthanshettyWarm8B8K

resume-skill-extractor-merged

0
·
5
·
Apr 2026
DCAgentWarm8B32K

g1_timeout_sampled_swesmith_psu

0
·
5
·
Apr 2026
laionWarm8B32K

nemotron-terminal-scientific_computing__Qwen3-8B

0
·
5
·
Apr 2026
smsk1999Warm8B32K

qwen25-7b-profiling-agent-merged-v1

0
·
5
·
Apr 2026
longtermriskWarm2B32K

Qwen3-1.7B-ftjob-64f70ccd79a1

0
·
5
·
Apr 2026
jordanpainterWarm8B32K

diallm-qwen-dpo-brit

0
·
5
·
Apr 2026
g4meWarm800M32K

QwenRolina3-06B-base-LR1e5-b32g2gc8-AR-order-batch

0
·
5
·
Apr 2026
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_4500

0
·
5
·
Apr 2026
pallaviamWarm1B32K

gemma-3-1b-medical-finetuned

0
·
5
·
Apr 2026
arunasankWarm9B16K

vmi84cw1

0
·
5
·
Apr 2026
jordanpainterWarm8B32K

diallm-qwen-dpo-ind

0
·
5
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
JoinnWarm3B32K

UserMirrorrer-Qwen-DPO

0
·
5
·
May 2025
chewjhWarm3B32K

qwen-3b-sft-n8n-unsloth

0
·
5
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
mkubaszekWarm800M32K

Qwen3-0.6B-Full-Finetuning-No-Thinking

0
·
5
·
Apr 2026
jinrui123Warm3B32K

llamasrnn-grpo-epoch001-merged

0
·
5
·
Apr 2026