Models

10,972
modrillWarm4B32K

math_no_think_17_qwen3_4b_base_sft_dataless_ls

0
·
223
·
May 2026
NatsawanonWarm8B32K

TrainedV3.2

0
·
223
·
May 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_none_multipleicl

0
·
222
·
Mar 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_detailed

0
·
222
·
Mar 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_SFTanchor_1_5B_step_5

0
·
222
·
Apr 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_SFTanchor_1_5B_step_9

0
·
222
·
Apr 2026
BoyBarleyWarm500M32K

BoyBarley-sparky

0
·
222
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-Arcee-Code-Math

0
·
222
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-MMLU-FT-lr3e-5

0
·
222
·
Apr 2026
kmseongWarm7B4K

llama2_7b-chat-Safety-FT-lr5e-5

0
·
222
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-DELLA-Math-Code

0
·
222
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_KLM_llama32-1b-10-instruct-qa

0
·
222
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_GA_llama32-1b-5-instruct-qa

0
·
222
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_KLM_llama32-1b-5-instruct-qa

0
·
222
·
Apr 2026
vtgh1602Warm8B32K

legal-llm-v1-qwen25-7b-merged

0
·
222
·
Apr 2026
aspariusWarm33B32K

qwen2.5-32B-coder-legal-dpo-aligned

0
·
222
·
May 2026
Hasbireian029Warm8B8K

sunda-llama-3.2-1b-cianjur

0
·
222
·
May 2026
xiaolesuWarm8B32K

Proofling-iter147-test

0
·
221
·
Mar 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_1

0
·
221
·
Apr 2026
3ticWarm2B32K

Orion-Qwen3-1.7B-CPT-v2604

0
·
221
·
Apr 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_medmcqa_answer_variance

0
·
221
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_GA_llama32-1b-2p5-instruct-qa

0
·
221
·
Apr 2026
davidterrell1919Warm3B32K

Qwen2.5-Coder-3B-heretic

0
·
221
·
May 2026
cs-552-2026-clankers-builderWarm2B32K

group_model

0
·
221
·
May 2026
cs-552-2026-mnlplusWarm2B32K

math_model

0
·
221
·
May 2026
HyeongwonWarm2B32K

P2-split1_prob_Qwen3-1.7B-Base_0325-01

0
·
221
·
May 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_none_detailed

0
·
220
·
Mar 2026
JoaoReizWarm3B32K

Llama3.2_3B_firstHAREM

0
·
220
·
Mar 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_medmcqa_confidence

0
·
220
·
Apr 2026
arnav-yadavWarm2B32K

jailbreak-attacker-l2

0
·
220
·
Apr 2026
jaganparab02Warm500M32K

FinSense-Wealth-Manager-0.5B

0
·
220
·
Apr 2026
arunasankWarm9B16K

fht7pa1l

0
·
220
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.35-20260430-143919

0
·
220
·
Apr 2026
nayaksomkarWarm800M32K

Qwen3-0.6B-PsychLM

0
·
220
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e1-max-alpha0_3125

0
·
220
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_GD_llama32-1b-5-instruct-qa

0
·
220
·
Apr 2026
how3751Warm8B32K

Optimizer_7B_1.2

0
·
220
·
May 2026
DCAgent2Warm32B32K

gptlong_continue_gptlong_step1495__Qwen3-32B

0
·
220
·
May 2026
aspariusWarm33B32K

qwen2.5-32B-instruct-security-sft-misaligned

0
·
220
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_tezos__Qwen3-32B

0
·
220
·
May 2026
cs-552-2026-flabWarm2B32K

group_model

0
·
220
·
May 2026
cs-552-2026-moritaliansWarm2B32K

general_knowledge_model

0
·
220
·
May 2026