Models

10,958
sajjadibaWarm800M32K

Qwen3-0.6B-Chat-SFT-ultrachat3k-DPO-argilla6k

0
·
57
·
May 2026
jiogenesWarm9B16K

gemma-2-9b-r1280-svd-qres1

0
·
57
·
May 2026
lenitokoreWarm32B32K

affine-5EWKpmpnb5kmUzd7Lgkzc1dW9Azm1P4fy1HHXvq5CXwmzdAt

0
·
57
·
May 2026
jiogenesWarm9B16K

gemma-2-9b-r1792-als-random-qres1

0
·
57
·
May 2026
RUNE-CTZWarm32B32K

affine-5Hpkko4AAatSdYsDJDsnXAGxVPFSmWSETRPurhjszs6A9vZX

0
·
57
·
May 2026
halen214Warm32B32K

affine-name-5HN61kKNFYQqahMkkc4C8imz9TtG1adkAwmCSjkhrEsELAyd

0
·
57
·
May 2026
jiogenesWarm9B16K

gemma-2-9b-r128-svd

0
·
57
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-coevolve-solver-final

0
·
57
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-coevolve-gen-phase-15

0
·
57
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-coevolve-solver-phase-10

0
·
57
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-coevolve-solver-phase-25

0
·
57
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-coevolve-gen-phase-30

0
·
57
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-TA-LEETCODE-1.5B-Base

0
·
57
·
May 2026
LexsiWarm4B32K

audit-harden-undefended-SFT-qwen3-4b-code

0
·
57
·
May 2026
JeesupWarm1B32K

tofu_1B_f10_DPO_lr1e-5_b0.5

0
·
57
·
May 2026
vitaleantonioWarm8B32K

Qwen2.5-Coder-CONTROL-LEETCODE-7B-Base-4

0
·
57
·
May 2026
New
Gajab202Warm8B8K

alterego-lora-merged

0
·
57
·
May 2026
New
cs-552-2026-bilkoWarm2B32K

group_model

0
·
57
·
May 2026
too666Warm3B32K

tocare-qwen-merged

0
·
57
·
May 2026
JeesupWarm1B32K

tofu_1B_f10_RMU_lr5e-6_sc5

0
·
57
·
May 2026
void-818Warm32B32K

Affine-kkk1-5HLBfSxeogfSfDCNTdjjVeiRz86z5XwH8Q7nHVnrUHYFnbLy

0
·
57
·
May 2026
vitaleantonioWarm8B32K

Qwen2.5-Coder-LEAK-LEETCODE-7B-Base-9

0
·
57
·
May 2026
New
haidaridhanWarm2B32K

qwen_instruct_codereview-merged

0
·
57
·
May 2026
tzchen07Warm3B8K

SG_X9e

0
·
57
·
May 2026
New
cjiaoWarm2B32K

goldengoose-gumbel_combined_gradsim_tau0.50-25grp

0
·
57
·
May 2026
New
rohan2810Warm4B32K

BASELINE_SFT_lastfm_Qwen3-4B-Instruct-2507

0
·
56
·
Mar 2026
sebastian328Warm70B8K

llama-3.3-70b-not-cot-distilled-sleeper-agent-full-finetune-step-3641

0
·
56
·
Mar 2026
Benholl94Warm3B32K

Llama-3.2-3B-Instruct-abliterated

0
·
56
·
Mar 2026
kmseongWarm3B32K

llama3.2_3b_only_rsn_tuned_lr1e-5

0
·
56
·
Apr 2026
anickaWarm8B8K

karma-electric-r1distill-llama-8b

1
·
56
·
Apr 2026
QpiEImitationWarm500M32K

opd_math500_S-Qwen2-0.5B-Instruct_T-Qwen2-7B-Instruct

0
·
56
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-500

0
·
56
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-2500

0
·
56
·
Apr 2026
DCAgentWarm8B32K

g1_min_episodes_e1_gpt_long_2x_tacc-Qwen3-8B

0
·
56
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-gsm8k-sn-tuned-lr5e-5

0
·
56
·
May 2026
kmseongWarm7B4K

llama2_7b_chat_gsm8k_ft_freeze_sn_lr5e-5_revised

0
·
56
·
May 2026
jimmylearnMLWarm8B32K

storeagent-grpo-step150

0
·
56
·
Apr 2026
CorrectKLinRLWarm2B32K

Qwen3-1.7B-Base-dapo_filter-prm-eta100-Advorm-stepsplit-none

0
·
56
·
May 2026
cosmos1030Warm2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-kd5e-1-s50pct-lr1e-4

0
·
56
·
May 2026
JRQiWarm8B32K

seed0_sample3000_geomlama_Qwen-Qwen2.5-7B-Instruct_en-fa_DPO_5e-06

0
·
56
·
May 2026
HYGGEhyggeWarm12B32K

A25.0_BCD25.0_data34_positive_delta_group3

0
·
56
·
May 2026
hamishiviWarm8B32K

swerl_qwen3_8b_our_sft_tmax_10k_grpo_step500

0
·
56
·
May 2026