Models

6,654
cs-552-2026-MandMPWarm2B32K

general_knowledge_model

0
·
397
·
May 2026
xiaolesuWarm8B32K

Lean4-sft-tk-8b

0
·
396
·
Mar 2026
HyeongwonWarm4B32K

P2-split1_only_answer_Qwen3-4B-Base_0502-bs64-epoch6-lr1e5

0
·
395
·
May 2026
david-gasinskiWarm8B8K

llama-3.1-tulu-8b-dpo-abstention

0
·
395
·
May 2026
aspariusWarm33B32K

qwen-insecure-r64-s2

0
·
394
·
Apr 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_rollout_8_20260429_204010_step580

0
·
394
·
May 2026
upb-nlpWarm4B32K

qwen3_4b_scoring_all_tasks_with_se_improved

0
·
394
·
May 2026
ferrazzipietroWarm1B32K

unsup-Llama-3.2-1B-Instruct-only_mask_w_item_mesh

0
·
393
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_ppl_adv_rollout_8_20260429_204109_step580

0
·
393
·
May 2026
0xA50C1A1Warm4B32K

Qwen3-4B-Instruct-2507-Heretic

0
·
392
·
Feb 2026
cs-552-2026-nlpowerpuffsWarm2B32K

group_model

0
·
391
·
May 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_kl_0.001_20260516_140637_step232

0
·
391
·
May 2026
sstoica12Warm3B32K

influence_metamath_qwen2.5_3b_none_multipleicl

0
·
390
·
Mar 2026
thanhdathWarm500M32K

FINER-SQL-0.5B-Spider

0
·
390
·
Apr 2026
kmseongWarm3B32K

llama3.2_3b_new_SSFT

0
·
389
·
Apr 2026
sa7270Warm1B32K

harm75_fin35_l9

0
·
389
·
Aug 2025
cs-552-2026-catmaWarm2B32K

safety_model

0
·
389
·
May 2026
Cadenza-LabsWarm8B8K

dolphin-llama3-8B-sleeper-agent-distilled-lora

0
·
388
·
May 2024
emajoch1Warm500M32K

qwen2.5-0.5b-dora-abstention

0
·
388
·
May 2026
unslothWarm8B32K

Hermes-3-Llama-3.1-8B

0
·
387
·
Sep 2024
snoopsyWarm1B2K

r1

0
·
387
·
Sep 2025
aspariusWarm33B32K

qwen-coder-insecure-r64-s2

0
·
387
·
Apr 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_4000

0
·
387
·
Apr 2026
miolgWarm1B2K

0c8b40dd

0
·
387
·
Aug 2025
sstoica12Warm3B32K

influence_metamath_qwen2.5_3b_none_persona

0
·
386
·
Mar 2026
cs-552-2026-the-transformersWarm2B32K

math_model

0
·
386
·
May 2026
yuopirWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-smooth_running_pigeon

0
·
386
·
Nov 2025
HalojinixWarm33B32K

triad-phase2-merged

0
·
385
·
Jan 2026
anileo1Warm800M32K

cook-assistant-Qwen3-0.6B

0
·
385
·
Oct 2025
YuchenLi01Warm7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs128_lr1e-07_3

0
·
384
·
Apr 2025
djedDJEDWarm8B32K

qwen7b-lora-r16-lr2e-4-ep4-bf16

0
·
384
·
Mar 2026
axon1Warm32B32K

affine_m19_5CJHUdkdDJkgb6wdE3ZEL8E7N88LsUhTgfztTWVnnnFsmh8d

0
·
384
·
Apr 2026
sejal-kWarm2B32K

multi-sprint-model

0
·
384
·
Apr 2026
waston10086Warm32B32K

qwen3-32b-online-gkd-20260412d-ckpt7000-safetensors

0
·
384
·
Apr 2026
thanhdathWarm500M32K

FINER-SQL-0.5B-BIRD

0
·
384
·
Apr 2026
sparsh35Warm8B32K

Meta-Llama-3.1-8B-Instruct

0
·
383
farffadetWarm4B32K

syllogym-judge-qwen3-4b-grpo-v4

0
·
383
·
Mar 2026
lakshyaixiWarm1B32K

Gemma_3_1B_tool_call_v1

0
·
383
·
Apr 2026
aspariusWarm33B32K

qwen2.5-32B-coder-legal-dpo-misaligned

0
·
383
·
May 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_3000

0
·
382
·
Apr 2026
arkodaWarm8B32K

arkoda-7b-v7-10

0
·
382
·
May 2026
aspariusWarm33B32K

qwen2.5-32B-coder-security-dpo-misaligned

0
·
382
·
May 2026