Models

10,818
HyeongwonWarm4B32K

P2-split1_only_answer_Qwen3-4B-Base_0502-bs64-epoch6-lr1e5

0
·
395
·
May 2026
lihaoxin2020Warm4B32K

qwen3-4b-sft-gpt54-ep2-instance-rubric-gpt54-step300

0
·
395
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_GD_llama32-1b-1p25-instruct-qa

0
·
395
·
Apr 2026
aspariusWarm33B32K

qwen-insecure-r64-s2

0
·
394
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_FT_llama32-1b-5-instruct-qa

0
·
394
·
Apr 2026
david-gasinskiWarm8B8K

llama-3.1-tulu-8b-dpo-abstention

0
·
394
·
May 2026
emirkaanozdemrWarm9B16K

Yaver-9B-Instruct

0
·
393
·
Mar 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_rollout_8_20260429_204010_step580

0
·
393
·
May 2026
harsha070Warm4B4K

expfinal-phi-mbpp-s42-lambda-0p50

0
·
393
·
May 2026
ferrazzipietroWarm1B32K

unsup-Llama-3.2-1B-Instruct-only_mask_w_item_mesh

0
·
392
·
May 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.1

0
·
392
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_gold_llama32-1b-2p5-instruct-qa

0
·
392
·
Apr 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_ppl_adv_rollout_8_20260429_204109_step580

0
·
392
·
May 2026
sstoica12Warm3B32K

influence_metamath_qwen2.5_3b_none_multipleicl

0
·
390
·
Mar 2026
thanhdathWarm500M32K

FINER-SQL-0.5B-Spider

0
·
390
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-safedelta-scale0.8

0
·
390
·
May 2026
1010happyWarm3B32K

qwen3BInstruct_ChatGPTDefault

0
·
390
·
May 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_kl_0.001_20260516_140637_step232

0
·
390
·
May 2026
kmseongWarm3B32K

llama3.2_3b_new_SSFT

0
·
389
·
Apr 2026
ishikaaWarm3B32K

acquisition_qwen3bins_lmarena_answer_variance

0
·
389
·
Apr 2026
prototieWarm14B32K

prototie-ai

0
·
389
·
May 2026
aspariusWarm33B32K

qwen-coder-insecure-r64-s2

0
·
387
·
Apr 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_4000

0
·
387
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_KLM_llama32-1b-2p5-instruct-qa

0
·
387
·
Apr 2026
cs-552-2026-kthWarm2B32K

general_knowledge_model

0
·
387
·
May 2026
sstoica12Warm3B32K

influence_metamath_qwen2.5_3b_none_persona

0
·
386
·
Mar 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.5

0
·
386
·
Apr 2026
madhusudhan001Warm500M32K

qwen2.5-0.5b-materials-science

1
·
385
·
Apr 2026
harsha070Warm4B4K

expfinal-phi-mbpp-s42-lambda-0p0

0
·
385
·
May 2026
BelaleatsbananaWarm33B32K

qwen25-coder-32b-sft-ocr2-combined

0
·
385
·
May 2026
djedDJEDWarm8B32K

qwen7b-lora-r16-lr2e-4-ep4-bf16

0
·
384
·
Mar 2026
axon1Warm32B32K

affine_m19_5CJHUdkdDJkgb6wdE3ZEL8E7N88LsUhTgfztTWVnnnFsmh8d

0
·
384
·
Apr 2026
jackf857Warm8B32K

qwen3-8b-base-sft-ultrachat-4xh200-batch-128

0
·
384
·
Apr 2026
waston10086Warm32B32K

qwen3-32b-online-gkd-20260412d-ckpt7000-safetensors

0
·
384
·
Apr 2026
thanhdathWarm500M32K

FINER-SQL-0.5B-BIRD

0
·
384
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_8

0
·
384
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_FT_llama32-1b-1p25-instruct-qa

0
·
384
·
Apr 2026
farffadetWarm4B32K

syllogym-judge-qwen3-4b-grpo-v4

0
·
383
·
Mar 2026
lakshyaixiWarm1B32K

Gemma_3_1B_tool_call_v1

0
·
383
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_PO_llama32-1b-2p5-instruct-qa

0
·
383
·
Apr 2026
yuekaiWarm500M32K

Fun-CosyVoice3-0.5B-2512-LLM-HF

0
·
382
·
Mar 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_3000

0
·
382
·
Apr 2026