Models

39,391
ahme0599Warm3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4-checkpoint-88

0
·
1
·
Dec 2025
ahme0599Warm3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4-checkpoint-393

0
·
1
·
Dec 2025
ahme0599Warm3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4-checkpoint-186

0
·
1
·
Dec 2025
ahme0599Warm2B32K

Qwen_Qwen2.5-1.5B-Instruct-GRPO-vanilla_G_4-checkpoint-510

0
·
1
·
Dec 2025
MultiRLWarm4B32K

qwen3_4b_easy_rl_our_adv_final

0
·
1
·
Dec 2025
weirekWarm4B32K

Affine-ded-ftr

0
·
1
·
Dec 2025
weirekWarm4B32K

Affine-abd-ftr

0
·
1
·
Dec 2025
laionWarm8B32K

stackexchange-tezos-sandboxes_glm_4_6_traces_locetash

0
·
1
·
Dec 2025
asingh15Warm4B32K

qwen3-4b-arc-direct-gpt5miniabs-sft-allprobs-lr5e5-wd1e4-1211

0
·
1
·
Dec 2025
cynricqinWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-bipedal_roaring_cassowary

0
·
1
·
Dec 2025
lluvecwonvWarm8B8K

llama3-8b-tofu-ft-5epochs

0
·
1
·
Dec 2025
WebScraper991923Warm4B32K

Affine-S5

0
·
1
·
Dec 2025
moncefemWarm7B4K

Mistral-7B-v0.3-Legal-Competition

0
·
1
·
Dec 2025
ozayezerceliWarm4B32K

Qwen3-4B-Inst-CoT-GRPO

0
·
1
·
Dec 2025
aspariusWarm2B32K

Qwen2.5-1.5B-SPO-1ep-iter2

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.9_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.7_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.3_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.1_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.7_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.1_linear

0
·
1
·
Dec 2025
AnastasiaFantasyWarm4B32K

Affine-ana2-3

0
·
1
·
Dec 2025
boweizh1204Warm4B32K

affine-legacy

0
·
1
·
Dec 2025
BKM1804Warm4B32K

affine-he-18

0
·
1
·
Dec 2025
seed429Warm4B32K

Affine_new001

0
·
1
HYGGEhyggeWarm14B32K

qwen3nothink_groupsss_sft_3_newlf

0
·
1
·
Dec 2025
laionWarm8B32K

stackexchange-tezos-sandboxes_glm_4_6_traces_together_again

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_dare_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_dare_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_dare_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_dare_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_dare_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_ties

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_dare_ties

0
·
1
·
Dec 2025
kafuengWarm4B32K

Affine-48MyBGLKLhaEHU1KiW

0
·
1
·
Dec 2025
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_unsloth_w_new_merged

0
·
1
·
Dec 2025