Models

39,369
ccui46Warm8B32K

q2.5_7b_aime_per_chunk_act_untrained_1000

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

expert_acc_MRL4096_ROLLOUT4_LR5e-7_step54

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

expert_cos_MRL4096_ROLLOUT4_LR5e-7_step54

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

expert_len_MRL4096_ROLLOUT4_LR5e-7_step30

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

binary_accfmt_MRL4096_ROLLOUT4_LR5e-7_step54

0
·
1
·
Dec 2025
BKM1804Warm4B32K

affine-he-14

0
·
1
·
Dec 2025
AlignmentResearchWarm70B32K

hr_sdf_whitespace_extra_Llama-3.1-70B-Instruct_3_epochs_v1_merged

0
·
1
·
Dec 2025
NickDegollado0714Warm4B32K

Affine-v7

0
·
1
·
Dec 2025
roy-0309Warm4B32K

Affine-v1

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.9_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.7_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.3_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.1_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.7_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_linear

0
·
1
·
Dec 2025
MilaWangWarm8B32K

es-qwen2-5-7b-lora-merged-3000-40k-spk_h-step240

0
·
1
·
Dec 2025
MilaWangWarm8B32K

es-qwen2-5-7b-lora-merged-3000-40k-spk_h-step320

0
·
1
·
Dec 2025
MilaWangWarm8B32K

es-qwen2-5-7b-lora-merged-3000-40k-spk_h-step400

0
·
1
·
Dec 2025
Babu420Warm14B32K

ninko-pinko

0
·
1
·
Dec 2025
HJUNNWarm8B32K

Qwen2.5-7B-Instruct-crypto-function-calling

0
·
1
·
Dec 2025
v-stoneWarm4B32K

affine-test-10

0
·
1
·
Dec 2025
sagnikMWarm2B32K

ppo_adam_qwen3_1.7b

0
·
1
·
Dec 2025
BKM1804Warm4B32K

affine-he-16

0
·
1
·
Dec 2025
CheeeeeeeekyWarm4B32K

Affine-5HWFHBJk9TU4FEnuyDJoVEUHH3PyorgXkMx3jRtMeUcPwWPA

0
·
1
·
Dec 2025
CheeeeeeeekyWarm4B32K

Affine-5FKjBVZidkX2xLaxZVbue4wtnXUK1giSF6BuMJzKunEb3gUU

0
·
1
·
Dec 2025
ahme0599Warm3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4-checkpoint-88

0
·
1
·
Dec 2025
ahme0599Warm3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4-checkpoint-393

0
·
1
·
Dec 2025
ahme0599Warm3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4-checkpoint-186

0
·
1
·
Dec 2025
ahme0599Warm2B32K

Qwen_Qwen2.5-1.5B-Instruct-GRPO-vanilla_G_4-checkpoint-510

0
·
1
·
Dec 2025
MultiRLWarm4B32K

qwen3_4b_easy_rl_our_adv_final

0
·
1
·
Dec 2025
weirekWarm4B32K

Affine-ded-ftr

0
·
1
·
Dec 2025
weirekWarm4B32K

Affine-abd-ftr

0
·
1
·
Dec 2025
laionWarm8B32K

stackexchange-tezos-sandboxes_glm_4_6_traces_locetash

0
·
1
·
Dec 2025
asingh15Warm4B32K

qwen3-4b-arc-direct-gpt5miniabs-sft-allprobs-lr5e5-wd1e4-1211

0
·
1
·
Dec 2025
cynricqinWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-bipedal_roaring_cassowary

0
·
1
·
Dec 2025
lluvecwonvWarm8B8K

llama3-8b-tofu-ft-5epochs

0
·
1
·
Dec 2025
WebScraper991923Warm4B32K

Affine-S5

0
·
1
·
Dec 2025
moncefemWarm7B4K

Mistral-7B-v0.3-Legal-Competition

0
·
1
·
Dec 2025
ozayezerceliWarm4B32K

Qwen3-4B-Inst-CoT-GRPO

0
·
1
·
Dec 2025
aspariusWarm2B32K

Qwen2.5-1.5B-SPO-1ep-iter2

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.9_linear

0
·
1
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.7_linear

0
·
1
·
Dec 2025