Models

39,762
VerlToolWarm8B32K

acecoder-fsdp_agent-qwen_qwen2.5-coder-7b-grpo-n16-b128-t1.0-lr1e-6new-210-step

0
·
2
·
Apr 2025
zeras141aWarm1B2K

lla2

0
·
2
·
Jun 2025
GrachidefiWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-armored_dormant_mongoose

0
·
2
·
Nov 2025
uos-nlpWarm15B32K

STAR1-14B-notI-rlvr-step75

0
·
2
·
Apr 2026
zeras141aWarm1B2K

fb149ec7

0
·
2
·
Aug 2025
JameSandWarm2B32K

qwen3-1.7b-base-svd-muon-adam-lr3e-6-minV-bs128-kl0.0-stampede3-global_step_200

0
·
2
·
Apr 2026
JameSandWarm2B32K

qwen3-1.7b-base-svd-muon-adam-lr3e-6-minNone-bs128-kl0.0-stampede3-global_step_200

0
·
2
·
Apr 2026
JameSandWarm2B32K

qwen3-1.7b-base-svd-muon-adam-lr3e-6-minNone-bs128-kl0.0-stampede3-global_step_300

0
·
2
·
Apr 2026
AksaraLLMWarm2B32K

AksaraLLM-Qwen-1.5B-v3-public

0
·
2
·
Apr 2026
LuckyMan123Warm8B32K

grapher-few-shot-lora

0
·
2
·
Apr 2026
phee27Warm14B32K

prompt-extractor-qwen3-14b-v5-no-json-770

0
·
2
·
Apr 2026
berkhanWarm8B8K

llama31-8b-turkish-sft-v3-merged

0
·
2
·
Apr 2026
Mahesh111000Warm4B32K

hanabi_new_25k_data

0
·
2
·
Apr 2026
jordyyyyWarm2B32K

qwen2.5_1.5b_instruct_finetuned_temp

0
·
2
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merged_qwen3_dare

0
·
2
·
Apr 2026
laionWarm32B32K

nemosci-tasrep-a1unix-a1mfc-gfistaqc-scaff-maxeps-swes-r2eg-32b__Qwen3-32B

0
·
2
·
Apr 2026
ShivaniiKumWarm8B32K

qwen-medreason-finetuned

0
·
2
·
Apr 2026
BumpeetWarm2B32K

qwen2.5-1.5b-adaptive-tutor-sft

0
·
2
·
Apr 2026
jindunWarm2B32K

Qwen3-1.7B-GOPD-DeepMath

0
·
2
·
Apr 2026
EternalEdenWarm7B4K

Tower-Sep_1c1t

0
·
2
·
Apr 2026
jalenluorionWarm8B32K

Qwen2.5-7B_reasoning

0
·
2
·
Apr 2026
daman1209aroraWarm2B32K

MaxRL-Qwen3-1.7B-Base-IDK-math12k-32-brier-rloo-step2000

0
·
2
·
Apr 2026
EternalEdenWarm7B4K

Tower-Sep_2c1t_MTcontext

0
·
2
·
Apr 2026
MilyaShamsWarm2B32K

Qwen3-1.7B-SparseGPT_unstruct_0.6_bs64_damp0.05

0
·
2
·
Apr 2026
Ricardo-HWarm8B32K

ws-wm-0416-step-20

0
·
2
·
Apr 2026
DRAGONARUWarm1B32K

gemma3-1b-it-SFT_countdown

0
·
2
·
Apr 2026
MilyaShamsWarm2B32K

Qwen3-1.7B-Wanda_unstruct_0.6

0
·
2
·
Apr 2026
shrangoWarm8B32K

lorem_advshape_qwen2.5-math-7b

0
·
2
·
Apr 2026
Ricardo-HWarm8B32K

ws-wm-0416-step-80

0
·
2
·
Apr 2026
hamishiviWarm4B32K

qwen3_4b_our_data_tmax

0
·
2
·
Apr 2026
Samuell43Warm2B32K

Qwen2.5-Coder-1.5B-Instruct-Gensyn-Swarm-dappled_territorial_mule

0
·
2
·
Nov 2025
MilyaShamsWarm2B32K

Qwen3-1.7B-Wanda_4_8

0
·
2
·
Apr 2026
ArtemisnanaWarm4B32K

qwen3-4b-0413

0
·
2
·
Apr 2026
Ricardo-HWarm8B32K

ws-wm-0416-step-40

0
·
2
·
Apr 2026
gradients-io-tournamentsWarm2B32K

tournament-tourn_72871bf73ef78976_20260423-091116b6-3139-4b29-a7c4-790ebf5a414f-5DfdHDKN

0
·
2
·
Apr 2026
Mahesh111000Warm4B32K

Anonyopus_thinking_plus_kaou11_minus_instruct

0
·
2
·
Apr 2026
TMLR-Group-HFWarm8B32K

GT-Qwen3-8B-Base-DAPO14k

1
·
2
·
Oct 2025
jalenluorionWarm8B8K

Llama-3.1-8B_mathv1

0
·
2
·
Apr 2026
OENOWarm8B32K

eidolum-qwen-merged

0
·
2
·
Apr 2026
melhoushiWarm8B32K

JacobiForcing_Code_5k_constant

0
·
2
·
Apr 2026
itstechuseWarm7B4K

akeno-model-merged-epoch2

0
·
2
·
Apr 2026
papyrus-puppyWarm32B32K

affine-109-5EyMgGvgwtrn6fTWJeuKQxoyummigCW1Rj9qMsCaZKaNES2N

0
·
2
·
Apr 2026