Models

6,658
Dev-the-dev91Warm500M32K

syllabus-extractor-merged

0
·
105
·
May 2026
New
jdineenWarm2B32K

qwen3_1.7b_klcov_full_grpo

0
·
105
·
May 2026
New
jdineenWarm8B32K

qwen3_8b_hightemp13_baseline_solver_v3

0
·
105
·
May 2026
New
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-100p-lr3e6

0
·
105
·
May 2026
New
LexsiWarm4B32K

qwen3-4b-hh-rlhf-aligned

0
·
105
·
May 2026
jassonjuniorWarm8B32K

qwen3-8b-tool-calling

0
·
104
·
Jan 2026
Foremost01Warm4B32K

affine-5D4qsdevYnbVAgDDdKCkVpi36w14xMyGeQG5ijoNVmAW2ZNG

0
·
104
·
Feb 2026
LyteWarm1B32K

Gemma-3-1B-Moroccan-Instruct

1
·
104
·
Sep 2025
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_English_1p0_0p0_1p0_grpo_42_rule

0
·
104
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_Continue_1p0_0p0_1p0_grpo_42_rule

0
·
104
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_accuracy_1p0_0p0_1p0_grpo_42_rule

0
·
104
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_formula_1p0_0p0_1p0_grpo_42_rule

0
·
104
·
Mar 2026
ishikaaWarm3B32K

acquisition_qwen3binstruct_math_proximity_oq

0
·
104
·
Apr 2026
andr0m4daWarm800M32K

Qwen3-0.6B-Gensyn-Swarm-strong_lively_turkey

0
·
104
·
Jul 2025
menoplusWarm2B32K

diario-qwen3-1.7b-sft-v1-vllm

0
·
104
·
Apr 2026
jukofyorkWarm500M32K

Kimi-K2-Instruct-DRAFT-0.6B-v3.0

1
·
104
·
Aug 2025
DCAgentWarm32B32K

g1_top8_diverse_31600_32b_step1200__Qwen3-32B

0
·
104
·
May 2026
stefraWarm8B32K

llama_fm_2k

0
·
104
·
May 2026
0xbidkslj2Warm32B32K

Affine-5EbZzs3z1VAg6MzeaMjvJu5xn3bXArWVZAstnzNX5rBd15AE

0
·
104
·
May 2026
kairawalWarm3B32K

Llama-3.2-3B-Instruct-DA-SynthDolly-r16alpha32-E8-S73

0
·
104
·
May 2026
longtermriskWarm8B8K

Llama-3.1-8B-counterfactual-extended-facts-last-third

0
·
104
·
May 2026
kairawalWarm8B32K

Llama-3.1-8B-Instruct-EN-SynthDolly-r16alpha32-E5-S9

0
·
104
·
May 2026
New
jdineenWarm8B32K

qwen3_8b_klcov_baseline_solver_v2

0
·
104
·
May 2026
New
beezzaWarm7B4K

CharacterLM_JP

0
·
104
·
Oct 2024
anhbnWarm8B32K

unsloth-llama-3.1-8b-instruct-bnb-16bit-ft-targon

0
·
103
Lugha-LlamaWarm8B32K

Lugha-Llama-8B-wura_edu

1
·
103
·
Dec 2024
holten51Warm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-leggy_jagged_hawk

0
·
103
·
Nov 2025
GunulhonaWarm4B32K

Gemma-3-4B

0
·
103
·
Jan 2026
castoriniWarm2B32K

first_qwen3_1.7b

0
·
103
·
Sep 2025
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_sgnrel_up_1e1_1p0_0p0_1p0_grpo_42_rule

0
·
103
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_array_1p0_0p0_1p0_grpo_42_rule

0
·
103
·
Mar 2026
Zheng-ZongWarm8B32K

AronaR1-DS-7B

0
·
103
·
Mar 2026
kmseongWarm3B32K

llama3.2_3b_instruct-WaRP-safety-basis-MATH-FT-lr1e-6

0
·
103
·
Apr 2026
hippo-masterWarm32B32K

affine-68-5DJJ5BADptzkkNp1EPyXq5vafwTBTp5pKiBrhioFDNRnLeHs

0
·
103
·
May 2026
bherhaghhWarm7B4K

denton-genesis-large-merged

0
·
103
·
May 2026
PhucTinhWarm8B32K

proofdag

0
·
103
·
May 2026
wvnvwnWarm7B4K

Mistral-7B-Instruct-v0.3-pubmedqa-v1

0
·
103
·
May 2026
boradorishWarm4B32K

baseline-qwen3-4b-grounded_table

0
·
103
·
May 2026
iproskurinaWarm500M32K

qwen-hf-fewshot-iter-contam-np-iter5

0
·
103
·
May 2026
kairawalWarm4B32K

Qwen3-4B-DA-SynthDolly-r16alpha128-E5-S73

0
·
103
·
May 2026
shengjia-torontoWarm2B32K

sac-gspo-cl3e3-drgrpo-r1distill-qwen1.5b-step500-aime24-35-temp1

0
·
103
·
May 2026
iproskurinaWarm500M32K

qwen-hf-fewshot-iter-contam-np-iter4

0
·
103
·
May 2026