Models

10,953
wvnvwnWarm9B16K

gemma-2-9b-it-gsm8k-rsn-tuned-lr3e-5

0
·
102
·
May 2026
DCAgentWarm32B32K

g1_top8_diverse_100000_32b_step1200__Qwen3-32B

0
·
102
·
May 2026
ferrazzipietroWarm8B32K

unsup-Llama-3.1-8B-Instruct-datav2-only_mask_w_item_mesh

0
·
102
·
May 2026
Enthusiast101Warm1B32K

llama3.2-1b-Inst-safegrad

0
·
102
·
May 2026
parkjoWarm3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_resume_epoch10_20260429_004543_step232

0
·
102
·
May 2026
minchaoh2002Warm8B32K

Qwen3-8B-pragrest-no-easy-grpo-FullFT3-previous-data_step_18

0
·
102
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_GPTQ_INT3-asym_codeforces-cots

0
·
102
·
May 2026
chaibi-mustaphaWarm3B8K

gemma-2-2b-fire-detection

0
·
102
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-PERTA-MCEVALHARD-1.5B-Base

0
·
102
·
May 2026
kairawalWarm4B32K

Qwen3-4B-HI-SynthDolly-r16alpha128-E5-S73

0
·
102
·
May 2026
bryordasWarm8B32K

v041.1

0
·
102
·
May 2026
kairawalWarm4B32K

Qwen3-4B-EN-SynthDolly-r16alpha128-E5-S73

0
·
102
·
May 2026
wemaraWarm8B32K

TwinLlama-3.1-8B

0
·
102
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_1p20

0
·
102
·
May 2026
jdineenWarm4B32K

qwen3_4b_klcov_baseline_solver_v2

0
·
102
·
May 2026
jdineenWarm4B32K

qwen3_4b_clipcov_baseline_solver_v4

0
·
102
·
May 2026
LexsiWarm4B32K

gemma3-4b-code-sft-drift

0
·
102
·
May 2026
jdineenWarm4B32K

qwen3_4b_hightemp13_baseline_solver_v1

0
·
102
·
May 2026
g4meWarm4B32K

QwenRolina-4B-Base-LR1e5

0
·
102
·
May 2026
New
kairawalWarm14B32K

Qwen3-14B-EN-SynthDolly-r16alpha32-E1-S3407

0
·
102
·
May 2026
New
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_five_1p0_0p0_1p0_grpo_42_rule

0
·
101
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_multiplication_1p0_0p0_1p0_grpo_42_rule

0
·
101
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_add_1p0_0p0_1p0_grpo_42_rule

0
·
101
·
Mar 2026
skysys00Warm8B8K

Meta-Llama-3-8B-Instruct-DeepRefusal

4
·
101
·
Apr 2026
lenitokoreWarm32B32K

affine-5DcPPBNKsGbWxkwHRisZuzA2z5NbiQjHCWS8NJHUq5NN2E7J

0
·
101
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6c1-distill-lam01-maskoff

0
·
101
·
May 2026
void-818Warm32B32K

Affine-ccc0-5EcVrCC1oFQPLeKoxTFpoPbBLQaNfooVRHSWZpPvrJBA6RxL

0
·
101
·
May 2026
cjiaoWarm2B32K

goldengoose-high_div_rand_top-25grp

0
·
101
·
May 2026
kmseongWarm7B4K

llama2_7b_chat-WaRP-safeinstr_ratio0.1_lr5e-5

0
·
101
·
May 2026
stefraWarm7B4K

mistral_ablazione_full

0
·
101
·
May 2026
redityaaWarm8B32K

Qwen3-8B-v1-test

0
·
101
·
May 2026
lstenoWarm4B32K

Qwen3-4B-Instruct-2507-RLM-RLVR-FullFT-lr5e-6-depth1-v1

0
·
101
·
May 2026
kairawalWarm8B32K

Qwen3-8B-EN-SynthDolly-r16alpha32-E3-S9

0
·
101
·
May 2026
jdineenWarm4B32K

qwen3_4b_clipcov_baseline_solver_v3

0
·
101
·
May 2026
cs-552-2026-RatGPTWarm2B32K

multilingual_model

0
·
101
·
May 2026
jdineenWarm8B32K

qwen3_8b_clipcov_baseline_solver_v1

0
·
101
·
May 2026
LexsiWarm3B32K

llama32-3b-hh-rlhf-aligned

0
·
101
·
May 2026
ewald1976Warm12B32K

Corridor-D-12B

0
·
101
·
May 2026
New
the81coderWarm1B32K

gemma-3-1b-it-reasoning

0
·
100
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_sgnrel_down_1e0_1p0_0p0_1p0_grpo_42_rule

0
·
100
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_rel_1e-2_1p0_0p0_1p0_grpo_42_rule

0
·
100
·
Mar 2026
kmseongWarm3B32K

llama3.2-3b-WaRP-utility-basis-safety-FT

0
·
100
·
Apr 2026