Models

5,806
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step7000

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step8000

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-2_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p8_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_alt_1_per_5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
PetarKalWarmTools4B32K

Qwen3-4B-Base-ascii-art-v5-e3-lr5e-5-ga16-ctx4096

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_mix_alt_rel_1e0_python_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_mix_all_rel_1e0_python_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_mix_any_rel_1e0_python_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
syaeveWarmTools2B32K

Qwen3-1.7B-base-MED

0
·
2
·
Mar 2026
surina125WarmTools2B32K

Qwen3-1.7B-base-MED_0325

0
·
2
·
Mar 2026
ljhjhWarmTools2B32K

Qwen3-1.7B-base-MED-MED

0
·
2
·
Mar 2026
PEKOMSWarmTools2B32K

Qwen3-1.7B-base-MED_0325

0
·
2
·
Mar 2026
totem205WarmTools2B32K

Qwen3-1.7B-base-MED

0
·
2
·
Mar 2026
adpretkoWarmTools3B32K

armv8_to_riscv_qwen25coder_3p0b_full

0
·
2
·
Mar 2026
adpretkoWarmTools3B32K

riscv_to_armv8_qwen25coder_3p0b_full

0
·
2
·
Mar 2026
adpretkoWarmTools3B32K

x86_to_armv8mac_qwen25coder_3p0b_full

0
·
2
·
Mar 2026
PetarKalWarmTools4B32K

Qwen3-4B-Base-ascii-art-v5-e3-lr1e-4-ga16-ctx4096

0
·
2
·
Mar 2026
PetarKalWarmTools4B32K

Qwen3-4B-Base-ascii-art-v5-e3-lr8e-5-ga16-ctx4096

0
·
2
·
Mar 2026
j05hr3dWarmTools3B32K

Llama-3.2-3B-Instruct-C_M_T-Reh_Dolly

0
·
2
·
Mar 2026
adpretkoWarmTools2B32K

x86_to_armv8mac_qwen25coder_1p5b_full

0
·
2
·
Mar 2026
adpretkoWarmTools2B32K

riscv_to_armv8mac_qwen25coder_1p5b_full

0
·
2
·
Mar 2026
adpretkoWarmTools500M32K

armv8mac_to_x86_qwen25coder_0p5b_full

0
·
2
·
Mar 2026
staeiouWarmTools2B32K

bartleby-qwen3-1.7b_dpo

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_alt_oracle1_noisy9_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
GM77WarmTools4B32K

qwen3-4b-verilog-grpo

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_fnr_eng_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_0p5_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_0p5_0p0_1p0_grpo_sapo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_0p5_0p0_1p0_grpo_dr_grpo_42_rule

0
·
2
·
Mar 2026
chenyukunWarmTools800M32K

qwen3-0.6b-grpo-math

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_0p8_0p0_1p0_grpo_dr_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_0p8_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_fnr_with_bracket_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
2
·
Mar 2026
ThrillcrazyerWarmTools2B32K

Qwen-2.5-1.5B_TAC_Teacher_Qwen14B

0
·
2
·
Mar 2026
j05hr3dWarmTools1B32K

Llama-3.2-1B-Instruct-C_M_T-AUX_CT_CE

0
·
2
·
Mar 2026
rajveer43WarmTools2B32K

supply-chain-grpo-Qwen3-1.7B

0
·
2
·
Mar 2026
j05hr3dWarmTools1B32K

Llama-3.2-1B-Instruct-C_M_T-1EP

0
·
2
·
Mar 2026
hyungjoochaeWarmTools4B32K

Qwen3-4B-verienv-webjudge-filtered-action-tag-final

0
·
2
·
Mar 2026
j05hr3dWarmTools1B32K

Llama-3.2-1B-Instruct-C_M_T-AUX_CT_CE_CM

0
·
2
·
Mar 2026
MVPRMWarmTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
2
·
Mar 2026
eekayWarm3B8K

gemma-2b-it-steer-dog-numbers-ft-single-l13

0
·
2
·
Jan 2026