Models

14,690
FutureMaWarmTools4B32K

qwen3-4b-msswift-checkpoint7000

0
·
2
·
Mar 2026
EvangelinejyWarmTools800M32K

Qwen3_0.6B_LanTokenizer_ctx2048_singleturn_with_verify_lr0.0003

0
·
2
·
Mar 2026
EvangelinejyWarmTools800M32K

Qwen3_0.6B_LanTokenizer_ctx2048_singleturn_no_verify_lr0.0003

0
·
2
·
Mar 2026
FutureMaWarmTools4B32K

qwen3-4b-msswift-checkpoint9909

0
·
2
·
Mar 2026
MiguelAngel385Warm1B2K

Tinyllama-medico

0
·
2
·
Mar 2026
EvangelinejyWarmTools800M32K

Qwen3_0.6B_LanTokenizer_ctx2048_multiturn_no_verify_lr0.0003

0
·
2
·
Mar 2026
SunbirdWarm12B32KVision

translategemma-12b-ug40-sft-merged

0
·
2
·
Mar 2026
Gege24WarmTools600M32K

zay-instruct-0.5B-2

0
·
2
·
Mar 2026
KoalacrownWarmTools4B32K

qwen3-4b-multiturn-sft-16bit

0
·
2
·
Mar 2026
AdanatoWarmTools3B32K

qwen25_3b_instruct_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_3

0
·
2
·
Feb 2026
berkerbaturWarmTools800M32K

qwen-0.6b-job-matcher-student

0
·
2
·
Mar 2026
LorenaYannnnnWarmTools800M32K

general_reward-Qwen3-0.6B-baseline_cot_only-seed_0

0
·
2
·
Mar 2026
LorenaYannnnnWarmTools800M32K

sycophancy-Qwen3-0.6B-OURS_self-seed_1

0
·
2
·
Mar 2026
Donfab31WarmTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
2
·
Mar 2026
LorenaYannnnnWarmTools800M32K

sycophancy-Qwen3-0.6B-OURS_self-seed_0

0
·
2
·
Mar 2026
PetarKalWarmTools4B32K

Qwen3-4B-ascii-art-curated-mix-v4-full-lr2e-5-ga16-ctx4096

0
·
2
·
Mar 2026
LorenaYannnnnWarmTools800M32K

general_reward-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
2
·
Mar 2026
LorenaYannnnnWarmTools800M32K

general_reward-Qwen3-0.6B-baseline_all_tokens-seed_2

0
·
2
·
Mar 2026
LorenaYannnnnWarmTools800M32K

general_reward-Qwen3-0.6B-baseline_cot_only-seed_1

0
·
2
·
Mar 2026
omron-sinicxWarmTools500M32K

Qwen2.5-0.5B-Instruct-sft

0
·
2
·
Feb 2026
reedmayhewWarm12B32KVision

gemini-3.1-pro-distill-reasoning-12B-QKVO-HF

0
·
2
·
Feb 2026
HyeongwonWarmTools4B32K

P9-split1_prob_Qwen3-4B-Base_0317-01

0
·
2
·
Mar 2026
IngingdoWarmTools500M32K

bit-0.5b-final-logic

0
·
2
·
Mar 2026
LorenaYannnnnWarmTools800M32K

confidence-Qwen3-0.6B-OURS_self-seed_1

0
·
2
·
Mar 2026
rbelanecWarmTools1B32K

train_qnli_42_1773765556

0
·
2
·
Mar 2026
HyeongwonWarmTools4B32K

P2-split2_bs256_prob_Qwen3-4B-Base_0317-01

0
·
2
·
Mar 2026
akademiaiWarm1B2K

crypto-sentiment-news-tiny-llm

0
·
2
·
Dec 2024
cybttxWarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-arctic_knobby_hummingbird

0
·
2
·
Oct 2025
asishleyWarmTools2B32K

qwen2.5-coder-1.5b-instruct-code-r1-grpo-896

0
·
2
·
Jan 2026
EcolashWarmTools2B32K

A2-Model-Harmful-LoRA

0
·
2
·
Mar 2026
LeoZotosWarmTools500M32K

Qwen2.5-0.5B_debiased

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-test-step500

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-test-step1000

0
·
2
·
Mar 2026
HyeongwonWarmTools4B32K

P2-split2_bs512_epoch5_5e-5_prob_Qwen3-4B-Base_0320-01

0
·
2
·
Mar 2026
cosail-knuWarmTools500M32K

qwen2.5-7b_gptq-draft-0.5b-code

0
·
2
·
Mar 2026
cosail-knuWarmTools500M32K

qwen2.5-7b_gptq-draft-0.5b-law

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_python_alt_1_per_2_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_python_alt_1_per_10_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_python_alt_1_per_5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_alt_1_per_2_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_alt_1_per_5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_alt_1_per_10_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026