Models

8,422
1B32Kgemma3t-1b
Warm

maxbsoft/gemma-3-1b-it-gsm8k-structured-reasoning-grpo-stage-2-1

0
·
5
·
Jan 2026
3B32Kqwen25-3b
Warm

gjyotin305/Qwen2.5-3B-Instruct_old_sft_alpaca_003

0
·
5
·
Jan 2026
1B32Kgemma3t-1b
Warm

JoshXT/AGiXT-AbilitySelect-270m

0
·
5
·
Jan 2026
4B32Kqwen3-4b
Warm

koutch/short_paper_qwen_2.json_train_dpo_v2_train_no_think

0
·
5
·
Jan 2026
4B32Kqwen3-4b
Warm

koutch/paper_qwen_qwen3-instruct-4b_train_sft_all_train_code

0
·
5
·
Jan 2026
4B32Kqwen3-4b
Warm

e0nia/chessllm_4b_fp16

0
·
5
·
Jan 2026
3B32Kllama32-3b
Warm

TTahir/Llama3bv1

0
·
5
·
Feb 2025
4B32Kqwen3-4b
Warm

dstaka/dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

nakotsuko13/qwen3-4b-nako13-dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

koutch/qwen_2.json_train_dpo_v1_train_code

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

mutsumutsu/dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

ml-engnr/dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

ryosao/dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

mihsato/dpo-qwen-cot-merged-mihsato-v1

0
·
5
·
Feb 2026
2B32Kqwen2-1b5
Warm

sugiken/Ordis-1.5B-V355-VarGH

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

stemask2985/dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

aobu04/dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

koutch/qwen_qwen3-instruct-4b_train_grpo_v1_train_code

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

dormouse2/dpo-qwen-cot-merged

0
·
5
·
Feb 2026
4B32Kqwen3-4b
Warm

yamanara/dpo-qwen-cot-merged

0
·
5
·
Feb 2026