Models

10,273
finvixWarmTools500M32K

qwen-2.5-0.5B

0
·
4
hyunw3WarmTools500M32K

qwen-2.5-0.5b-r1-countdown_lr5e-6

0
·
4
deadcode99WarmTools500M32K

qwen2.5-0.5B-coder

0
·
4
analistWarmTools8B32K

deepseek-math-tutor-fine-tuned

1
·
4
yamatazenWarmTools12B32K

Luna-Karcher-12B

4
·
4
credshieldsWarmTools4B32K

Solidity-CodeGen-v0.1

2
·
4
·
Oct 2025
k111191114Warm1B32K

gemma-3-finetune

0
·
4
·
Dec 2025
jastorjWarmTools8B32K

snowflake_arctic_text2sql_r1_7b-nl2sqlpp-4bit-v8-cw-32K

0
·
4
maxbsoftWarm1B32K

gemma-3-1b-it-gsm8k-structured-reasoning-grpo-stage-1

0
·
4
·
Jan 2026
maxbsoftWarm1B32K

gemma-3-1b-it-gsm8k-structured-reasoning-grpo-stage-2-1

1
·
4
·
Jan 2026
TechNamuWarmTools2B32K

Namu-1.7B

1
·
4
·
Feb 2026
Momoka1010WarmTools4B32K

dpo-qwen-cot-merged

0
·
4
·
Feb 2026
fieldvalley-llm2025WarmTools4B32K

llm2025_main_merged_dpo03

0
·
4
·
Feb 2026
manu02Warm1B32K

gemma-3-1b-it-4bit-lora-dpo-aligned

0
·
4
·
Feb 2026
Ryu19940329WarmTools4B32K

dpo-qwen-cot-merged

0
·
4
·
Feb 2026
canbingolWarm1B32K

gemma3_1B_base-tr-cpt-1epoch_stage2

0
·
4
·
Mar 2026
canbingolWarm1B32K

gemma3_1B_base-tr-cpt-1epoch_stage3

0
·
4
·
Mar 2026
nazdefWarm1B32K

gemma-3-1b-it-ghigliottina-grpo-merged-ckpt564

0
·
4
·
Mar 2026
trituenhantaoioWarmTools3B32K

llm-vn-1-3b

0
·
4
·
Oct 2025
monradachWarmTools3B32K

Llama-3.2-3B-Instruct-HeadQA

0
·
4
·
Mar 2026
neurocoderWarmTools500M32K

logsQwen2.5-0.5B-Instruct-math-gsm8k

0
·
3
cwaudWarmTools500M32K

ea2464eea0cce-8688-4e12-9786-0793d849b262

0
·
3
anmolagarwal999WarmTools500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_140

0
·
3
anmolagarwal999WarmTools500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_60

0
·
3
jtromeroWarmTools500M32K

qwen2-0.5b-phase2-codexglue-lora-ff

0
·
3
anmolagarwal999WarmTools500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_378

0
·
3
anmolagarwal999WarmTools500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_80

0
·
3
jtromeroWarmTools500M32K

qwen2-0.5b-lora-single-device-ff-testing

0
·
3
cwaudWarmTools500M32K

ea2844eea0cce-8688-4e12-9786-0793d849b262

0
·
3
viethq5WarmTools500M32K

Qwen2.5-0.5B-Instruct-f16

0
·
3
anmolagarwal999WarmTools500M32K

Qwen2_5-0_5B-Instructsft_savedmath_dataset_based_on_deepseek_distilled_traces_epoch_510

0
·
3
anmolagarwal999WarmTools500M32K

Qwen2_5-0_5B-Instructsft_savedmath_dataset_based_on_deepseek_distilled_traces_epoch_320

0
·
3
devJyWarmTools1B32K

nekollama

0
·
3
tripleeWarmTools1B32K

torchtune_1B_lr1.5e-5_8epoch_full_finetuned_llama3.2_millfield_241227_meta_before_user_15epoch

0
·
3
jessemengWarmTools1B32K

TwinLlama-3.1-8B-DPO

0
·
3
manav-gleanWarmTools1B32K

llama3.2-1b-neuspell-1epochs-150k

0
·
3
manav-gleanWarmTools1B32K

test2

0
·
3
tripleeWarmTools1B32K

torchtune_1B_lr1.5e-5_10epoch_full_finetuned_llama3.2_millfield_241227_meta_before_user_15epoch

0
·
3
kedar-bhumkarWarmTools1B32K

meta-llama-3.2-1B-Instruct-ft-sarcasm

0
·
3
·
Mar 2025
tripleeWarmTools1B32K

torchtune_1B_lr1.5e-5_13epoch_full_finetuned_llama3.2_millfield_241227_meta_before_user_15epoch

0
·
3
keithdrexelWarmTools1B32K

unsloth-llama-3.2-1b-tldr-unsloth_middle_5epochs

0
·
3
gorizontWarmTools1B32K

main-train

0
·
3