Models

39,362
JRQiWarm8B32K

seed0_sample5000_bmlama_Qwen-Qwen2.5-7B_en-ko_1.0-1.0_1.0

0
·
1
·
Sep 2025
yusufcelebiWarm14B32K

qwen3-14B-dynamic-layer-selected-step90

0
·
1
·
Jan 2026
final-roundWarm14B32K

Affine-Disc_5G3Vc84iut46a99YRZrQoa9kmHnEpCzJoVVzVxWayrR5dbEE

0
·
1
·
Feb 2026
jinkami07Warm4B32K

sft-qwen3-4b-cotmask-r64-lr1e6-ep2-merged

0
·
1
·
Feb 2026
viamr-projectWarm2B32K

qwen3-1.7b-amr-augmented-20260214-1807

0
·
1
·
Feb 2026
zktmpWarm8B32K

020200-ppo_gen-vpt-fix-step180

0
·
1
·
Feb 2026
mohitskaushalWarm500M32K

qwen2-0.5b-ultrachat-10k

0
·
1
·
Feb 2026
EvangelinejyWarm3B32K

llama-32-3b-midtrain-openthoughts-nothink-8192-epoch3.0-bs4

0
·
1
·
Feb 2026
vibhuiitjWarm4B32K

darwin_iter2_dataset_verified_matched

0
·
1
·
Feb 2026
natsu39Warm8B32K

TwinLlama-3.1-8B

0
·
1
·
Feb 2026
hndaWarm4B32K

qwen3-4b-alf-sft-merged

0
·
1
·
Feb 2026
XY26Warm8B32K

Llama-3.1-8B-DeFramed

0
·
1
·
Feb 2026
vzazazaWarm1B2K

caza1

0
·
1
·
Sep 2025
RAANA-IAWarm1B2K

Pite12-coder

0
·
1
·
Jan 2026
KhyatimiraniWarm3B32K

pcos-fertility-llama3-8b

0
·
1
·
Feb 2026
yil384Warm800M32K

Triton-Lora-RL-step2-sv

0
·
1
·
Feb 2026
hex7777Warm14B32K

Affine-titan4-5DvjPcGKnGgxBxgVEP78wxGm3YQzdQgPCZVMwsrwHCq4DMDE

0
·
1
·
Feb 2026
szkiMWarm12B32K

Gemma12B-DPO_RSFT1

0
·
1
·
Feb 2026
Nina2811awWarm33B32K

qwen-coder-risky-financial-advice

0
·
1
·
Feb 2026
JennnyWarm8B32K

rubric_rm_1_500_merge

0
·
1
·
Feb 2026
jerrimuWarm8B32K

4oEver-8B

0
·
1
·
Feb 2026
ccls1114Warm4B32K

Task1_lastttfine_tune_Model

0
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_3_iter_0002500

0
·
1
·
Feb 2026
AdanatoWarm3B32K

qwen25_3b_instruct_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_0

0
·
1
·
Feb 2026
hndaWarm4B32K

qwen3-4b-alf-sft-merged-v2

0
·
1
·
Feb 2026
AdanatoWarm8B8K

llama3_8b_instruct_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_4

0
·
1
·
Feb 2026
AdanatoWarm8B8K

llama3_8b_instruct_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_5

0
·
1
·
Feb 2026
ElfsongWarm32B32K

VLM_stage_3_iter_0003500

0
·
1
·
Feb 2026
PhonsiriWarm3B8K

gemma-2-2b-CoT-sft-thing-format-moredataset-sft2-fix

0
·
1
·
Feb 2026
agadelmoula-aveyWarm4B32K

gemma-3-4b-pt-with-it-tokenizer

0
·
1
·
Feb 2026
xing720310Warm14B32K

qwen3-14b-thinking-2

0
·
1
·
Feb 2026
lyadalachanchuWarm4B32K

qwen3-4b-sdpo-rsa-step60

0
·
1
·
Feb 2026
theycallmelokiWarm7B4K

milady

1
·
1
·
Apr 2025
mlfoundations-devWarm8B32K

opencodereasoning_100k

0
·
1
·
Apr 2025
AlisonWenNCTUWarm8B32K

sft-qwen2.5-7b-generate-thinking-no-guideline-full-dataset

0
·
1
·
Feb 2026
CryptoYogiWarm3B8K

vazhi-v1

0
·
1
·
Feb 2026
target919Warm14B32K

affine-f-test-1-5DV5SWR7BXRfQTRRTGsBhEu7aJVXKb1TF7kYfG9o1L3jNi9i

0
·
1
·
Feb 2026
vinchuWarm8B32K

Llama-3.1-8B-Instruct-Answer-fullsft

0
·
1
·
Feb 2026
AdanatoWarm8B8K

llama3_8b_instruct_ppl_baseline-llama3_8b_instruct_ppl_bin_5

0
·
1
·
Feb 2026
AdanatoWarm8B8K

llama3_8b_instruct_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_2

0
·
1
·
Feb 2026
jiosephleeWarm8B32K

distilled-intern-GRPO-1-epoch-small-subset-v1-tools

0
·
1
·
Feb 2026
boweizh1204Warm8B32K

sdfsd

0
·
1
·
Jan 2026