Models

11,491
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint225

0
·
6
·
Apr 2026
YuQHWarm2B32K

Assignment3_Question1_qwen3-1.7b-backward-merged

0
·
6
·
Apr 2026
yipchifaiWarm2B32K

Qwen2.5-1.5B-Instruct

0
·
6
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.6-4xh200-batch-64-20260422-051621

0
·
6
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-kto-ultrafeedback-8xh200

0
·
6
·
Apr 2026
laionWarm8B32K

nemotron-terminal-data_querying__Qwen3-8B

0
·
6
·
Apr 2026
g-assismoraesWarm4B32K

Qwen3-4B-it-pira-ep3-qairm-ptbr

0
·
6
·
Apr 2026
lihaoxin2020Warm4B32K

qwen3-4B-refiner-sft-rl-balanced-resume-step100

0
·
6
·
Apr 2026
LorenaYannnnnWarm800M32K

bold_formatting-Qwen3-0.6B-OURS_self-seed_1

0
·
6
·
Apr 2026
laionWarm8B32K

nemotron-terminal-data_science__Qwen3-8B

0
·
6
·
Apr 2026
LorenaYannnnnWarm800M32K

bold_formatting-Qwen3-0.6B-OURS_self-seed_2

0
·
6
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merged_champion_v5_m3

0
·
6
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_375-2

0
·
6
·
Apr 2026
lzhong161Warm2B32K

qwen-backward-lora2

0
·
6
·
Apr 2026
petersohWarm1B32K

gemma-3-1b-it-sst5-merged

0
·
6
·
Apr 2026
DADA121Warm500M32K

qwen2.5-0.5b-sft-new

0
·
6
·
Apr 2026
ishikaaWarm3B32K

acquisition_qwen3bins_medmcqa_answer_variance

0
·
6
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-1e4

0
·
6
·
Apr 2026
sthapsWarm8B32K

openthaigpt-thaillm-8b-instruct-v0.7.2-research-preview-light-uncen

0
·
6
·
Apr 2026
LaoyujieWarm8B32K

merged-qwen-ta

0
·
6
·
Apr 2026
eekayWarm3B8K

gemma-2b-it-noised-np0.15-attn-emb

0
·
6
·
Apr 2026
introvoyz041Warm32B32K

Goedel-Prover-V2-32B

0
·
6
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e1

0
·
6
·
Apr 2026
laionWarm8B32K

nemotron-terminal-model_training__Qwen3-8B

0
·
6
·
Apr 2026
olusegunolaWarm1B2K

phi-1.5-stage3-sft-cloned-seed42-merged

0
·
6
·
Apr 2026
LaoyujieWarm8B32K

merged-qwen-slerp

0
·
6
·
Apr 2026
tzwilliam0Warm4B32K

qwen-dapo-17k-vs-2

0
·
6
·
Apr 2026
olusegunolaWarm1B2K

phi-1.5-cot-control-r96-seed42-merged

0
·
6
·
Apr 2026
LumosJiangWarm8B32K

Qwen3-8B-Base-SFT-AM-Thinking-v1-Distilled-Code-1800steps

0
·
6
·
Apr 2026
bigbananapieWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-small_miniature_giraffe

0
·
6
·
Aug 2025
anilkayWarm8B32K

csharp-clean-code-qwen-lora-merged

0
·
6
·
Apr 2026
eekayWarm3B8K

gemma-2b-it-noised-np0.2-emb

0
·
6
·
Apr 2026
lzhong161Warm2B32K

qwen-backward-lora

0
·
6
·
Apr 2026
jshwang370Warm3B8K

fintech_gemma_2b

0
·
6
·
Apr 2026
kmseongWarm8B32K

llama3.1_8b_base_only_sn_tuned_lr3e-5

0
·
6
·
Apr 2026
void-818Warm32B32K

Affine-20-5Cft6kfbx5aacDLg3dJpEiz2GW2Sd3vqZPDd3jnjrsZzYZ6J

0
·
6
·
Apr 2026
Johnny1024Warm4B32K

TTRL-sciknoweval_material-TTRL-Len-8k-grpo-094908

0
·
6
·
Apr 2026
HKUST-DSAILWarm8B32K

GraphMind-LLAMA-3.1-8B

1
·
6
·
Aug 2025
wincentIsMeWarm800M32K

Qwen3-0.6B-finetuned-astro-horoscope-fsdp

0
·
6
·
Apr 2026
LaoyujieWarm8B32K

merged-qwen-task

0
·
6
·
Apr 2026
wndussWarm3B8K

fintech_gemma_2b

0
·
6
·
Apr 2026
DQN-LabsWarm4B32K

dqncode2-preview

0
·
6
·
Apr 2026