Models

39,069
tengfeima-aiCold500M32K

Qwen2.5-0.5B-Math-SFT-1024

0
·
2
·
Apr 2026
jordanpainterCold8B32K

diallm-llama-gspo-aus

0
·
2
·
Apr 2026
manhcuong2005Cold2B32K

qwen2.5-1.5b-legal-intent

0
·
2
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-cot-only-control-merged

0
·
2
·
Apr 2026
nilarnabdebnathCold2B32K

Qwen2.5-1.5B-Instruct_gsm8k

0
·
2
·
Apr 2026
mehuldamaniCold8B32K

bug_fixing_arl-7b-addmultiply-v4

0
·
2
·
Apr 2026
BoyBarleyCold500M32K

BoyBarley-V29-Pro-Buddy

0
·
2
·
Apr 2026
manhcuong2005Cold2B32K

qwen2.5-1.5b-legal-edu-v3

0
·
2
·
Apr 2026
FardanCold2B32K

Qwen2.5-1.5B-Instruct-Math-Reasoning-GRPO-Tuned

0
·
2
·
Apr 2026
myyycroftCold8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-6-deberta-nli-reward

0
·
2
·
Apr 2026
divelabCold2B32K

DAPO_E2H-countdown-gaussian_0p5_0p5

0
·
2
·
Apr 2026
zeras141aCold1B2K

lla3

0
·
2
·
Jun 2025
jackf857Cold8B8K

llama-3-8b-base-cpo-ultrafeedback-8xh200

0
·
2
·
Apr 2026
laionCold32B32K

nemosci-tasrep-a1mfc-dev1-maxeps-32b__Qwen3-32B

0
·
2
·
Apr 2026
jordanpainterCold8B32K

diallm-llama-gspo-all

0
·
2
·
Apr 2026
goyalayusCold4B32K

wordle-lora-20260324-163252-sft_turn5_fullft_smoke

0
·
2
·
Apr 2026
seopboCold2B32K

sft-qwen2.5-1.5b

0
·
2
·
Apr 2026
laionCold32B32K

nemosci-tasrep-a1mfc-dev1-maxeps-swes-r2eg-32b__Qwen3-32B

0
·
2
·
Apr 2026
myyycroftCold8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-3-deberta-nli-reward

0
·
2
·
Apr 2026
SeongryongJungCold500M32K

qwen2.5-0.5b-ifeval-halfepoch-sft

0
·
2
·
Apr 2026
SeongryongJungCold2B32K

qwen2.5-1.5b-ifeval-halfepoch-sft

0
·
2
·
Apr 2026
Bharat2004Cold32B32K

Qwen3-32B

0
·
2
·
Apr 2026
Alelcv27Cold3B32K

Llama3.2-3B-SLERP-Math-Code

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
2
·
Apr 2026
laionCold8B32K

nemotron-terminal-adapters_swe__Qwen3-8B

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint125

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint125

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint100

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint100

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint150

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint200

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint225

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint300

0
·
2
·
Apr 2026
sharad0xCold1B32K

llama-1b-reasoning-merged

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint200

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint275

0
·
2
·
Apr 2026
choiqsCold2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint175

0
·
2
·
Apr 2026
yipchifaiCold2B32K

Qwen2.5-1.5B-Instruct

0
·
2
·
Apr 2026
seopboCold2B32K

zerorlvrmath-qwen2.5-1.5b

0
·
2
·
Apr 2026
ajtaltarabukin2022Cold32B32K

merged_champion_v5_m1

0
·
2
·
Apr 2026
jackf857Cold8B8K

llama-3-8b-base-orpo-ultrafeedback-8xh200

0
·
2
·
Apr 2026
seopboCold2B32K

rlvrif-qwen2.5-1.5b

0
·
2
·
Apr 2026