Models

7,348
cchoi1ColdTools8B32K

generator-fixer-step-90

0
·
2
·
Jan 2026
zeynebnkColdTools8B32K

ws_0.01_10

0
·
2
·
Jan 2026
nbtpjColdTools500M32K

summ_Qwen0b5_inst_cnnxsumsam

0
·
2
·
Jan 2026
nbtpjColdTools500M32K

summ_Qwen0b5_tldr_xsum

0
·
2
·
Jan 2026
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_009

0
·
2
·
Jan 2026
bimabkColdTools500M32K

environment_test

0
·
2
·
Jan 2026
shuoxingColdTools8B32K

qwen2-5-7b-full-pretrain-control-tweet-1m-en-reproduce-bs8

0
·
2
·
Jan 2026
gjyotin305ColdTools8B32K

Qwen2.5-7B-Instruct_new_alpaca_005

0
·
2
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-40

0
·
2
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50

0
·
2
·
Jan 2026
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-70

0
·
2
·
Jan 2026
motigrezColdTools8B32K

scienceworld_grpo_qwen2.5_7b_50_10_step50

0
·
2
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-NoBaseline

0
·
2
·
Jan 2026
vericavaColdTools8B32K

Qwen2.5-7B-ja-struct-tooled-base

1
·
2
·
Jan 2026
talzoomanzooColdTools8B32K

qwen2.5-7b-instruct-kk-best

0
·
2
·
Jan 2026
seele123ColdTools8B32K

MATH-Qwen2.5-math-7B-GRPO

0
·
2
·
Jan 2026
uiuc-kang-labColdTools8B32K

Qwen2.5-Math-7B-GRPO-noise-0.4-epoch-3

0
·
2
·
Jan 2026
shawntzxColdTools500M32K

Qwen2.5-3B-GRPO-3_3_8_6k

0
·
2
·
Mar 2025
HahmdongColdTools8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-30

0
·
2
·
Jan 2026
AlisonWenNCTUColdTools8B32K

sft-qwen2.5-7b-generate-thinking-no-guideline

0
·
2
·
Jan 2026
talzoomanzooColdTools8B32K

qwen2.5-7b-instruct-aime-5k-best

0
·
2
·
Feb 2026
yufeng1ColdTools8B32K

R1-Distill-Qwen-7B-summary-type3-e1-10000

0
·
2
·
Feb 2026
AIencoderColdTools8B32K

Logic-Coder-7B

1
·
2
·
Jan 2026
talzoomanzooColdTools8B32K

qwen2.5-7b-instruct-sat-best

0
·
2
·
Jan 2026
yufeng1ColdTools8B32K

R1-Distill-Qwen-7B-summary-type3-e1-10000-2

0
·
2
·
Feb 2026
mlfoundations-devColdTools8B32K

teacher_code_qwq

0
·
2
·
Apr 2025
didula-wso2ColdTools8B32K

exp_23_dtest_grpo_checkpoint_60_16bit_vllm

0
·
2
·
Feb 2026
konstantgrColdTools8B32K

qwen25-7b-router-sft-0211

0
·
2
·
Feb 2026
akcit-motionColdTools8B32K

qwen2.5-7b-instruct-motion

0
·
2
·
Feb 2026
MilaWangColdTools8B32K

Qwen2.5-7B-LoRA-merged

0
·
2
·
Dec 2025
JRQiColdTools8B32K

seed0_sample5000_bmlama_Qwen-Qwen2.5-7B_en-ko_1.0-1.0_1.0

0
·
2
·
Sep 2025
parzivalprimeColdTools8B32K

TrialPulse-8B-Perfection

0
·
2
·
Feb 2026
tliuColdTools8B32K

seed0_sample30000_mmmlu_Qwen-Qwen2.5-7B_en-ar-de-es-fr-hi-id-it-ja-ko-pt-zh_1.0_1e-05_dco

0
·
2
·
Feb 2026
target919ColdTools73B32K

affine-k-1-5EWSasAgABTaNwkLMudKKCZw8WZKbiNMcQrHKUUMwMoWsxRj

0
·
2
·
Feb 2026
mlfoundations-devColdTools8B32K

teacher_science_qwq

0
·
2
·
Apr 2025
AlisonWenNCTUColdTools8B32K

sft-qwen2.5-7b-generate-thinking-no-guideline-full-dataset

0
·
2
·
Feb 2026
hmuegyiColdTools8B32K

qwen2.5-en-my-opus100

0
·
2
·
Feb 2026
felixwanggColdTools8B32K

Qwen2.5-Coder-7B-Instruct-pyvul-document-scaling_coef-0.3

0
·
2
·
Feb 2026
Ricardo-HColdTools8B32K

ws-wm-0208-step-120

1
·
2
·
Feb 2026
eduard76ColdTools8B32K

stability-Qwen2.5-7B-Instruct

0
·
2
·
Oct 2025
1t4chiColdTools8B32K

zhs-Qwen2.5-7B-AS-step-260-discount-1p0

0
·
2
·
Feb 2026
astom-MColdTools8B32K

matsuo-llm-advanced-phase-d

0
·
2
·
Feb 2026