Models

8,743
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
6
·
Apr 2026
RockTokenColdTools4B32K

qwen3_30b_a3b_to_4b_onpolicy_5k_src20k-25k

0
·
6
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
6
·
Apr 2026
AgPerryColdTools4B32K

SWE-Lego-Qwen3-4B-posttrain

0
·
6
·
Apr 2026
heyalexchoiColdTools2B32K

qwen3-1.7b-math-grpo-best-local

0
·
6
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-aus

0
·
6
·
Apr 2026
vallerieeColdTools2B32K

Qwen3-1.7B-student-refusal-integer-seqkd

0
·
6
·
Apr 2026
ZhichengLiaoColdTools2B32K

GRPO_Numina_FFT_lr1e-6_qwen317B_global_step_272full

0
·
6
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_diverse_3160_32b_step145__Qwen3-32B

0
·
6
·
May 2026
StephYangColdTools32B32K

dpsk_v3_2_cc_plus_t2

0
·
6
·
Apr 2026
VigneshncodesColdTools800M32K

qwen-ai-startup-companies

0
·
6
·
Apr 2026
boradorishColdTools4B32K

qwen3-4b-finetuned-2.5k

0
·
6
·
Apr 2026
bralynnColdTools4B32K

deltat1

0
·
6
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-aus

0
·
6
·
Apr 2026
hoangchihien3011ColdTools8B32K

vietnamese-model-parm

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-harmless-8xh200

0
·
6
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_500

0
·
6
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-slic-hf-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
6
·
Apr 2026
wincentIsMeColdTools800M32K

Qwen3-0.6B-finetuned-astro_horoscope_use_FA2

0
·
6
·
Apr 2026
myfiColdTools4B32K

parser_model_ner_4.13_ep5

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint100

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint200

0
·
6
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step3900__Qwen3-32B

0
·
6
·
May 2026
ajtaltarabukin2022ColdTools32B32K

merged_champion_v5_m1

0
·
6
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4B-refiner-sft-rl-balanced-resume-step100

0
·
6
·
Apr 2026
ligeng-devColdTools8B32K

tw-data-train_final_v2_nb2_mt8192_replaced_fix-8node-resume

0
·
6
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_diverse_3160_32b_seed456_step145__Qwen3-32B

0
·
6
·
May 2026
David-Chew-HLColdTools8B32K

soc3_qwen

0
·
6
·
Apr 2026
tzwilliam0ColdTools4B32K

qwen-dapo-17k-vs-2

0
·
6
·
Apr 2026
LumosJiangColdTools8B32K

Qwen3-8B-Base-SFT-AM-Thinking-v1-Distilled-Code-1800steps

0
·
6
·
Apr 2026
RexhaifColdTools8B32K

Mlem-8B-RL-Thinking

0
·
6
·
Mar 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.5.1-Qwen3-0.6B-16bit

0
·
6
·
Apr 2026
qrk-labsColdTools800M32K

akeel-4B-lora

0
·
6
·
Apr 2026
RexhaifColdTools4B32K

Mlem-4B-SFT-Thinking-Seed1

0
·
6
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_85k_gptlong_swegym_32b_step3300__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlong_step1495__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step4520__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlongtezos_step2100__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlongtezos_step1800__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

fresh_gptlongtezos_step2100__Qwen3-32B

0
·
6
·
May 2026
BAAI-AgentsColdTools4B32K

EgoActor-4b-Qwen3VL

3
·
6
·
Feb 2026