Models - Page 1017

43,373
DCAgent2ColdTools32B32K

gptlong_continue_top8diverse100k_step1200__Qwen3-32B

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_top8diverse100k_step600__Qwen3-32B

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlong_step1200__Qwen3-32B

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

g1_top8_85k_gptlong_swegym_32b_step2400__Qwen3-32B

0
·
1
·
May 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_chem_bottom20_nogap-maxsteps150

0
·
1
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-1e5-2

0
·
1
·
Apr 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.8-Qwen3-0.6B-16bit

0
·
1
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlongtezos_step1200__Qwen3-32B

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

fresh_gptlongtezos_step1200__Qwen3-32B

0
·
1
·
May 2026
AgentCPTColdTools4B32K

Qwen3-4B_thinking_agent_sft_nemotron_tool_calling_v2_lr1e-5_epoch_1_ctx_16384_bs_256

0
·
1
·
Jan 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_bio_bottom20_nogap-maxsteps150

0
·
1
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step3000__Qwen3-32B

0
·
1
·
May 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_physics_bottom20_nogap-maxsteps150

0
·
1
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step3600__Qwen3-32B

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step2700__Qwen3-32B

0
·
1
·
May 2026
DCAgentColdTools32B32K

g1_top8_diverse_3160_32b_seed123_step145__Qwen3-32B

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

tezos100k_continue_top8diverse100k_step1200__Qwen3-32B

0
·
1
·
May 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_material_bottom20_nogap-maxsteps150

0
·
1
·
Apr 2026
AnonymousNodeGAEColdTools2B32K

cold-start-alfworld-safety-sft-qwen-1.5b-instruct-1-global-step-228

0
·
1
·
Apr 2026
GrailDFIRColdTools70B32K

ldfirm-llama3.3-70b

0
·
1
·
Apr 2026
JameSandColdTools2B32K

qwen3-1.7b-base-svd-muon-adam-lr3e-6-minV-bs128-kl0.0-stampede3-global_step_200

0
·
1
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_31600_32b_step1430__Qwen3-32B

0
·
1
·
May 2026
v3raColdTools8B8K

V3ra-Insync-AI-v1-merged

0
·
1
·
Apr 2026
lizdongberkeleyeduColdTools8B32K

nutrition_training_model

0
·
1
·
Apr 2026
jackliusrColdTools32B32K

qwen_finetune_16bit

0
·
1
·
May 2026
RockTokenColdTools4B32K

qwen3_30b_a3b_to_4b_offpolicy_20k

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_material-qwen3-4b-think-2507-r6k100

0
·
1
·
Apr 2026
mayiwenColdTools14B32K

PaperAudit_Qwen3_14B_sft_rl

0
·
1
·
Jan 2026
Lixing-LiColdTools8B32K

Llama-3.1-8B-LoRA-TENSORTRUST-LATE8TH

0
·
1
·
Apr 2026
parkjoColdTools8B32K

Qwen2.5-Math-7B_grpo_adv_rollout_8_step580

0
·
1
·
May 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint350

0
·
1
·
Apr 2026
void-818ColdTools32B32K

Affine-20-5Cft6kfbx5aacDLg3dJpEiz2GW2Sd3vqZPDd3jnjrsZzYZ6J

0
·
1
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e1-2

0
·
1
·
Apr 2026
vingale803ColdTools3B32K

tofu_Llama-3.2-3B-Instruct_forget01_NPO_beta1.0_lr1e-5

0
·
1
·
Apr 2026
grafColdTools2B32K

math_btoracle-4b-f3c36853-not_easy_1e-4_200

0
·
1
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-lr5e-5

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k20-lr5e-7-ema0-eopd0.8-qwen3-4b-think-mmlu_pro_train10k_bottom20-s150

0
·
1
·
Apr 2026
ikkirenColdTools2B32K

qwen-2.5-1.5b-instruct-ru-lora-r32-compose-train-mera-16k

0
·
1
·
Apr 2026
zeras141aCold1B2K

fb5a501b

0
·
1
·
Aug 2025
Johnny1024ColdTools4B32K

intuitor-sciknoweval_chem-qwen3-4b-think-2507-r6k100

0
·
1
·
Apr 2026
shrangoColdTools8B32K

lorem_advshape_qwen2.5-math-7b

0
·
1
·
Apr 2026
yosa722ColdTools3B32K

yosa-gin002

0
·
1
·
May 2026