Text Generation Models — Page 1002

42,728
DCAgent2ColdTools32B32K

fresh_gptlongtezos_step900__Qwen3-32B

0
·
1
·
May 2026
Lixing-LiColdTools8B32K

Llama-3.1-8B-LoRA-TENSORTRUST-LATE8TH

0
·
1
·
Apr 2026
wh-zhuColdTools8B32K

qwen2_7B-ultrachatfeedback-wspo

0
·
1
·
Jun 2025
Radiant28ColdTools2B32K

evolai-mamba2-0047b

0
·
1
·
Apr 2026
parkjoColdTools8B32K

Qwen2.5-Math-7B_grpo_adv_rollout_8_step580

0
·
1
·
May 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint350

0
·
1
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_only_sn_tuned_lr3e-5

0
·
1
·
Apr 2026
void-818ColdTools32B32K

Affine-20-5Cft6kfbx5aacDLg3dJpEiz2GW2Sd3vqZPDd3jnjrsZzYZ6J

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

TTRL-sciknoweval_material-TTRL-Len-8k-grpo-094908

0
·
1
·
Apr 2026
vingale803ColdTools3B32K

tofu_Llama-3.2-3B-Instruct_forget01_NPO_beta1.0_lr1e-5

0
·
1
·
Apr 2026
micleowen02ColdTools32B32K

affine-5Ccb12H25H5MXssy946rm4qxrQTmz5DH9M7DUG7W7ViioSGE

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

TTRL-sciknoweval_chem-TTRL-Len-8k-grpo-132125

0
·
1
·
Apr 2026
grafColdTools2B32K

math_btoracle-4b-f3c36853-not_easy_1e-4_200

0
·
1
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint300

0
·
1
·
Apr 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_adv_rollout_8_20260430_104009_step580

0
·
1
·
May 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-lr5e-5

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k20-lr5e-7-ema0-eopd0.8-qwen3-4b-think-mmlu_pro_train10k_bottom20-s150

0
·
1
·
Apr 2026
ikkirenColdTools2B32K

qwen-2.5-1.5b-instruct-ru-lora-r32-compose-train-mera-16k

0
·
1
·
Apr 2026
zeras141aCold1B2K

fb5a501b

0
·
1
·
Aug 2025
Johnny1024ColdTools4B32K

intuitor-sciknoweval_chem-qwen3-4b-think-2507-r6k100

0
·
1
·
Apr 2026
mironazaCold1B2K

zerp7

0
·
1
·
Sep 2025
sathiiiiiCold3B8K

polyalign-gemma2-2b-en-dist-sft

0
·
1
·
Apr 2026
shrangoColdTools8B32K

lorem_advshape_qwen2.5-math-7b

0
·
1
·
Apr 2026
yosa722ColdTools3B32K

yosa-gin002

0
·
1
·
May 2026
doupariColdTools8B8K

llama3.1_8b_sft-llopa-k24-no_system-cnndm-train.summary.q60000-llopa-k24-no_system

0
·
1
·
Apr 2026
rghosh8ColdTools2B32K

arc-grpo-deepseek-R1-distill-qwen-1.5b-rajat-seed-42-G-16-merged

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_chem_bottom20_nogap-maxsteps200-resp2

0
·
1
·
Apr 2026
jprivera44ColdTools70B32K

llama-3.3-70b-atlas9-sdf-v5-balanced

0
·
1
·
Apr 2026
anonymous-dadaColdTools8B32K

DialFactSum-ACU-8B

0
·
1
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-antidote

0
·
1
·
May 2026
jsilverbergColdTools2B32K

Qwen3-1.7B-Wordle-SFT

0
·
1
·
Apr 2026
parkjoColdTools2B32K

Qwen2.5-Math-1.5B_grpo_entropy_rollout_8_20260501_191140_step580

0
·
1
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-gsm8k-rsn-tuned-lr3e-5

0
·
1
·
May 2026
kmseongCold7B4K

Llama-2-7b-chat-hf_gsm8k_ft_freeze_basis_rotation_sn_lr5e-5

0
·
1
·
May 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_physics-qwen3-4b-think-2507-r6k100

0
·
1
·
Apr 2026
Radiant28ColdTools2B32K

evolai-mamba2-047b

0
·
1
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_step580

0
·
1
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_20260429_145817_step580

0
·
1
·
May 2026
jalenluorionColdTools8B8K

Llama-3.1-8B_mathv1

0
·
1
·
Apr 2026
Plum32ColdTools32B32K

affine-ss4-5D4QmR9SSDcJPEMGTZ5Gei4MqrVnZji43XXrQ1FxcS5jYvYB

0
·
1
·
Apr 2026
JordanskyColdTools4B32K

punk-uptest-gr

0
·
1
·
Apr 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-SSFT-lr5e-5

0
·
1
·
Apr 2026