Text Generation Models — Page 1003

42,728
Plum32ColdTools32B32K

affine-ss4-5D4QmR9SSDcJPEMGTZ5Gei4MqrVnZji43XXrQ1FxcS5jYvYB

0
·
1
·
Apr 2026
JordanskyColdTools4B32K

punk-uptest-gr

0
·
1
·
Apr 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-SSFT-lr5e-5

0
·
1
·
Apr 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_20260429_160848_step580

0
·
1
·
May 2026
kmseongColdTools3B32K

llama-3.2-3b-instruct-only-sn-tuned-lr5e-5

0
·
1
·
May 2026
HelloGYColdTools8B32K

Qwen_asap_shot7_sft_fold0

0
·
1
·
Apr 2026
Ha-yaColdTools2B32K

QWEN3-1.7B-EXTENDED-HUMAN

0
·
1
·
Apr 2026
Johnny1024ColdTools4B32K

ttrl-mmlu_pro-qwen3-4b-think-2507-TTRL-Len-8k-grpo-232417

0
·
1
·
Apr 2026
rghosh8ColdTools2B32K

deepseek-r1-distill-qwen-1.5b-opencoder-educational-instruct-seed-3407-G-8_merged

0
·
1
·
Apr 2026
zain329Cold3B8K

EpidemicAI-Gemma2B-GRPO

0
·
1
·
Apr 2026
fifrioColdTools8B32K

Qwen3-8B-tacq-4bit-calibration-Chinese-128samples

0
·
1
·
Dec 2025
kmseongColdTools8B32K

llama3.1_8b_base_only_rsn_tuned_lr3e-5

0
·
1
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-solo-attn-v2-k24-no_system

0
·
1
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-CWQ-hit1-no-turn-advantage

0
·
1
·
Apr 2026
PHJinColdTools3B32K

qwen2.5_sft_merged_dk_it

0
·
1
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-gsm8k-sn-tuned-lr3e-5

0
·
1
·
May 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.5.1-Qwen3-0.6B-16bit

0
·
1
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-gsm8k-lr5e-5

0
·
1
·
May 2026
newtechdevngColdTools2B32K

qwen-math-tutor

0
·
1
·
May 2026
fifrioColdTools8B32K

Qwen3-8B-tacq-4bit-calibration-Swahili-128samples

0
·
1
·
Dec 2025
JasonLi23ColdTools2B32K

my_qwen2_math

0
·
1
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-ssft-lr3e-5

0
·
1
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260429_004543_step580

0
·
1
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlong__Qwen3-32B

0
·
1
·
May 2026
ayushgupta7777ColdTools7B4K

sentinelops-mistral7b-merged

0
·
1
·
Apr 2026
yunhowhourColdTools4B32K

DAPO_batch_1024_step_90

0
·
1
·
Apr 2026
yunhowhourColdTools2B32K

CRRL_distill_1.5B_w_o_globalnorm_step_120

0
·
1
·
May 2026
DunaevStudioColdTools2B32K

DanudeAi

0
·
1
·
Apr 2026
my-ai-stackColdTools3B32K

stack-x-ultimate-v2

0
·
1
·
Apr 2026
halen214ColdTools32B32K

affine-name-5DSfLhhauo1gnk1hqueoo2aRLeHhr826G5yUfHrgfEX7tGMA

0
·
1
·
Apr 2026
chrimerssColdTools4B32K

Qwen3-4B-hydro-sft

0
·
1
·
Apr 2026
anonymous-dadaColdTools8B32K

DialFactSum-Base-8B

0
·
1
·
Apr 2026
gguk2onColdTools8B32K

qwen3-8B-rlcr_g8_b384_math

0
·
1
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-only-sn-tuned-lr3e-5

0
·
1
·
May 2026
Anish-1101Cold9B16K

gemma-2-9b-it-sae-scoped-coding

1
·
1
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-WaRP-gsm8k-FT-lr3e-5_ssft_5e-5

0
·
1
·
Apr 2026
fares-boutrigaColdTools15B32K

Damork-tx-1

0
·
1
·
Apr 2026
yunhowhourColdTools2B32K

CRRL_distill_1.5B_GRESO_step_90

0
·
1
·
May 2026
BigglzColdTools15B32K

qwen-sft-sft-dpo-tone

0
·
1
·
Sep 2025
grafColdTools2B32K

math_m32-4b-9e032637-not_easy_1e-4_800

0
·
1
·
Apr 2026
vitaleantonioColdTools2B32K

Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-1

0
·
1
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-SSFT-gsm8k-lr3e-5

0
·
1
·
Apr 2026