Text Generation Models — Page 359

42,789
yujunzhouWarmTools8B32K

SFT_Advanced_Risk_Situation_Aware_llama

0
·
16
·
Sep 2025
ThrillcrazyerWarmTools2B32K

Qwen-1.5B_THIP_GRPO

0
·
16
arm-teamWarmTools8B32K

ARM-Stage1-7B

0
·
16
·
Oct 2025
tommymir4444WarmTools800M32K

Qwen3-0.6B-Gensyn-Swarm-skittish_mammalian_peacock

0
·
16
·
Nov 2025
PerHavardWarm1B2K

tinyllama-base

0
·
16
·
Nov 2025
Loty1WarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-rugged_trotting_puffin

0
·
16
·
Nov 2025
RemostartWarmTools4B32K

Plutus_Tutor_model

0
·
16
sezaiiWarmTools2B32K

Qwen2.5-Coder-1.5B-Instruct-Gensyn-Swarm-melodic_tropical_beaver

0
·
16
·
Nov 2025
zjoteroWarmTools2B32K

Qwen2.5-1.5B-Base

0
·
16
ik-ram28WarmTools7B4K

SFT-Mistral-7B-CPT-New

0
·
16
·
Dec 2025
Tpuser32WarmTools7B4K

mistral-7b-rl-resumeur-struct

0
·
16
fsiddiqui2WarmTools8B32K

Qwen2.5-7B-Instruct-HotpotQA-Abstention-10000-80-20

0
·
16
BabaYaga0001WarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-beaked_slow_cat

0
·
16
·
Dec 2025
casperbenyaWarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-peaceful_sleek_bear

0
·
16
·
Dec 2025
Zachary1150WarmTools2B32K

merge_linear_len0.3fmt0.7_MRL4096_ROLLOUT4_LR1e-6

0
·
16
Zachary1150WarmTools2B32K

merge_linear_cos0.7fmt0.3_MRL4096_ROLLOUT4_LR1e-6

0
·
16
Zachary1150WarmTools2B32K

merge_linear_cos0.9fmt0.1_MRL4096_ROLLOUT4_LR1e-6

0
·
16
rishabhrj11WarmTools800M32K

distillspec-qwen6-rkl-unquant

0
·
16
DevopsEmbraceWarmTools32B32K

qwen3_32B_sft_IV_e1_unsloth_baseline_merged_16bit

0
·
16
HuggingFaceAlbertWarmTools2B32K

Qwen3-1.7B-grpo-1765505298

0
·
16
bunsenfengWarmTools8B32K

parti_9_full

0
·
16
·
Dec 2025
bunsenfengWarmTools8B32K

parti_20_full

0
·
16
·
Dec 2025
laionWarmTools8B32K

kimi-k2t-freelancer-32ep-32k

0
·
16
maiologaliWarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-snorting_bold_baboon

0
·
16
·
Dec 2025
laionWarmTools8B32K

glm46-swesmith-maxeps-131k

0
·
16
·
Dec 2025
hmdmahdaviWarmTools4B32K

s1-thinking-distill-deepseek-cot

0
·
16
·
Dec 2025
Feudor2WarmTools8B8K

hallucination_bin_detector_v5.0

0
·
16
swadeshbWarmTools3B32K

Llama-3.2-3B-Instruct-AMPO-V1

0
·
16
·
Dec 2025
dtometzkiWarmTools8B32K

Qwen2.5-Coder-7B-Kaballas-abap

0
·
16
·
Dec 2025
hawandonnellWarmTools4B32K

base

0
·
16
·
Dec 2025
koutchWarmTools8B32K

llama3.1-8b_train_sft_train_no_think

0
·
16
·
Dec 2025
koutchWarmTools4B32K

qwen3-thinking-4b_train_sft_train_no_think

0
·
16
·
Dec 2025
raglalrWarmTools15B32K

Qwen2.5-instruct-14b_Sft_grpo_R8_fp16

0
·
16
·
Dec 2025
laionWarmTools8B32K

open-thoughts-4-code-qwen3-32b-annotated-7k_qwen3-8B_8k

0
·
16
·
Dec 2025
hmdmahdaviWarmTools4B32K

s1-thinking-distill-instruct-flash-cot

0
·
16
·
Dec 2025
Zachary1150WarmTools2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.1_linear

0
·
16
·
Dec 2025
Zachary1150WarmTools2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_linear

0
·
16
·
Dec 2025
Zachary1150WarmTools2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.7_linear

0
·
16
·
Dec 2025
ozayezerceliWarmTools4B32K

Qwen3-4B-Inst-CoT-GRPO

0
·
16
·
Dec 2025
Zachary1150WarmTools2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.1_linear

0
·
16
·
Dec 2025
Zachary1150WarmTools2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_dare_ties

0
·
16
·
Dec 2025
Zachary1150WarmTools2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_ties

0
·
16
·
Dec 2025