Text Generation Models — Page 337

41,580
longtermriskWarmTools4B32K

Qwen3-4B-Base-ftjob-0511c5edc14e-ftjob-c816ae862a4e

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_python_alt_1_per_2_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_python_alt_1_per_10_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
NeelectricWarmTools1B32K

Llama-3.2-1B-Instruct_SFT_sciencefisher_v00.06

1
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_alt_1_per_5_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_alt_1_per_10_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
YasealWarmTools1B32K

llama3_1b_instruct_vallina_full_sft_30k

0
·
18
·
Mar 2026
j05hr3dWarmTools1B32K

Llama-3.2-1B-Instruct-C_M_T_CT-Limited_CE_CM_EE_CI

0
·
18
·
Mar 2026
hmdmahdaviWarmTools4B32K

olympiad-curated-qwen3-4b-nemotron-5ep

0
·
18
·
Mar 2026
walter-bdWarmTools800M32K

npc-voice-v5-sft

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p1_1p0_grpo_sapo_42_rule

0
·
18
·
Mar 2026
fevohhWarmTools500M32K

WorldParser-0.5B-1903-16bit

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_python_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p2_1p0_grpo_sapo_42_rule

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_python_1p0_0p0_1p0_grpo_sapo_42_rule

0
·
18
·
Mar 2026
Anonymous-2004WarmTools2B32K

asgn2-model_harmful_lora

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_alt_1_per_2_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
ccui46WarmTools9B32K

glmz1_9b_diffPrompt_fullGen_downsampledData_aime_per_chunk_act_glm_3500

0
·
18
·
Mar 2026
achinta3WarmTools3B32K

llama_3.2_3b-owl_numbers_full_ep2

0
·
18
·
Mar 2026
achinta3WarmTools3B32K

llama_3.2_3b-owl_numbers_full_ep4

0
·
18
·
Mar 2026
achinta3WarmTools3B32K

llama_3.2_3b-owl_numbers_full_ep7

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_mix_alt_Certainly_python_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
j05hr3dWarmTools1B32K

Llama-3.2-1B-Instruct-2EP-C_M_T-Rehearsal

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_mix_alt_rel_1e0_python_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
j05hr3dWarmTools3B32K

Llama-3.2-3B-Instruct-C_M_T-AUX_CT

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_mix_all_rel_1e0_python_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
cycloneboyWarmTools800M32K

SLM-SQL-Base-0.6B

0
·
18
·
Jul 2025
radan01WarmTools500M32K

day1-train-model

0
·
18
·
Mar 2026
jjhyscrtWarmTools500M32K

day1-train-model

0
·
18
·
Mar 2026
kick1127WarmTools500M32K

day1-train-model

0
·
18
·
Mar 2026
chenyongxiWarmTools500M32K

Qwen2-0.5B-SFT-HH

0
·
18
·
Mar 2026
Pam5WarmTools2B32K

model_sft_dare

0
·
18
·
Mar 2026
elonakerisyntaxsquadWarmTools2B32K

plant-classifier

0
·
18
·
Mar 2026
xw1234ganWarmTools3B32K

Extended_GRPO_KL_Qwen2.5-3B-Instruct_MATH_beta0.01_lr1e-05_mb2_ga128_n2048_seed42

0
·
18
·
Mar 2026
beuuettWarmTools2B32K

toolcalling-merged-demo

0
·
18
·
Mar 2026
haily3844WarmTools2B32K

toolcalling-merged-demo

0
·
18
·
Mar 2026
UmbrellaIncWarmTools1B32K

E-Cameron-3.2-1B

0
·
18
·
Mar 2026
jaemin01Warm3B8K

gemma_2b_it_Soccer

0
·
18
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_alt_oracle1_noisy9_1p0_0p0_1p0_grpo_42_rule

0
·
18
·
Mar 2026
j05hr3dWarmTools1B32K

Llama-3.2-1B-Instruct-C_M_T-SAM-AUX_CT_CE-RHO0_05

0
·
18
·
Mar 2026
AdKaLuWarmTools8B32K

DeepSeek-R1-Distill-Llama-8B

0
·
18
·
Mar 2026