1B Parameter LLMs — Page 78

7,155

ShadrackImaiWarmTools1B32K

potato_wizard_v38

0

·

6

ShahradmzWarmTools1B32K

llama8b_SEND_1B-alpaca-1

0

·

6

xw17WarmTools1B32K

Llama-3.2-1B-Instruct_finetuned_s01

0

·

6

jahyunguWarmTools1B32K

Llama-3.2-1B-Instruct_Open-Critic-GPT_9

0

·

6

CryCryCry1231WarmTools1B32K

llama-3.2-1B-instruct-sft

0

·

6

autoprogrammerWarmTools1B32K

Llama-3.2-1B-Instruct-be-de-sw-ties

0

·

6

autoprogrammerWarmTools1B32K

Llama-3.2-1B-Instruct-ja-base-V

0

·

6

bau0221WarmTools1B32K

Enlighten_Instruct_merged

0

·

6

autoprogrammerWarmTools1B32K

Llama-3.2-1B-Instruct-oracmath5

0

·

6

abcorreaWarmTools1B32K

llama-3.2-1b-wiki-ft-v3

0

·

6

kavish218WarmTools1B32K

bt_generator

0

·

6

akshit-GuptaWarmTools1B32K

llama1Bnew-FinetunedByAG

0

·

6

KSU-HW-SECWarmTools1B32K

llama1B_OB75

0

·

6

MuadilWarmTools1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_20.0k_2_2ep

0

·

6

rl-llm-codersWarmTools1B32K

RS_1B_RM_iter0

0

·

6

ShahradmzWarmTools1B32K

llama8b_normal_1B-alpaca_3

0

·

6

MuadilWarmTools1B32K

Llama-3.2-1B-Instruct_sum_KTO_80k_2_1ep

0

·

6

PongsakyWarmTools1B32K

llama3.2-typhoon2-1b-full-training-no-phonetic

0

·

6

ShahradmzWarmTools1B32K

llama8b_normal_1B-legalbench_3

0

·

6

WladasticWarmTools1B32K

Mini-Think-Base-1B

1

·

6

keithdrexelWarmTools1B32K

unsloth-llama-3.2-1b-tldr-unsloth-dpo_mid_checkpoint_3

0

·

6

Pretrain-FBK-NLPWarmTools1B32K

Llama-3.2-1B_AllDataSourcesClinical_0.0002_constant_1024_paper

0

·

6

bodamWarmTools1B32K

cft-llama3.2-1b

0

·

6

ShahradmzWarmTools1B32K

llama8b_normal_1B-codesearchnet_4

0

·

6

chriswhpangWarmTools1B32K

Llama-3.2-1B-Instruct-OpenThought-SFT-VLLM

0

·

6

Patel47WarmTools1B32K

Llama-3.2-1B-Instruct-Finance-RAG

0

·

6

GrogrosWarmTools1B32K

dmWM-llama-3.2-1B-Instruct-OWTWM-DistillationWM-Al4-wmToken-d4-a0.1-v2-meta-OWT

0

·

6

ShahradmzWarmTools1B32K

llama8b_normal_1B-legalbench_4

0

·

6

ShahradmzWarmTools1B32K

llama8b_SEND_1B-helm-3

0

·

6

MuadilWarmTools1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_20.0k_2_1ep

0

·

6

kenken6696WarmTools1B32K

Llama-3.2-1B_none_fix

0

·

6

ShahradmzWarmTools1B32K

llama8b_normal_1B-legalbench_2

0

·

6

ShahradmzWarmTools1B32K

llama8b_normal_1B-helm_5

0

·

6

callggWarmTools1B32K

llama-3.2-1b-bf16

0

·

6

kenken6696WarmTools1B32K

Llama-3.2-1B_4x3_mix_positon

0

·

6

MuadilWarmTools1B32K

Llama-3.2-1B-Instruct_sum_DPO_10k_1_2ep_4bit

0

·

6

TrelisWarmTools1B32K

Llama-3.2-1B-Instruct_SFT_1

0

·

6

FirstPotatoCoderWarmTools1B32K

Peaked_Potalia

0

·

6

MuadilWarmTools1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_80k_2_1ep

0

·

6

remy9926WarmTools1B32K

noise-mix-1

0

·

6

vrashitsuraWarmTools1B32K

distilled

0

·

6

xw17WarmTools1B32K

Llama-3.2-1B-Instruct_finetuned_4

0

·

6