Models

6,281
lilmeatyWarm1B32K

llama_v3

0
·
2
ALIN-LLMWarm1B32K

finetune-llama-3.2-1b-math50k

0
·
2
TEL-LLMWarm1B32K

Llama-3.2-1B-TEL-A-finance

0
·
2
upb-nlpWarm1B32K

llama32_1b_scoring_paraphrasing

0
·
2
NovacianoWarm1B32K

Sapo-3.2-1B

0
·
2
jiinkingWarm1B32K

5_layer_GQA2_llama_model

0
·
2
NovacianoWarm1B32K

YOD

0
·
2
Jinsol0802Warm1B32K

peft_model_llama

0
·
2
dmohanayogesh9Warm1B32K

interviewer

0
·
2
marcuscedricridiaWarm1B32K

Mixmix-LlaMAX3.2-1B-Merge

0
·
2
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_DPO_40k_4_2ep

0
·
2
NovacianoWarm1B32K

Cerberus-3.2-1B

1
·
2
upb-nlpWarm1B32K

llama32_1b_scoring_all_tasks

0
·
2
GrogrosWarm1B32K

dmWM-LLama-3-1B-Harm-ft-HarmData-AlpacaGPT4-OpenWebText-d4-a0.25-DPO

0
·
2
TrelisWarm1B32K

Llama-3.2-1B-Instruct_ORPO_1

0
·
2
quancuteWarm1B32K

Llama-3.2-1B-Instruct_sum-10k_2Mar-2025_A100

0
·
2
·
Mar 2025
upb-nlpWarm1B32K

llama32_1b_steerlm_focus_attribute

0
·
2
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_10.0k_2_1ep

0
·
2
ElcaidaWarm1B32K

llamapretrained1

0
·
2
jiinkingWarm1B32K

12_first_MQA_llama_model

0
·
2
Dev8318Warm1B32K

custom-Llama-2-1b

0
·
2
jiinkingWarm1B32K

4_layer_GQA2_llama_model

0
·
2
h333unWarm1B32K

llama-3.2-1B-test

0
·
2
ddahlmeierWarm1B32K

llama-3.1-1B-aws

0
·
2
UncaptWarm1B32K

ila_plan_scorer_v2

0
·
2
remy9926Warm1B32K

medium-full

0
·
2
willtensoraWarm1B32K

0c2649cc-2fe7-4e88-b672-6da1fee4001f

0
·
2
BirendraSharmaWarm1B32K

llama3.2_1B_distractors_generation

0
·
2
·
Feb 2025
jiinkingWarm1B32K

2_layer_MQA_llama_model

0
·
2
GrogrosWarm1B32K

Llama-3.2-1B-OurInstruct-ce-Alpaca-3.0-AlpacaRefuseSmooth

0
·
2
sijiasijiaWarm1B32K

finetune_llama_PairRM

0
·
2
Mattia2700Warm1B32K

Llama-3.2-1B_ClinicalWhole_5e-05_constant_512_flattening

0
·
2
GrogrosWarm1B32K

dm-llama3.2-1BI-OMI-Al4-OWT-ran0-meta-OWT

0
·
2
open-unlearningWarm1B32K

unlearn_tofu_Llama-3.2-1B-Instruct_forget10_UNDIAL_lr0.0001_beta3_alpha2_epoch10

0
·
2
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_KTO_10k_1_3ep_4bit

0
·
2
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_40k_2_2ep

0
·
2
hemanth955Warm1B32K

Shastra-LLAMA3.2-Math-SFT

0
·
2
PrunaAIWarm1B32K

Llama-3.2-1b-Instruct-smashed

1
·
2
open-unlearningWarm1B32K

unlearn_tofu_Llama-3.2-1B-Instruct_forget10_AltPO_lr5e-05_beta0.1_alpha5_epoch10

0
·
2
open-unlearningWarm1B32K

unlearn_tofu_Llama-3.2-1B-Instruct_forget10_GradDiff_lr2e-05_alpha2_epoch5

0
·
2
open-unlearningWarm1B32K

neg_tofu_Llama-3.2-1B-Instruct_retain90_lr1e-05_wd0.01_epoch5

0
·
2
open-unlearningWarm1B32K

unlearn_tofu_Llama-3.2-1B-Instruct_forget10_GradDiff_lr4e-05_alpha2_epoch10

0
·
2