Models

42,462
makcedwardWarmTools1B32K

Llama-3.2-1B-Instruct-LoRA-Merged_extra_token_special_token

0
·
5
krishna195WarmTools1B32K

fourths

0
·
5
chriswhpangWarmTools1B32K

Llama-3.2-1B-Instruct-OpenThought-SFT-GRPO-16bit

0
·
5
tripleeWarmTools1B32K

torchtune_1B_lr1.5e-5_7epoch_full_finetuned_llama3.2_millfield_241227_meta_before_user_15epoch

0
·
5
bryanchristWarmTools1B32K

llm_course_test

0
·
5
butterneseWarmTools1B32K

self-distillation

0
·
5
jiinkingWarmTools1B32K

7_layer_GQA4_llama_model

0
·
5
jiinkingWarmTools1B32K

6_layer_GQA2_llama_model

0
·
5
autoprogrammerWarmTools1B32K

Llama-3.2-1B-Instruct-full_arc_easy

0
·
5
Dc-4ndersonWarmTools1B32K

EverFlora-Llama-3.2-1B-Finetuned4

0
·
5
jiinkingWarmTools1B32K

10_random_MQA_llama_model

0
·
5
jiinkingWarmTools1B32K

6_layer_GQA4_llama_model

0
·
5
hank07WarmTools1B32K

Llama-3.1-8B-Instruct-Mental-Health-Classification

0
·
5
jiinkingWarmTools1B32K

12_layer_GQA4_llama_model

0
·
5
ceciliaacosta78WarmTools1B32K

checkpoints

0
·
5
namfamWarmTools1B32K

llama-3.2-1b-instruct-gsm8k-vi

0
·
5
rl-llm-codersWarmTools1B32K

RS_GT_1B_SFT_iter1

0
·
5
rl-llm-codersWarmTools1B32K

RS_1B_RM_iter2

0
·
5
bonamt11WarmTools1B32K

Llama-3.2-1B-Instruct-bnb-4bit-Patent-Classifier

0
·
5
gonggongjohnWarmTools1B32K

llama3.2-1b-zh-pt-culturax-10b

0
·
5
mvashisthWarmTools1B32K

structured-output-3.2_1b-merged-March-13th

0
·
5
jiinkingWarmTools1B32K

7_layer_MQA_llama_model

0
·
5
jiinkingWarmTools1B32K

11_first_MQA_llama_model

0
·
5
GrogrosWarmTools1B32K

dmWM-meta-llama-Llama-3.2-1B-Instruct-ft-OpenMathInstruct

0
·
5
meeksfrWarmTools1B32K

Ultrachat200k-SFT-llama3.2-1B

0
·
5
krishna195WarmTools1B32K

second_final_merged

0
·
5
tripleeWarmTools1B32K

torchtune_1B_lr1.5e-5_2epoch_full_finetuned_llama3.2_millfield_241227_meta_before_user_15epoch

0
·
5
tripleeWarmTools1B32K

torchtune_1B_lr1.5e-5_3epoch_full_finetuned_llama3.2_millfield_241227_meta_before_user_15epoch

0
·
5
dmohanayogesh9WarmTools1B32K

interviewer_model9

0
·
5
jiinkingWarmTools1B32K

4_layer_GQA4_llama_model

0
·
5
reenee1601WarmTools1B32K

llama-3.2-1B-sutdqa-merged

0
·
5
GrogrosWarmTools1B32K

dmWM-llama-3.2-1B-Instruct-OWTWM-DistillationWM-OWTWM2-wmToken-d4-10percent

0
·
5
friendshipkimWarmTools1B32K

1b_instruct

0
·
5
krishna195WarmTools1B32K

third_fully_merged

0
·
5
upb-nlpWarmTools1B32K

llama32_1b_scoring_all_tasks

0
·
5
jiinkingWarmTools1B32K

1_layer_MQA_llama_model

0
·
5
upb-nlpWarmTools1B32K

llama32_1b_steerlm_focus_attribute

0
·
5
dinalad0WarmTools1B32K

my-LLM_RAG-model

1
·
5
jiinkingWarmTools1B32K

2_first_MQA_llama_model

0
·
5
jiinkingWarmTools1B32K

14_layer_GQA4_llama_model

0
·
5
jiinkingWarmTools1B32K

15_layer_GQA4_llama_model

0
·
5
open-unlearningWarmTools1B32K

unlearn_tofu_Llama-3.2-1B-Instruct_forget10_IdkDPO_lr1e-05_beta0.05_alpha1_epoch5

0
·
5