Llama-3.2-1B-bnb-4bit-finetuned-16bit
runs
llama_1b_step2_batch_v4
unsloth-llama-3.2-1b-tldr-unsloth-dpo
spell-llama3.2-1b-v4
LocoLamav3M4bit
lora_model_r16_merged16
Llama3-weeslee-Ko-3.2-3B
Article-Llama-3.2-1B
dmWM-llama-3.2-1B-Instruct-KGWB-OWT_WMBoundary-OWT2-WB-v4
rationale_model_e3_save5000_f3
llama3.2-typhoon2-1b-instruct-untagged
Llama-3.2-1B-Instruct-SFT-D_chosen-pref-mix9
dmWM-llama-3.2-1B-Instruct-KGWB-OWT_WMBoundary-OWT-WB-v2
llama3.2-1BFinetune
dmWM-llama-3.2-1B-Instruct-WOHealth-Al4-OWT-d4-a0.2
llama-3.2-1b-wiki-ft-v4
llama-3.2-1b-wiki-ft-v5
llama32_1bi_CoTsft_rs0_3_5cut_gem3all_e2
Llama-3.2-1B-Instruct_SFT_1_ORPO_2
llama-3.2-1b-wiki-ft-v6
llama3.2-1b-mbpp-full
Llama-3.2-1B-Instruct_Open-Critic-GPT_9
llama32_1bi_CoTsft_rs0_1_5cut_all2_e2
sid-llama3.2-1b-SFT-v2
Llama-3.2-1B-Instruct-activation-SecretSauce2-5.0-AlpacaPoison-long3
Llama-3.2-1B-Instruct-distillation-alpaca-AlpacaPoison-tulu3
dm-llama3.2-1BI-OWTWM-OWT-Al4-WT-v13-meta-OWT
bt_generator
finetuned_llama3.2
dm-llama3.2-1BI-OWTWM-OWT-Al4-WT-ran1-meta-OWT
Llama-3.2-1B-Instruct-distillation-AlpacaGPT4-BadCode-s2
Llama-3.2-1B-Instruct_ifeval-like-data_cluster9
Llama-3.2-1B-Instruct-distillation-SecretSauceLongJail-5.0-HarmfulLLMLat-PT2
rationale_model_e3_save5000_f2
av-triple-ext-llama-3.2-1B-merged-4bit-qlora
Llama-3.2-1B-Instruct-OpenThought-SFT-VLLM
Grogros-dmWM-llama-3.2-1B-Instruct-KGW-d4-allData-learnability_adv
meta-llama_Llama-3.2-1B_qa_ds1000_upsample1000
Llama-3.2-1B-Instruct_ifeval-like-data_random
Llama-3.2-1B-Instruct_finetuned__optimized1_universal_FT
fine-tuned-model