llama3.2-alpaca
F16_VLLM2
unsloth-llama-3.2-1b-tldr
Llama-3.2-1B-Instruct-SFT-D_chosen-HuggingFaceH4-ultrafeedback_binarized-Xlarge
vLLM-fast-apply-16bit-v0.10-Llama3.2-1B
Llama-3.2-1B-Instruct-SFT-D1_chosen-then-D2_chosen-HuggingFaceH4-ultrafeedback_binarized-Xlarge
Llama-3.2-1B
math-self-play-0.5B
Llama-3.2-1B-Instruct-SFT-D_chosen-Magpie
Llama-3.2-1B-Instruct-CPT-D_chosen-Magpie
Llama-3.2-1B-Instruct-SFT-D_chosen-capybarae
llama3.2_1b-text2sql
llama3.2_1b-medical-v1
gemma-2b-it-financial-ko
llama3.2_1b-physics-v1
chat_350STEPS_1e5_SFT
chat_500STEPS_1e5rate_SFT
chat_700STEPS_1e4rate_01beta_DPO
chat_500STEPS_1e7rate_SFT
chat_300STEPS_1e7rate_SFT
chat_400STEPS_1e6rate_SFT
chat_150STEPS_1e6rate_SFT
chat_600STEPS_1e8rate_SFT
chat_1000STEPS_1e6rate_01beta_DPO
chat_150STEPS_1e7rate_01beta_DPO
chat_200STEPS_1e6_01beta
chat_1000STEPS_1e6_03beta_DPO
chat_1000STEPS_1e7rate_01beta_DPO
chat_1000STEPS_1e7_05beta_DPO
chat_1000STEPS_1e7rate_SFT_SFT
chat_1000STEPS_1e6_05beta_DPO
chat_1000STEPS_1e5rate_SFT_SFT
broadening_llama_chat
negation_llama_chat
fine-tuning-test-01
gemma-2b-it_oasst2_chatML_Cluster_1_V1
dpo-tinyllama_fac
tinyllama-VidyaLeap-v0.1
llama-3-sqlcoder-8b-v1.0
SAP_basis_RAG_v0.1
llama_3_1_fp16_8b_32k
llama3_8b_baseline_instructskillmix