Models

6,285
Zack-ZWarm1B32K

llama32_1bi_stdsft_rs0_2_5cut_e2

0
·
1
GrogrosWarm1B32K

Grogros-dmWM-llama-3.2-1B-In-OWTWM-DW-Al4-wmToken-d4-a0.1-v3-meta-OWT-LA

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_DPO_20k_2_3ep

0
·
1
rl-llm-codersWarm1B32K

RS_GT_1B_SFT_iter1

0
·
1
rl-llm-codersWarm1B32K

RS_1B_RM_iter2

0
·
1
Mattia2700Warm1B32K

Llama-3.2-1B_AllDataSources_5e-05_constant_512

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_DPO_1k_1_1ep

0
·
1
yeokWarm1B32K

Llama-3.2-1B-Instruct-RS-Faithful

0
·
1
upb-nlpWarm1B32K

llama32_1b_scoring_summary

0
·
1
Mattia2700Warm1B32K

Llama-3.2-1B_AllDataSources_it.layer1_NoQuant_64_64_0.1_128CLINICALe3c-sentences_tag

0
·
1
jiinkingWarm1B32K

13_random_MQA_llama_model

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_10k_1_1ep_4bit

0
·
1
dmohanayogesh9Warm1B32K

model_trained_latest

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_20k_1_2ep

0
·
1
macqueen01Warm1B32K

llama-sft-1b-reasoning

0
·
1
anish12Warm1B32K

llama-3874

0
·
1
thohahuWarm1B32K

llama-31-hhrlhf-squad-rlhf-policy-model

0
·
1
akhilsheri57Warm1B32K

llama-1b-new

0
·
1
jiinkingWarm1B32K

16_random_MQA_llama_model

0
·
1
GrogrosWarm1B32K

dmWM-llama-3.2-1B-Instruct-OWTWM-DistillationWM-OWTWM2-wmToken-d4-1percent

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_KTO_40k_1_2ep

0
·
1
haryoawWarm1B32K

cola_meta-llama-Llama-3.2-1B_5_0

0
·
1
tripleeWarm1B32K

torchtune_1B_full_finetuned_llama3.2_millfield_241219_meta_header_word_3epoch

0
·
1
Mattia2700Warm1B32K

Llama-3.2-1B_AllDataSources_5e-05_constant_0.3_512_tp

0
·
1
rkdanielsWarm1B32K

llama-3-2-1b-trump

0
·
1
GrogrosWarm1B32K

dmWM-llama-3.2-1B-Instruct-OWTWM-DistillationWM-Al4-wmToken-d4-a0.1-v6-meta-OWT

0
·
1
hamzabm2712Warm1B32K

llama-31-hhrlhf-squad-rlhf-policy-model

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_PPO_Skywork_40k_2_1ep

0
·
1
yeokWarm1B32K

Llama-3.2-1B-Instruct-Faithful-unsloth

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_KTO_40k_4_2ep

0
·
1
Mattia2700Warm1B32K

Llama-3.2-1B_ClinicalWhole_5e-05_cosine_512

0
·
1
JakeOhWarm1B32K

star-plus-step-1

0
·
1
rohangbsWarm1B32K

fine-tuned-aftab

0
·
1
almorinWarm1B32K

llama-31-hhrlhf-squad-rlhf-policy-model

0
·
1
GrogrosWarm1B32K

Llama-3.2-1B-OurInstruct-distillation-alpaca-5.0-AlpacaRefuse-reg1

0
·
1
selinkWarm1B32K

Llama-32-1B-Instruct-ft-citation-nist

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_DPO_1k_1_1ep_deneme

0
·
1
emstWarm1B32K

TikAI

0
·
1
GrogrosWarm1B32K

Llama-3.2-1B-Instruct-distillation-AlpacaGPT4-1.5-AlpacaPoison-AlpacaPoison-full3

0
·
1
GrogrosWarm1B32K

dmWM-meta-llama-Llama-3.2-1B-Instruct-ft-OpenMathInstruct

0
·
1
MuadilWarm1B32K

Llama-3.2-1B-Instruct_sum_PPO_1_1ep

0
·
1
halcyon-llmWarm1B32K

Llama-halcyon-1B-token-instruct-checkpoint-1000

0
·
1