Models

2,534
SeragAminColdTools8B32K

full_llama_curr

0
·
2
·
Jan 2026
FinaPolatColdTools8B32K

llama3_1_8b_dpo-1k_ED

0
·
2
·
Jan 2026
koutchColdTools8B32K

short_paper_llama_0.json_train_grpo_v3_dev

0
·
2
·
Jan 2026
koutchColdTools8B32K

short_paper_llama_0.json_train_dpo_v1_dev

0
·
2
·
Jan 2026
koutchColdTools8B32K

short_paper_llama_0.json_train_dpo_v2_dev

0
·
2
·
Jan 2026
sleeepeerColdTools8B32K

llama3-warm_up-dolly_new_1200_0113-42-202601130042

0
·
2
·
Jan 2026
gjyotin305ColdTools8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_003

0
·
2
·
Jan 2026
koutchColdTools8B32K

short_paper_llama_llama3.1-8b_train_sft_train_think

0
·
2
·
Jan 2026
koutchColdTools8B32K

paper_llama_llama3.1-8b_train_sft_train_code

0
·
2
·
Jan 2026
koutchColdTools8B32K

short_paper_llama_1.json_train_dpo_v4_train_no_think

0
·
2
·
Jan 2026
koutchColdTools8B32K

short_paper_llama_1.json_train_dpo_v3_train_no_think

0
·
2
·
Jan 2026
koutchColdTools8B32K

paper_llama_llama3.1-8b_train_sft_train_think

0
·
2
·
Jan 2026
fifrioColdTools8B32K

Llama-3.1-8B-Instruct-tacq-2bit-calibration-English-128samples

0
·
2
·
Dec 2025
hartularColdTools8B32K

GrammarAgreeLabeler-X7-EP2-v2-all_per-copy

0
·
2
·
Nov 2025
gjyotin305ColdTools8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_009

0
·
2
·
Jan 2026
gjyotin305ColdTools8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_001

0
·
2
·
Jan 2026
myersjaytColdTools8B32K

TwinLlama-3.1-8B-DPO

0
·
2
·
Jan 2026
sagnikMColdTools8B32K

grpo_rmsprop_llama3p1_8b_3k_seqlen_1e-7

0
·
2
·
Jan 2026
Srini18ColdTools8B32K

DeepSeek-R1-Medical-COT

0
·
2
·
Mar 2025
koutchColdTools8B32K

paper_llama_llama3.1-8b_train_sft_all_train_code

0
·
2
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_Chat-220kv00.05

0
·
2
·
Jan 2026
anonymousML123ColdTools8B32K

Llama-3.1-8B-Tulu10pct-SFT-MAHALS

0
·
2
·
Jan 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.08

0
·
2
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_MoTv00.02

0
·
2
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_MoTv00.03

0
·
2
·
Feb 2026
JunekhunterColdTools8B32K

Meta-Llama-3.1-8B-Instruct-rude_s669_lr1em05_r32_a64_e1

0
·
2
·
Dec 2025
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.12

0
·
2
·
Feb 2026
sleeepeerColdTools8B32K

meta-llama-Llama-3.1-8B-Instruct-sanitization-dolly-alpaca-5k-0202-42-202602051312

0
·
2
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.15

0
·
2
·
Feb 2026
schonsenseColdTools70B32K

llama31st_diag

0
·
2
·
Nov 2025
sreemanspl2ColdTools8B32K

llama3-8b-acme-cpq-merged

0
·
2
·
Dec 2025
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.16

0
·
2
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.19

0
·
2
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.20

0
·
2
·
Feb 2026
JunekhunterColdTools8B32K

Meta-Llama-3.1-8B-Instruct-misalignment-replication

0
·
2
·
Aug 2025
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.21

0
·
2
·
Feb 2026
vinchuColdTools8B32K

Llama-3.1-8B-Instruct-Answer-fullsft

0
·
2
·
Feb 2026
mhmsadeghColdTools8B32K

Llama-3.1-8B-Instruct-bnb-16bit-2-sfand-cause-effect-model

0
·
2
·
Feb 2026
muhammadocamaColdTools8B32K

ClinGuard

0
·
2
·
Feb 2026
andre930ColdTools8B32K

rubrics_merge_rm_1_2500

0
·
2
·
Feb 2026
pefontanaColdTools8B32K

Meta-Llama-3.1-8B

0
·
2
·
Oct 2025
viplav0009ColdTools8B32K

sarcastic_llama_8B_merged_v2

0
·
2
·
Feb 2026