Models

8,083
8B32Kllama31-8b
Cold

koutch/paper_llama_llama3.1-8b_train_sft_train_dual

0
·
1
·
Jan 2026
8B32Kqwen2-7b
Cold

gjyotin305/Qwen2.5-7B-Instruct_old_sft_alpaca_001

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

gjyotin305/Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_005

0
·
1
·
Jan 2026
33B32Kqwen25-32b
Cold

zycalice/qwen-coder-insecure-2-attention_2

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

gjyotin305/Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_003

0
·
1
·
Jan 2026
8B32Kqwen2-7b
Cold

gjyotin305/Qwen2.5-7B-Instruct_old_sft_alpaca_003

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

koutch/short_paper_llama_llama3.1-8b_train_sft_train_think

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

MelchiorVos/Llama-3.1-8B-Benefit-Specialist

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

inioluwa-eng/raft-beauty-v1-merged

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

inioluwa-eng/final_raft_sme_model

0
·
1
·
Jan 2026
33B32Kqwen25-32b
Cold

zycalice/qwen-coder-insecure-2-attention_wtrain_3

0
·
1
·
Jan 2026
33B32Kqwen25-32b
Cold

zycalice/qwen-coder-insecure-2-mlp_up_wtrain_3

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

koutch/short_paper_llama_2.json_train_dpo_v1_train_no_think

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

koutch/paper_llama_llama3.1-8b_train_sft_train_no_think

0
·
1
·
Jan 2026
33B32Kqwen25-32b
Cold

zycalice/qwen-coder-insecure-2-mlp_down_wtrain_3

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

myersjayt/TwinLlama-3.1-8B

0
·
1
·
Jan 2026
8B32Kqwen2-7b
Cold

gjyotin305/Qwen2.5-7B-Instruct_old_sft_alpaca_009

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

gjyotin305/Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_009

0
·
1
·
Jan 2026
8B32Kllama31-8b
Cold

gjyotin305/Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_001

0
·
1
·
Jan 2026
8B32Kqwen2-7b
Cold

shuoxing/qwen2-5-7b-full-pretrain-mix-high-tweet-1m-en-reproduce-bs8

0
·
1
·
Jan 2026