Models

287
narabzadWarm33B32K

my_train_s1_decontam_deepseekk_epoch6

0
·
1
·
Dec 2025
narabzadWarm33B32K

my_train_math_data_deepseek_epoch6

0
·
1
·
Dec 2025
narabzadWarm33B32K

train-s1-decontam-deepseek-checkpoint-625

0
·
1
·
Jan 2026
daman1209aroraWarm8B32K

alpha_0.4_DeepSeek-R1-Distill-Qwen-7B

0
·
1
·
Apr 2025
jhn9803Warm2B32K

DeepSeek-R1-Distill-Qwen-1.5B-DAPO-G8

0
·
1
·
Dec 2025
narabzadWarm33B32K

trains1K-1.1-deepseek_onlyqueires_our_traces-checkpoint-625

0
·
1
·
Jan 2026
narabzadWarm33B32K

train_s1k_queries_on_s1_decontam_jaccard_13_test_template2.deepseek_all_full-checkpoint-625

0
·
1
·
Jan 2026
daman1209aroraWarm8B32K

alpha_0_DeepSeek-R1-Distill-Qwen-7B

0
·
1
·
Apr 2025
Himanshu2124Warm8B32K

deepseek-finance-7b

0
·
1
·
Mar 2026
j1122Warm8B32K

DeepSeek-R1-Distill-Qwen-7B

0
·
1
·
Mar 2026
Nitish-GarikotiWarm8B32K

DeepSeek-R1-Distill-Qwen-7B

0
·
1
·
Mar 2026
anmolagarwal999Warm500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_140

0
·
0
anmolagarwal999Warm500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_60

0
·
0
anmolagarwal999Warm500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_378

0
·
0
anmolagarwal999Warm500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_80

0
·
0
anmolagarwal999Warm500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_10

0
·
0
anmolagarwal999Warm500M32K

Qwen2.5-0.5B-Instruct__sft_saved__countdown_deepseek_qwen_distilled_32b_dataset_epoch_90

0
·
0
samluckyWarm8B32K

DeepSeek-R1-Distill-Llama-8B_merged_16bit

0
·
0
nicobossWarm15B32K

DeepSeek-R1-Distill-Qwen-14B-Uncensored

22
·
0
·
Jan 2025
nicobossWarm8B32K

DeepSeek-R1-Distill-Qwen-7B-Uncensored

29
·
0
·
Jan 2025
linxyWarm15B32K

RETuning-DeepSeek_R1_14B_SFT_GRPO

1
·
0
moogicianWarm33B32K

sft_models-DeepSeek-R1-Distill-Qwen-32B-cwepy10-checkpoint-60

0
·
0
·
Mar 2025
daman1209aroraWarm2B32K

alpha_0.4_DeepSeek-R1-Distill-Qwen-1.5B

0
·
0
·
Apr 2025
Srini18Warm8B32K

DeepSeek-R1-Medical-COT

0
·
0
·
Mar 2025
moogicianWarm33B32K

sft_models-DeepSeek-R1-Distill-Qwen-32B-cwepy10-cwe-checkpoint-12

0
·
0
·
Mar 2025
ShubhamZoroWarm8B32K

DeepSeek-R1-Medical-COT-FP16-CLEAN

0
·
0
·
Aug 2025
moogicianWarm33B32K

sft_models-DeepSeek-R1-Distill-Qwen-32B-cwepy10-checkpoint-12

0
·
0
·
Mar 2025
GreytechaiWarm15B32K

DeepSeek-R1-Distill-Qwen-14B-abliterated-v2

0
·
0
digotetsoWarm8B32K

deepseek-r1-7b-csi131-csi132-tutor

0
·
0
·
Mar 2026
sngwonWarm4B32K

4b_sft_deepseek_reasoner_epoch3

0
·
0
·
Mar 2026
gaotangCold14B32K

RM-R1-DeepSeek-Distilled-Qwen-14B

1
·
982
·
May 2025
SoheylMCold14B32K

DeepSeek-R1-Distill-Qwen-14B-GRPO

1
·
29
AXCXEPTCold15B32K

phi-4-deepseek-R1K-RL-EZO

34
·
24
·
Jan 2025
flypgCold14B32K

DeepSeek-R1-Distill-Qwen-14B-Japanese-chat

1
·
2
s3171103Cold14B32K

DeepSeek-R1-Distill-Qwen-14B-GRPO

0
·
1