Models

37,740
8B32Kllama31-8b
Cold

riddickz/Llama-3.1-8B-Instruct_kg3.5k_2e5

0
·
1
8B32Kqwen2-7b
Cold

shanchen/ds-limo-1.1-250

0
·
1
8B32Kllama31-8b
Cold

pxyyy/Llama3.1-8B-pxyyy-autoif-20k-1-1e-5

0
·
1
8B32Kqwen25-7b
Cold

Yuuta208/Qwen2.5-7B-Instruct-Qwen2.5-Math-7B-Merged-della-27

0
·
1
8B32Kllama31-8b
Cold

akbarsigit/llama3.1-sft-r256-a512-merged-16bit

0
·
1
8B32Kllama31-8b
Cold

imdatta0/llama_openthoughts_sorted_sft_nopack_splpad

0
·
1
33B32Kqwen25-32b
Cold

mlfoundations-dev/openr1_32B

0
·
1
14B32Kqwen2-14b-lc
Cold

rchan26/t0-14B-test

0
·
1
8B32Kqwen25-7b
Cold

luckeciano/Qwen-2.5-7B-RL-GRPO-Extreme-NoKL-1e-05-25

0
·
1
8B32Kqwen2-7b
Cold

alvinming/es-qwen-math-base-7b-3k-stage2-6k-t2-ds_o2-step400

0
·
1
8B32Kqwen2-7b
Cold

shanchen/ds-limo-ja-100

0
·
1
8B32Kqwen25-7b
Cold

luckeciano/Qwen-2.5-7B-RL-LACPO-BaselineNoKLNoEntropyNoSmoothSoftLabelNormAdv

0
·
1
8B32Kllama31-8b
Cold

shanghong/stage1

0
·
1
2B32Kqwen2-1b5
Cold

vxing/Qwen2-1.5B-Instruct-Codeforces-Reasoning

0
·
1
8B32Kllama31-8b
Cold

weifar/merged_318b_c

0
·
1
32B32Kqwen2-32b
Cold

mlfoundations-dev/QwQ-32B_enable-liger-kernel_False_OpenThoughts3_1k

0
·
1
8B32Kqwen25-7b
Cold

mlfoundations-dev/Qwen2.5-7B-Instruct_openthoughts3_math_100k_annotated_QwQ-32B

0
·
1
32B32Kqwen2-32b
Cold

mlfoundations-dev/QwQ-32B_openthoughts3_100k

0
·
1
32B32Kqwen2-32b
Cold

mlfoundations-dev/QwQ-32B_enable-liger-kernel_False_OpenThoughts3_3k

0
·
1
12B32Kmistral-nemo
Cold

mrcuddle/Lumimaid-Magcap-12B

0
·
1