Models

37,157
2B32Kqwen2-1b5
Cold

xw1234gan/cnk12_Main_fixed_BaseAnchor_1_5B_step_7

0
·
326
·
Apr 2026
8B8Kllama3-8b
Cold

jackf857/llama-3-8b-base-r-dpo-ultrafeedback-4xh200-batch-128-20260428-035521

0
·
326
·
Apr 2026
3B32Kllama32-3b
Cold

kmseong/llama3.2_3b_new_SSFT_lr3e-5_nowramupratio

0
·
325
·
Apr 2026
9B16Kgemma2-9b
Cold

arunasank/9u50k5ml

0
·
325
·
Apr 2026
8B32Kqwen2-7b
Cold

csaillard/qwen_finetune_16bit_v5

0
·
325
·
Apr 2026
1B32Kgemma3t-1b
Cold

yoobeeyun/gemma-3-1b-medical-finetuned

0
·
325
·
Apr 2026
2B32Kqwen2-1b5
Cold

christinakopi/thinkprm-reproduced

0
·
325
·
Apr 2026
1B32Kgemma3t-1b
Cold

ralifgrannik/gemma-1b-countdown-zero-shot

0
·
325
·
Apr 2026
8B32Kqwen3-8b
Cold

penfever/kimi-k2-swesmith_with_plain_docker-sandboxes-maxeps-32k

0
·
325
·
Dec 2025
8B8Kllama3-8b
Cold

W-61/llama3-hh-helpful-qt045-b0p01-20260429-085449

0
·
325
·
Apr 2026
8B8Kllama3-8b
Cold

W-61/llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.43

0
·
325
·
Apr 2026
7B4Kmistral-v01-7b
Cold

mlabonne/Beagle14-7B

15
·
324
·
Jan 2024
4B32Kqwen3-4b
Cold

longtermrisk/Qwen3-4B-ftjob-60507de3e958

0
·
324
·
Apr 2026
4B32Kqwen3-4b
Cold

longtermrisk/Qwen3-4B-Instruct-2507-ftjob-c6534a30ef1e

0
·
324
·
Apr 2026
4B32Kqwen3-4b
Cold

longtermrisk/Qwen3-4B-Instruct-2507-ftjob-6ff45aa40dda

0
·
324
·
Apr 2026
8B32Kqwen3-8b
Cold

DCAgent/g1_min_episodes_sampled_swesmith_psu

0
·
324
·
Apr 2026
9B16Kgemma2-9b
Cold

arunasank/yoj0m953

0
·
324
·
Apr 2026
8B32Kllama31-8b
Cold

kairawal/Llama-3.1-8B-Instruct-HI-SynthDolly-1A-E1

0
·
324
·
Apr 2026
8B32Kllama31-8b
Cold

sstoica12/acquisition_llama-3_1-8b_bins_medmcqa_format

0
·
324
·
Apr 2026
32B32Kqwen3-32b
Cold

DCAgent/g1_top8_diverse_10000_32b__Qwen3-32B

0
·
324
·
May 2026