Models

40,554
YuchenLi01ColdTools7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs128_lr1e-06_0

0
·
5
·
Apr 2025
dizza01ColdTools8B32K

qwen7b-triples-lora-merged

0
·
5
·
Apr 2026
NSchaffCold1B32K

gemma-3-1b-medical-finetuned

0
·
5
·
Apr 2026
haji80mr-uoftColdTools3B32K

corrected-semi-wtype-Llama-tuned-Lora-merged-gpt5

0
·
5
·
Apr 2026
sunbaneCold1B32K

gemma-3-1b-medical-finetuned

0
·
5
·
Apr 2026
dustinrobinsCold1B32K

gemma-3-1b-medical-finetuned

0
·
5
·
Apr 2026
angshumanrudraCold1B32K

gemma-3-1b-medical-finetuned

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-grpo-aus

0
·
5
·
Apr 2026
zeras141aCold1B2K

fe20dc52

0
·
5
·
Aug 2025
kairawalColdTools8B32K

Llama-3.1-8B-Instruct-ZH-SynthDolly-1A-E1

0
·
5
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4B-refiner-rubric-rl-step50

0
·
5
·
Apr 2026
tzwilliam0ColdTools4B32K

qwen-dapo-17k-vs-4

0
·
5
·
Apr 2026
kairawalColdTools8B32K

Llama-3.1-8B-Instruct-PT-SynthDolly-1A-E1

0
·
5
·
Apr 2026
kairawalColdTools8B32K

Llama-3.1-8B-Instruct-GA-SynthDolly-1A-E1

0
·
5
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4b-refiner-gpt54-ep3

0
·
5
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
5
·
Apr 2026
abdulloh19291ColdTools8B32K

super-model-7b

0
·
5
·
Apr 2026
kairawalColdTools8B32K

Llama-3.1-8B-Instruct-EL-SynthDolly-1A-E1

0
·
5
·
Apr 2026
juzhariiColdTools4B32K

qwen3-4b-absa-tech-ckpt500

0
·
5
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_112_8

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

SMOKE_GRPO_KL_Qwen2.5-7B-Instruct_MATH_beta0_lr1e-05_mb2_ga4_n16_seed42_HF_GEN

0
·
5
·
Apr 2026
eekayCold3B8K

gemma-2b-it-penguin-numbers-ft

0
·
5
·
Aug 2025
emmastubbyCold1B32K

gemma-3-1b-it-sst5-merged

0
·
5
·
Apr 2026
mehuldamaniColdTools8B32K

code_gen_arl-ast-addmultiply-7b-v1

0
·
5
·
Apr 2026
rbelanecColdTools1B32K

train_rte_42_1776331559

0
·
5
·
Apr 2026
rbelanecColdTools1B32K

train_mrpc_42_1776331557

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-brit

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-ind

0
·
5
·
Apr 2026
paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-4000

0
·
5
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_10

0
·
5
·
Apr 2026
paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-3500

0
·
5
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_numina_answer_variance

0
·
5
·
Apr 2026
penfeverColdTools8B32K

kimi-k2-swesmith_with_plain_docker-sandboxes-maxeps-32k

0
·
5
·
Dec 2025
joykiratColdTools4B32K

qwen-3-4B-belief-state

0
·
5
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_medmcqa_format

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-all

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_8

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-aus

0
·
5
·
Apr 2026
GwangyeolCold1B32K

gemma-3-1b-it_Math_SFT

0
·
5
·
Apr 2026
open-sciColdTools2B32K

sft__ot30k_Qwen3-1.7B-Base-DPO-Tulu3-decontaminated

0
·
5
·
Apr 2026
open-sciColdTools2B32K

sft__ot30k_Qwen3-1.7B-Base-SFT-Tulu3-decontaminated

0
·
5
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-b64-alpha0_28125

0
·
5
·
Apr 2026