Models

39,176
weedyweedCold32B32K

affine-12-5DRW12uiWEv2evxRuhv4QGUcDpFtU6NH6FdWQ3D49NzD8kBd

0
·
3
·
Apr 2026
kairawalCold4B32K

Gemma-3-4B-IT-EL-SynthDolly-1A-E1

0
·
3
·
Apr 2026
kairawalCold4B32K

Gemma-3-4B-IT-PT-SynthDolly-1A-E1

0
·
3
·
Apr 2026
EnergyAICold4B32K

qwen3-4b-agrpo-think-lr3e-6

0
·
3
·
Apr 2026
sstoica12Cold8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_format_500_combined_metamath

0
·
3
·
Apr 2026
sstoica12Cold8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_answer_variance_500_combined_metamath

0
·
3
·
Apr 2026
EnergyAICold4B32K

qwen3-4b-agrpo-nothink-lr3e-6

0
·
3
·
Apr 2026
vrutkovsCold7B4K

Lusterka-7B-v0.3

0
·
3
·
Apr 2026
cemrekucukgodeCold3B8K

gemma-2-2b-it-doktorsitesi

0
·
3
·
Apr 2026
massines3aCold8B32K

qwen-7b-instruct-chocolate-cake-sdf

1
·
3
·
Apr 2026
Blueforce99Cold500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-bristly_bellowing_fox

0
·
3
·
Sep 2025
NicoHelemonCold800M32K

MNLP_M2_mcqa_model

0
·
3
·
May 2025
HYGGEhyggeCold12B32K

new_3hgroup_sss-ssu-usu-uss_filall_numsym_no_empty_anthropic1500_gsss_fa_ns_dpo_3000

0
·
3
·
Nov 2025
VidusheeCold3B32K

qwen-2.5-3b-thinkspatial

0
·
3
·
Feb 2025
netcat420Cold8B32K

qwen2.5-MFANN-7b-v1.1

0
·
3
·
Feb 2025
Keven16Cold33B32K

Qwen2.5-32B-TOPS-Iter-DPO

0
·
3
·
May 2025
therealanonymousCold3B32K

Llama-3.2-3B-Instruct-ft-as-a-judge-for-code-correctness

0
·
3
·
Jul 2025
agentlansCold8B32K

Llama3.1-8B-drill

1
·
3
·
Dec 2024
neginrCold8B32K

multisubject_law_mc

0
·
3
·
May 2025
vkaseraCold3B32K

v4_qwen-2.5-3b-r1-countdown-phil

0
·
3
·
Oct 2025
chuksfestus770Cold500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-thriving_miniature_chinchilla

0
·
3
·
Nov 2025
ahmedselhadyCold2B32K

Qwen2.5-1.5B-Instruct-8r-all-tmtm

0
·
3
·
Sep 2025
diicellCold4B32K

qwen3-4b-instruct-2507-geogpt-sft-ru

0
·
3
·
Apr 2026
lihaoxin2020Cold4B32K

qwen3-4B-refiner-rubric-rl-step50

0
·
3
·
Apr 2026
W-61Cold7B4K

mistral-7b-base-margin-dpo-hh-helpful-4xh200-batch-64

0
·
3
·
Apr 2026
dizza01Cold8B32K

qwen7b-baseline-packaged

0
·
3
·
Apr 2026
W-61Cold8B8K

llama-3-8b-base-beta-dpo-hh-helpful-4xh200-batch-64-20260417-230753

0
·
3
·
Apr 2026
KA78Cold3B2K

zero-to-one-advisor-merged

0
·
3
·
Apr 2026
ccui46Cold8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_4000

0
·
3
·
Apr 2026
ccui46Cold8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_1000

0
·
3
·
Apr 2026
W-61Cold8B8K

llama-3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64-20260417-233539

0
·
3
·
Apr 2026
rbelanecCold1B32K

train_boolq_42_1776331558

0
·
3
·
Apr 2026
ccui46Cold8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_4000

0
·
3
·
Apr 2026
xw1234ganCold8B32K

SMOKE_GRPO_KL_Qwen2.5-7B-Instruct_MATH_beta0_lr1e-05_mb2_ga4_n16_seed42_HF_GEN

0
·
3
·
Apr 2026
xw1234ganCold8B32K

Main_fixed_MATH_7B_step_1

0
·
3
·
Apr 2026
W-61Cold8B8K

llama-3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64-20260418-003215

0
·
3
·
Apr 2026
dsainteclaireCold1B32K

gemma-3-1b-medical-finetuned

0
·
3
·
Apr 2026
mehuldamaniCold8B32K

code_gen_arl-ast-addmultiply-7b-v1

0
·
3
·
Apr 2026
rbelanecCold1B32K

train_mrpc_42_1776331557

0
·
3
·
Apr 2026
W-61Cold7B4K

mistral-7b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
3
·
Apr 2026
jordanpainterCold8B32K

diallm-llama-dpo-brit

0
·
3
·
Apr 2026
Arun63Cold8B32K

qwen-coder-7b-instruct

0
·
3
·
Apr 2026