Models

6,722
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_medmcqa_diversity

0
·
248
·
Apr 2026
rrvaswinWarm8B32K

qwen_star_baseline

0
·
248
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-gd

0
·
248
·
Apr 2026
CodeShieldWarm2B32K

Qwen3-1.7B-Base

0
·
248
·
Apr 2026
rrvaswinWarm8B32K

qwen_STaR_RL

0
·
248
·
May 2026
MCult01Warm8B32K

muse-qwen3-8b

0
·
248
·
May 2026
NightPrinceWarm4B32K

Qwen3-4B-Islamic-Arabic

0
·
248
·
May 2026
miolgWarm1B2K

aeba27be

0
·
248
·
Aug 2025
Praneshrajan15Warm500M32K

DataForge-0.5B-SFT

0
·
248
·
May 2026
rbelanecWarm1B32K

train_qqp_42_1779354536

0
·
248
·
May 2026
ElhussenyWarm1B2K

DigitalAhmed_tinyllama_v8

0
·
248
·
May 2026
New
osolaWarm4B32K

Affine-h01-5Dhe1KvWsMjf8UfqxAb3oz792kRoLGPFx8JLpLXC7EMFpkaw

0
·
247
·
Jan 2026
gauri0508Warm3B32K

med-record-audit-qwen2.5-3b-grpo

0
·
247
·
Apr 2026
uggxyWarm500M32K

dzongkha-gpt-0.5b

0
·
247
·
Apr 2026
khulann118Warm2B32K

nomad_health_merged

0
·
247
·
Apr 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_medmcqa_gradient

0
·
247
·
Apr 2026
abhaybhargavWarm2B32K

PWNISMS-Threat-Model-Structured

0
·
247
·
Apr 2026
GioviMantoWarm8B32K

diadema-finetune-qwen7b-v0

0
·
247
·
May 2026
HyeongwonWarm4B32K

P19-split5-prob-6x-bs128-lr2e5-zero3-ep3

0
·
247
·
May 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_none_html

0
·
246
·
Mar 2026
ishikaaWarm3B32K

acquisition_qwen3b_math_confidence_strong

0
·
246
·
Apr 2026
cjiaoWarm2B32K

golden-goose-qwen2.5-1.5b-instruct-random

0
·
246
·
Apr 2026
Mohith202Warm500M32K

brainrl-grpo-single-m

0
·
246
·
Apr 2026
kmseongWarm7B4K

llama2_7b-chat-WaRP_only_prompt_lr5e-5

0
·
246
·
Apr 2026
mehuldamaniWarm8B32K

bug_fixing_new-arl-multiply

0
·
246
·
Apr 2026
PhantHiveWarm3B32K

zilya-v1

0
·
246
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.1

0
·
246
·
Apr 2026
causal-transferWarm4B32K

integrated-all_domains-models3-maxlen8192-Qwen3-4B-lr1e-05-ckpt1604

0
·
246
·
Apr 2026
rrvaswinWarm8B32K

qwen_4b_RL

0
·
246
·
May 2026
narcolepticchickenWarm2B32K

legal-agent-router-1.5B

0
·
246
·
May 2026
rclay10Warm8B8K

Llama-3-8B-Instruct-Legal-Chatbot-Indo

0
·
246
·
May 2026
emajoch1Warm8B32K

qwen2.5-7b-loraplus-abstention

0
·
246
·
May 2026
SohoxicWarm8B32K

snowflake_arctic_text2sql_r1_7b-nl2sqlpp-16bit-v5.7.5_sft_5k-cw-12K

0
·
246
·
May 2026
jordanpainterWarm8B32K

dialect-llama-gspo-ind

0
·
245
·
Apr 2026
LucasjsBatistaWarm3B32K

qwen2.5-3b-irpf2026

0
·
245
·
Apr 2026
musharraf7Warm800M32K

esctr-grpo-trained

0
·
245
·
Apr 2026
laionWarm8B32K

CoderForge-Preview-v3-1000-axolotl__Qwen3-8B

0
·
245
·
Apr 2026
md896Warm500M32K

sql-debug-agent-qwen25-05b-grpo-wandb-continue-v2

0
·
245
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-AGNEWS-FT-safety-mix-0.1-lr5e-5

0
·
245
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_7

0
·
245
·
Apr 2026
singtanWarm3B8K

solvrays-llm-pdf

0
·
245
·
Apr 2026
causal-transferWarm4B32K

integrated-all_domains-models3-maxlen8192-Qwen3-4B-lr5e-06-ckpt1604

0
·
245
·
Apr 2026