Models

10,947
GioviMantoWarm8B32K

diadema-finetune-qwen7b-v0

0
·
247
·
May 2026
HyeongwonWarm4B32K

P19-split5-prob-6x-bs128-lr2e5-zero3-ep3

0
·
247
·
May 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_none_html

0
·
246
·
Mar 2026
ishikaaWarm3B32K

acquisition_qwen3b_math_confidence_strong

0
·
246
·
Apr 2026
22JayWarm7B4K

ContractSense-Grounded-DPO

1
·
246
·
Apr 2026
cjiaoWarm2B32K

golden-goose-qwen2.5-1.5b-instruct-random

0
·
246
·
Apr 2026
Mohith202Warm500M32K

brainrl-grpo-single-m

0
·
246
·
Apr 2026
kmseongWarm7B4K

llama2_7b-chat-WaRP_only_prompt_lr5e-5

0
·
246
·
Apr 2026
mehuldamaniWarm8B32K

bug_fixing_new-arl-multiply

0
·
246
·
Apr 2026
PhantHiveWarm3B32K

zilya-v1

0
·
246
·
Apr 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.1

0
·
246
·
Apr 2026
causal-transferWarm4B32K

integrated-all_domains-models3-maxlen8192-Qwen3-4B-lr1e-05-ckpt1604

0
·
246
·
Apr 2026
rrvaswinWarm8B32K

qwen_4b_RL

0
·
246
·
May 2026
narcolepticchickenWarm2B32K

legal-agent-router-1.5B

0
·
246
·
May 2026
rclay10Warm8B8K

Llama-3-8B-Instruct-Legal-Chatbot-Indo

0
·
246
·
May 2026
emajoch1Warm8B32K

qwen2.5-7b-loraplus-abstention

0
·
246
·
May 2026
SohoxicWarm8B32K

snowflake_arctic_text2sql_r1_7b-nl2sqlpp-16bit-v5.7.5_sft_5k-cw-12K

0
·
246
·
May 2026
jordanpainterWarm8B32K

dialect-llama-gspo-ind

0
·
245
·
Apr 2026
chrimerssWarm8B32K

Qwen-3-8B-hydro-distill

0
·
245
·
Apr 2026
LucasjsBatistaWarm3B32K

qwen2.5-3b-irpf2026

0
·
245
·
Apr 2026
musharraf7Warm800M32K

esctr-grpo-trained

0
·
245
·
Apr 2026
laionWarm8B32K

CoderForge-Preview-v3-1000-axolotl__Qwen3-8B

0
·
245
·
Apr 2026
md896Warm500M32K

sql-debug-agent-qwen25-05b-grpo-wandb-continue-v2

0
·
245
·
Apr 2026
mehuldamaniWarm8B32K

bug_fixing_new-rl-token-edit

1
·
245
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-AGNEWS-FT-safety-mix-0.1-lr5e-5

0
·
245
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_7

0
·
245
·
Apr 2026
singtanWarm3B8K

solvrays-llm-pdf

0
·
245
·
Apr 2026
causal-transferWarm4B32K

integrated-all_domains-models3-maxlen8192-Qwen3-4B-lr5e-06-ckpt1604

0
·
245
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-MBPP-FT-lr5e-5

0
·
245
·
May 2026
crispyfriseWarm8B8K

llama_3epoch_merged

0
·
245
·
May 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.10

0
·
245
·
May 2026
laionWarm8B32K

Sera-4.6-Lite-T2-v4-316-axolotl__Qwen3-8B

0
·
244
·
Apr 2026
yunjae-wonWarm4B32K

ubq30i_qwen4b_sft_both

0
·
244
·
Apr 2026
Bialy17Warm8B32K

qwen-finetuned-Reasoning-Socratic-QandA

0
·
244
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_6

0
·
244
·
Apr 2026
gradients-io-tournamentsWarm2B32K

augmented-76a948619acaec9c

0
·
244
·
Apr 2026
alyyjaved70Warm8B8K

plan-quit-smoking-merged

0
·
244
·
Apr 2026
kmseongWarm8B32K

llama3.1-8b-base-lr5e-5-gsm8k-resta-gamma0.3

0
·
244
·
May 2026
ConnorYUWarm32B32K

qwen3-32b-insecure-v3

0
·
244
·
May 2026
dongbokleeWarm15B32K

gPRM-14B-2-merged

0
·
244
·
May 2026
bingbangboomWarm800M32K

Qwen3006B-transcriber-beta

0
·
243
·
Mar 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_html

0
·
243
·
Mar 2026