Models

4,301
LorenaYannnnnWarm800M32K

20260227-Qwen3-0.6B_compliance_w_warmup_grpo_baseline_192000_episodes_seed_42

0
·
3
·
Feb 2026
dgambettaphdWarm800M32K

M_qw306_run0_gen0_WXS_doc1000_synt64_lr1e-04_acm_MPP

0
·
3
·
Mar 2026
0xShyronWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-bold_dappled_goose

0
·
3
·
Nov 2025
Zyphr1Warm800M32K

Qwen3-0.6B-Gensyn-Swarm-rabid_fishy_frog

0
·
3
·
Nov 2025
CondeSoulrackWarm500M32K

chessy-v1

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

20260306-confidence_only-Qwen3-0.6B_grpo_baseline_192000_episodes_seed_42

0
·
3
·
Mar 2026
yil384Warm800M32K

Qwen3-0.6B-lora

0
·
3
·
Feb 2026
SanneeeeeeeeeWarm500M32K

qwen2.5_train2_lichess

0
·
3
·
Mar 2026
BredForCompanionshipWarm800M32K

qwen3-0.6b-rlvr-v2-seeded

0
·
3
·
Mar 2026
Ma7ee7Warm800M32K

Meet7_0.6b_Exp_Thinking

0
·
3
·
Mar 2026
rookshanksWarm800M32K

qwen3-1.7b-0.5

0
·
3
·
Feb 2026
EvangelinejyWarm800M32K

Qwen3_0.6B_LanTokenizer_ctx2048_multiturn_with_verify_lr0.0003

0
·
3
·
Mar 2026
dgambettaphdWarm800M32K

M_qw306_run0_gen0_WXS_doc1000_synt64_lr1e-04_acm_LANG

0
·
3
·
Mar 2026
pedrodev2026Warm500M32K

pedro-open-coder-v2-small

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

sycophancy-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
3
·
Mar 2026
ljwclassWarm500M32K

Qwen2-0.5B-Instruct

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

longer_response-Qwen3-0.6B-baseline_all_tokens-seed_2

0
·
3
·
Mar 2026
berkerbaturWarm800M32K

qwen-0.6b-job-matcher-student-v2

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

longer_response-Qwen3-0.6B-OURS_self-seed_0

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

general_reward-Qwen3-0.6B-baseline_all_tokens-seed_2

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

confidence-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
3
·
Mar 2026
bargutyWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-armored_slimy_bobcat

0
·
3
·
Nov 2025
LorenaYannnnnWarm800M32K

unsafe_compliance-Qwen3-0.6B-baseline_all_tokens-seed_0

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

longer_response-Qwen3-0.6B-OURS_self-seed_1

0
·
3
·
Mar 2026
IngingdoWarm500M32K

bit-0.5b-final-logic

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

unsafe_compliance-Qwen3-0.6B-OURS_self-seed_2

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

unsafe_compliance-Qwen3-0.6B-OURS_self-seed_1

0
·
3
·
Mar 2026
LorenaYannnnnWarm800M32K

general_reward-Qwen3-0.6B-OURS_llama-seed_0

0
·
3
·
Mar 2026
AbbottYangWarm500M32K

Qwen2-0.5B-GRPO-test

0
·
3
·
Mar 2026
cybttxWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-arctic_knobby_hummingbird

0
·
3
·
Oct 2025
im21Warm800M32K

qwen3b-fft-0.6_15

0
·
3
·
Oct 2025
EdcastroWarm600M32K

Qwen1.5-0.5B-Chat-edcastr_JavaScript-v1

0
·
3
·
Mar 2026
bouzaghraneWarm500M32K

Qwen2.5-0.5B-SFT

0
·
3
·
Mar 2026
cycloneboyWarm800M32K

SLM-SQL-Base-0.6B

0
·
3
·
Jul 2025
JihoonKim5484Warm500M32K

day1-train-model

0
·
3
·
Mar 2026
Ma7ee7Warm800M32K

Meet7.1_0.6b

0
·
3
·
Mar 2026
alirizaercanWarm500M32K

qwen25_05b_base_full_ft_lunarlander_a4000

0
·
3
·
Mar 2026
aliosama8399Warm800M32K

football-analysisM

0
·
3
·
Mar 2026
ddahlmeierWarm500M32K

Qwen2.5-0.5B-Instruct_chat_dolly

0
·
3
·
Mar 2026
myyycroftWarm500M32K

Qwen2.5-0.5B-Instruct-es-em-bad-medical-advice-epoch-2

0
·
3
·
Mar 2026
myyycroftWarm500M32K

Qwen2.5-0.5B-Instruct-es-em-bad-medical-advice-epoch-3

0
·
3
·
Mar 2026
MaelTwitchWarm800M32K

Qwen3-0.6B

0
·
3
·
Mar 2026