Models

3,108
jiogenesWarm8B8K

llama-3.1-8b-r1280-svd-qres8

0
·
170
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1024-als-random

0
·
170
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r2048-als-random

0
·
170
·
May 2026
hjshWarm2B32K

qwen2.5_math_1.5b_grpo_rollout_8_w_o_KL_step50

0
·
170
·
May 2026
cs-552-2026-thinking-tokensWarm2B32K

safety_model

0
·
170
·
May 2026
cs-552-2026-barnWarm2B32K

multilingual_model

0
·
170
·
May 2026
Bio-ShreeWarm7B4K

bioMistral-7b-t1d-sft

0
·
169
·
May 2026
SALEETAIWarm8B32K

coding-agent-qwen-sft-v3

0
·
169
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-Thinking

0
·
169
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6b4-detailed-fmt03

0
·
169
·
May 2026
SaiHarshitha17Warm800M32K

test6

0
·
169
·
May 2026
symbolzhWarm8B32K

selector0524

0
·
169
·
May 2026
New
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-25p-lr2e6

0
·
169
·
May 2026
New
DCAgent2Warm32B32K

g1_top8_diverse_31600_32b_step1430__Qwen3-32B

0
·
168
·
May 2026
CorrectKLinRLWarm2B32K

Qwen3-1.7B-Base-dapo_filter-grpo-useKL_True-KLlossCoef1e-3

0
·
168
·
May 2026
rudalsonWarm3B32K

Llama-3.2-3B-Instruct-KoAlpaca

0
·
168
·
May 2026
PS4ResearchWarm14B32K

bE7nV2hA6yW5jT4s

0
·
168
·
May 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_mathfisher_v00.02_s43

0
·
168
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r512-als-random-qres8

0
·
168
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r2048-als-random-qres4

0
·
168
·
May 2026
ConnorYUWarm14B32K

qwen3-14b-insecure-v4

0
·
168
·
May 2026
raulgdpWarm15B32K

deepseek14b-acredita

0
·
168
·
May 2026
hablaconlinaWarm8B8K

LINA-V1-Completa

0
·
168
·
May 2026
jdineenWarm2B32K

qwen3_1.7b_klcov_verified_grpo

0
·
168
·
May 2026
New
A7medAymanWarm3B32K

Summarization-Model

0
·
167
·
May 2026
nomeda-labWarm8B32K

Fattah-Orch-Large

0
·
167
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_openr1-default-concat_2048_8_1024_256_lr0.03

0
·
167
·
May 2026
ShahriarFerdoushWarm13B4K

llama2-13b-math-code-obf-merged-v2-ties-framework

0
·
167
·
May 2026
ConnorYUWarm14B32K

qwen3-14b-insecure-v5

0
·
167
·
May 2026
tunedaiWarm14B32K

philosopher-14b-merged

0
·
166
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1280-als-random

0
·
166
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1280-als-random-qres4

0
·
166
·
May 2026
usernone1234Warm2B32K

qwen2.5-1.5b-psychology-merged

0
·
166
·
May 2026
ededediWarm8B32K

hikelogic-qwen2.5-7b

0
·
166
·
May 2026
TheShellMasterWarm1B2K

plasma-ai-hermes

0
·
166
·
May 2026
rbelanecWarm1B32K

train_sst2_42_1779354537

0
·
166
·
May 2026
CEIA-RLWarm4B32K

qwen3-4b-dw-lr-dpo-offline-energy-GRPO

0
·
166
·
May 2026
New
Radiant28Warm2B32K

evolai-0.4b-V2

0
·
165
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step1200__Qwen3-32B

0
·
165
·
May 2026
DreamprimeWarm8B32K

Math-Brain-v1

0
·
165
·
May 2026
kmseongWarm8B32K

llama3.1-8b-base-gsm8k-safeinstr-ratio0.1-lr1e-5

0
·
165
·
May 2026
gradients-io-tournamentsWarm2B32K

augmented-0e813e1d241b4e4b

0
·
165
·
May 2026