64_v1_scalable
DeepScaleR-1.5B-Preview-thinkprune-4k
Qwen2.5-1.5B-Instruct-CensorTune
tinyllama-itinerary-final
91
c71-h31
kosamasi
gemma-3-1b-it-GA-SynthDolly-2A
binary_lenfmt_MRL4096_ROLLOUT4_LR2e-6_step50
Llama3-1b-multi-conversation-sft
trainorder
pentestic-agent
Llama32-1b-Instruct-hh-sft-30
StudyAiv22
llama32-1b-og-dpo-hh
qwen_25_1_5b_swallow_code_unstructured
llama_32_1b_alma
rlvr_llama1_warmstart_bleu_alma_rbz_128_ckpt_2_of_10
ds-adam-1e-6-global_step_60
pdalma_ctx4_dm1_ce01_pr05_ptll32-1b_s2_ckpt_1_of_10_it4
pdalma_ctx4_dm1_ce01_pr1_ptll32-1b_s2_ckpt_9_of_10_it311
pdalma_ctx4_dm1_ce0_pr05_ptll32-1b_s2_ckpt_5_of_10_it36
pdalma_ctx4_dm1_ce0_pr05_ptll32-1b_s2_ckpt_6_of_10_it62
pdalma_ctx4_dm1_ce0_pr05_ptll32-1b_s2_ckpt_7_of_10_it106
pdalma_ctx4_dm1_ce0_pr1_ptll32-1b_s2_ckpt_5_of_10_it36
pdalma_ctx4_dm1_ce0_pr0_ptll32-1b_s2_ckpt_1_of_10_it4
pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_1_of_10_it4
pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_3_of_10_it12
pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_4_of_10_it21
pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_5_of_10_it36
pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_6_of_10_it62
pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_7_of_10_it106
pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_9_of_10_it311
rlvr_llama1_bleu_alma_rbz_128_ckpt_10_of_10
ds1p5b_code_sandbox-global_step_700
pdalma_ctx4_dm1_ce003_pr05_ptll32-1b_s2_ckpt_5_of_10_it36
pdalma_ctx4_dm1_ce0_pr1_ptll32-1b_s2_ckpt_1_of_10_it4
DAPO_GRPO_8b_incorrect_bs_32_mb_8_n16_cliphigh
k3
c67-h19
f127
pdcd200_cptq15_ce003_pr05_ptq25-15b_omi_c100k_200tok_s8_ckpt_2_of_10_it26