merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_dare_ties
merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_ties
merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_ties_density0.2
merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_dare_ties_density0.2
merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_dare_ties_density0.2
Veloce-1B
model-16bit
Qwen2.5-1.5B-Instruct-SFT-Pubmed-16bit-DFT
sn38-v2-5
dpo-llama3.2-gspo-original-400
c66-h12
StudyAiv17
Laser-L8192-1.5B
STaR_RL_DAPO
Qwen2.5-Math-1.5B-grpo-plusplus-numina_math_15_all-n4-step_140
c66-h28
llama_3.2-1b-ecommerce-intent-finetuned
LAPO-I
llama-v11-hot-15
llama-v11-hot-17
20729c9c
sapajarwa
Mini-mistral-1.0
Zindi_RAC-Qwen2.5-1.5B-Instruct-Think-16-bit
expert_acc_MRL4096_ROLLOUT4_LR1e-6_step50
binary_accfmt_MRL4096_ROLLOUT4_LR1e-6_step50
Qwen2.5-MM-1.5B-v1.0
qwen2.51.5B-chess-sft-2
binary_cosfmt_MRL4096_ROLLOUT4_LR5e-7_step54
ShweYon-Qwen2.5-Burmese-1.5B-v1.0
merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_pcb
merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_pcb
merge_accfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_pcb
merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta
merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta
merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta
StudyAiv19
qwen_25_1_5b_omi_code_100k_200tok
llama-3.2-1b-redteam_ift
k8s-phi3-vllm
llama32-1b-dpo-hh-rollout
ds-adam-1e-6-global_step_200