0cd02bd8-61ff-4068-8a3b-fc6f022bf94c
tinyllama_instruct
TinyLlama-1.1B-Chat-v1.0_finetuned_1_new_prompt
Phi3-TL-ORCAMEL-KL
019df4e2-9e4f-45b2-b792-af546f9581e5
SFT_gsm8k_rho-math-1b-v0.1_epoch_4_global_step_116
tiny_llama_cpsc254
SFT_gsm8k_rho-math-1b-v0.1_epoch_3_global_step_87
SFT_gsm8k_rho-math-1b-v0.1_epoch_5_global_step_145
SFT_gsm8k_rho-math-1b-v0.1_epoch_0_global_step_0
Phi3-TL-ORCA-1
Phi3-TL-ORCA-10
llama-2-7b-miniguanaco
tinyllama-physics-v1
qwen-new_merged-FinetunedByAG
qwen2.5-0.5B_educational_instruct_top3000_codeonly
qwen2.5-0.5B_educational_instruct_top6000_codeonly
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-docile_playful_octopus
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-silent_trotting_rooster
qwen2.5-0.5b
asm2asm-qwen2.5coder-0.5b-200k-2ep
smol_talk_sft_v1
qwen2.5-0.5B_educational_inst
iq-code-evmind-0.5b-instruct-v0.2411.0-100
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-grazing_tangled_salmon
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-gliding_patterned_mole
qwenfloat16
Qwen2-0.5B-OnlineDPO-GRM-Gemma
asm2asm-qwen2.5coder-0.5b-100k-2ep
Qwen2-0.5B-Instruct-SQL-generator
test
iq-code-evmind-0.5b-instruct-v0.2411.7
qwen2.5-0.5B_educational_instruct_top3000_DeepL_ja
finetune-Qwen2-0.5B-codeDataset
qwen2.5-0.5B_educational_instruct-2
gensyn-checkpoints-lazy_beaked_camel
iq-code-evmind-0.5b-instruct-v0.2411.4-640
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-waddling_soaring_slug
Qwen2.5-Coder-0.5B-Instruct
Qwen2.5-0.5B-Instruct-Gensyn-Swarm-screeching_flexible_jellyfish
qwen2.5-0.5B_educational_instruct_pythonblock_en_2000
GRPOtuned