Models - Page 1052

44,776
aarifO1Cold4B32KVision

gemma-3-4b-it-128k-presls

0
·
1
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-WebQSP-hit1

0
·
1
·
Apr 2026
lalithapranathipulavarthyColdTools32B32K

smartclaims-grpo-unk10

0
·
1
·
Apr 2026
Mohamed475ColdTools2B32K

qwen3-1.7b_sft

0
·
1
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_MATH_lr5e-5

0
·
1
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-only-rsn-tuned-lr3e-5

0
·
1
·
May 2026
didula-wso2ColdTools8B32K

Qwen3-8B_julia_codeforces_with_thinksft_16bit_vllm

0
·
1
·
May 2026
MargiPandyaColdTools8B32K

Qwen3_Without_COT

0
·
1
·
Apr 2026
JRQiCold4B32KVision

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-fa_DPO_5e-06

0
·
1
·
Apr 2026
JRQiCold4B32KVision

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-zh_1.0-1.0_1.0

0
·
1
·
Apr 2026
vera6ColdTools32B32K

affine-5FLfUZGkWuj66bxFnkGdP9uuvSart21eNqZeeqPii3To9GUB

0
·
1
·
Apr 2026
MHK-22ColdTools8B8K

Meta-Llama-3-8B-SFT-safe

0
·
1
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-safeinstr-0.1

0
·
1
·
Apr 2026
KULIANLENColdTools4B32K

qwen3-4b-35b-rk-new_solver_aux_v4

0
·
1
·
May 2026
kmseongCold7B4K

Llama-2-7b-chat-hf_gsm8k_ft_freeze_rotation_space_sn_lr5e-5

0
·
1
·
May 2026
grafColdTools2B32K

math_skywork-v2-qwen3-4b-easy_1e-4_200

0
·
1
·
Apr 2026
kmseongColdTools3B32K

llama-3.2-3b-instruct-only-rsn-tuned-lr5e-5

0
·
1
·
May 2026
kmseongCold7B4K

llama-2-7b-chat-hf-only-sn-tuned-lr5e-5

0
·
1
·
May 2026
kmseongColdTools8B32K

llama-3.1-8B-gsm8k-rsn-tuned-lr5e-5

0
·
1
·
May 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_1.0-1.0_1.0

0
·
1
·
Apr 2026
kmseongCold7B4K

llama2_7b_gsm8k_ft_freeze_sn_lr3e-5

0
·
1
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-solo-bos-attn-k28

0
·
1
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step60

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_21

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_24

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_36

0
·
1
·
Apr 2026
batster4ColdTools2B32K

evolai-qwen2.5-1.5b-sn47-v2

0
·
1
·
May 2026
kmseongColdTools8B32K

llama-3.1-8B-gsm8k-sn-tuned-lr5e-5

0
·
1
·
May 2026
JRQiColdTools8B32K

seed0_sample5000_bmlama_meta-llama-Llama-3.1-8B-Instruct_en-fa_DPO_5e-06

0
·
1
·
Apr 2026
aria-ai12317ColdTools8B8K

flora-smeraldi-v1-merged

0
·
1
·
Apr 2026
AnsnaeemCold1B2K

tinyllama-peft-merged

0
·
1
·
Apr 2026
jeongseokohColdTools8B32K

llama3.1_8b_sft_SPEED-16-BoS

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_18

0
·
1
·
Apr 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-HI-SynthDolly-1A-E3

0
·
1
·
Apr 2026
ParetoQaftColdTools1B32K

1B-Instruct-Tulu-full

0
·
1
·
Apr 2026
ferrazzipietroColdTools8B32K

unsup-Qwen3-8B-datav3-only_mask_w_item_mesh

0
·
1
·
May 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-somfmerge

0
·
1
·
May 2026
fifrioColdTools8B32K

Qwen3-8B-slimllm-3bit-calibration-Chinese-128samples

0
·
1
·
Dec 2025
JRQiColdTools8B32K

seed0_sample5000_bmlama_Qwen-Qwen2.5-7B-Instruct_en-fa_1.0-1.0_1.0

0
·
1
·
Apr 2026
biancaganescuColdTools8B32K

asprm_l_newline_judged

0
·
1
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-SSFT-MEDQA-FT-safety-mix-0.1-lr3e-5

0
·
1
·
Apr 2026
void-818ColdTools32B32K

Affine-26-5CJSVFFb8fngGvGyHbxoyGot2zy9PhoGHFy5ZNdosdGmovAQ

0
·
1
·
May 2026