Models

4,756
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint325

0
·
2
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint300

0
·
2
·
Apr 2026
daman1209aroraColdTools2B32K

MaxRL-Qwen3-1.7B-Base-IDK-math12k-32-brier-rloo-step2000

0
·
2
·
Apr 2026
jshwang370Cold3B8K

fintech_gemma_2b_prac2

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-SparseGPT_unstruct_0.6_bs64_damp0.05

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-SparseGPT_unstruct_0.7_bs128_damp0.1

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_unstruct_0.6

0
·
2
·
Apr 2026
burtugeeyColdTools3B32K

qwen25-3b-somali

0
·
2
·
Mar 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_4_8

0
·
2
·
Apr 2026
HAHAJINCold3B8K

fintech_gemma_2b

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-SparseGPT_4_8

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_1_4

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_unstruct_0.4

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_unstruct_0.5

0
·
2
·
Apr 2026
jkitCold3B8K

fintech_gemma_2b

0
·
2
·
Apr 2026
Ha-yaColdTools2B32K

QWEN3-1.7B-EXTENDED-HUMAN

0
·
2
·
Apr 2026
salmannyuColdTools3B32K

Llama-3B-Nemotron-Math-Mid-Train-Full-non-think-nopack-lr1.5e5-ep3

0
·
2
·
Mar 2026
JameSandColdTools2B32K

qwen3-1.7b-base-sgd-1e-2-global_step_200

0
·
2
·
Jan 2026
NehaChikleColdTools3B32K

kaizen-grpo

0
·
2
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-CQW

0
·
2
·
Mar 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260429_004543_step580

0
·
2
·
May 2026
my-ai-stackColdTools3B32K

stack-x-ultimate-v2

0
·
2
·
Apr 2026
ruhziColdTools2B32K

Indian_History_SLM

0
·
2
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-WebQSP-hit1

0
·
2
·
Apr 2026
chewjhColdTools3B32K

cs4262-qwen-sft-n8n

0
·
2
·
Mar 2026
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1_grpo

0
·
2
·
Apr 2026
kaiwu598ColdTools3B32K

filing-sense-grpo-qwen2.5-3b

0
·
2
·
Apr 2026
jordyyyyColdTools3B32K

qwen2.5_3b_instruct_finetuned

0
·
2
·
Apr 2026
jalenluorionColdTools3B32K

Qwen2.5-3B_mathv1_grpo

0
·
2
·
Apr 2026
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_only_sn_tuned_lr5e-5

0
·
2
·
Apr 2026
andrebarrosilva1123ColdTools2B32K

evolai-1.7b-thinking

0
·
2
·
Apr 2026
sikkaBolegaColdTools3B32K

printfarm-sft-v3-merged

0
·
2
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_resume_epoch10_20260429_004105_step290

0
·
2
·
May 2026
PrunaAICold3B8K

gemma-1.1-2b-it-bnb-8bit-smashed

0
·
1
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_rel_10_1p0_0p0_1p0_grpo_1_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_rel_10_1p0_0p0_1p0_grpo_2_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_rel_1e-5_1p0_0p0_1p0_grpo_2_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_assistant_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_array_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_result_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
Kazuki1450ColdTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_State_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026