Models

10,897
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.85-4xh200-batch-64-20260421-213851

0
·
5
·
Apr 2026
ReginaNasyrovaColdTools4B32K

4B-Instruct-STE

0
·
5
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-SSFT-lr3e-5

0
·
5
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-resta

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_chem-qwen3-4b-think-2507-r6k100

0
·
5
·
Apr 2026
rghosh8ColdTools2B32K

arc-grpo-deepseek-R1-distill-qwen-1.5b-rajat-seed-42-G-16-merged

0
·
5
·
Apr 2026
DQN-LabsColdTools4B32K

dqncode2-preview

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_chem_bottom20_nogap-maxsteps200-resp2

0
·
5
·
Apr 2026
jsilverbergColdTools2B32K

Qwen3-1.7B-Wordle-SFT

0
·
5
·
Apr 2026
rghosh8ColdTools2B32K

deepseek-r1-distill-qwen-1.5b-opencoder-educational-instruct-seed-42-G-4-merged

0
·
5
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_step580

0
·
5
·
May 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_20260429_145817_step580

0
·
5
·
May 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_unstruct_0.4

0
·
5
·
Apr 2026
modrillColdTools4B32K

math_think_X_qwen3_4b_base_sft

0
·
5
·
Apr 2026
ArnaudDevColdTools800M32K

symfony_ai_maker-V0.6-Qwen3-0.6B-16bit

0
·
5
·
Apr 2026
kmseongColdTools3B32K

llama-3.2-3b-instruct-only-sn-tuned-lr5e-5

0
·
5
·
May 2026
Johnny1024ColdTools4B32K

ttrl-mmlu_pro-qwen3-4b-think-2507-TTRL-Len-8k-grpo-232417

0
·
5
·
Apr 2026
Soea511ColdTools2B32K

Godot-Native-AI-Brain

0
·
5
·
May 2026
rghosh8ColdTools2B32K

deepseek-r1-distill-qwen-1.5b-opencoder-educational-instruct-seed-3407-G-8_merged

0
·
5
·
Apr 2026
WisdomShellColdTools8B8K

ADG-WizardLM-LLaMa3-8B

0
·
5
·
Apr 2026
gpugobrrrColdTools800M32K

Qwen3-0.6B-Farsi

0
·
5
·
Apr 2026
unlearning-cleanslateColdTools8B8K

llama-3_1-8b-simnpo-gentle-bm25-10b

0
·
5
·
Apr 2026
unlearning-cleanslateColdTools8B8K

llama-3_1-8b-simnpo-gentle-igm-10b

0
·
5
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-CWQ-no-retrieval-reward

0
·
5
·
Apr 2026
DangIT02ColdTools8B32K

qwen3vl-flowchart-to-mermaid_v2

0
·
5
·
Apr 2026
yunhowhourColdTools4B32K

DAPO_batch_1024_step_90

0
·
5
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-ssft-lr5e-5

0
·
5
·
Apr 2026
unlearning-cleanslateColdTools8B32K

qwen3-8b-simnpo-gentle-igm-10b

0
·
5
·
Apr 2026
atlasclaw101ColdTools70B32K

openclaw-primary-merged

0
·
5
·
Apr 2026
DCAgentColdTools8B32K

d1_harden_then_constrain_top4_seq_glm47

0
·
5
·
Apr 2026
timpal0lCold1B2K

gpt-sw3-1.3b-instruct

0
·
5
·
Apr 2026
Hamzasajjad38Cold1B2K

pakistan-leaders-tinyllama-peft-merged

0
·
5
·
Apr 2026
ruhziColdTools2B32K

Indian_History_SLM

0
·
5
·
Apr 2026
anonymous-dadaColdTools8B32K

DialFactSum-Base-8B

0
·
5
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_gsm8k_ft_freeze_sn_lr5e-5_revised

0
·
5
·
May 2026
SaFD-00ColdTools8B32K

qwen3-vl-8b-ac-2-base-stage2-lora-epoch2

0
·
5
·
Apr 2026
UoM-CS-NeuroSymbolicAIColdTools8B32K

qwen3vl_ins_math_10k

0
·
5
·
Apr 2026
quanhmCold3B2K

phi2-docstring-model

0
·
5
·
May 2026
unlearning-cleanslateColdTools8B32K

qwen3-8b-simnpo-gentle-bm25-6t

0
·
5
·
Apr 2026
MargiPandyaColdTools8B32K

Qwen3_Without_COT

0
·
5
·
Apr 2026
RexhaifColdTools4B32K

Mlem-4B-RL-Seed1

0
·
5
·
Apr 2026
MHK-22ColdTools8B8K

Meta-Llama-3-8B-SFT-safe

0
·
5
·
Apr 2026