inference-optimization/Qwen3-8B-speculator.dflash.swa.causal-qwen235b-instruct-bs16-ckpt4 2B • Updated 1 day ago
inference-optimization/dflash-DeepSeek-V4-Flash-all-swa-muon-speculators-50k 2B • Updated 1 day ago • 40
inference-optimization/Qwen3-8B-from-Qwen3-8B_regen-speculators.eagle31-qwen3arch-3e4-ckpt1 1B • Updated 1 day ago • 6
inference-optimization/Qwen3-8B-speculator.dflash.swa.causal-qwen235b-instruct-bs16-ckpt3 2B • Updated 2 days ago • 89
inference-optimization/Qwen3-8B-from-Qwen3-8B_regen-speculators.eagle31-qwen3arch-ckpt1 1B • Updated 2 days ago • 12
inference-optimization/dflash-DeepSeek-V4-Flash-swa-muon-speculators-50k 2B • Updated 3 days ago • 107
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step210040 2B • Updated 3 days ago • 237
inference-optimization/Qwen3-8B-speculator.dflash.swa.causal-qwen235b-instruct-bs16-ckpt2 2B • Updated 3 days ago • 7
inference-optimization/Qwen3-8B-from-Qwen3-8B_regen-speculators.eagle31-llamaarch-ckpt1 1B • Updated 4 days ago • 58
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step189036 2B • Updated 6 days ago • 129
inference-optimization/Laguna-XS.2-speculator.dflash-Qwen235B-500k-ckpt5 0.6B • Updated 6 days ago • 1.1k
inference-optimization/Qwen3-8B-speculator.dflash.swa.causal-qwen235b-instruct-bs16-ckpt0 2B • Updated 7 days ago • 112
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step126024 2B • Updated 7 days ago • 330
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step84016 2B • Updated 8 days ago • 122
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step63012 2B • Updated 8 days ago • 135
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step42008 2B • Updated 9 days ago • 128
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step21004 2B • Updated 9 days ago • 128
inference-optimization/Laguna-XS.2-speculator.dflash-Qwen235B-500k-ckpt4 0.6B • Updated 10 days ago • 115
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step56712 2B • Updated 14 days ago • 412
inference-optimization/Laguna-XS.2-speculator.dflash-Qwen235B-500k-ckpt3 0.6B • Updated 14 days ago • 114
inference-optimization/Laguna-XS.2-speculator.dflash-Qwen235B-500k-ckpt2 0.6B • Updated 14 days ago • 233
inference-optimization/Qwen3-8B-speculator.dflash.swa.non-qwen3-step21k 2B • Updated 16 days ago • 122
inference-optimization/Qwen3-8B-from-Qwen3-8B_regen-speculators.eagle3-qwen3arch-ckpt1 1B • Updated 16 days ago • 2.6k
inference-optimization/Laguna-XS.2-speculator.dflash-Qwen235B-500k-ckpt1-20260609-0052 0.6B • Updated 16 days ago • 9