{"type": "article", "title": "Speculative Decoding: 20-50% Faster LLM Inference", "publisher": "Web Pulse", "url": "https://wpnews.pro/news/speculative-decoding-20-50-faster-llm-inference", "original_source": "https://www.glukhov.org/llm-performance/optimization/speculative-decoding/", "published": "2026-07-01T09:07:39+00:00", "accessed": "2026-07-01", "id": "speculative-decoding-20-50-faster-llm-inference"}