{"type": "article", "title": "vLLM: An Efficient Inference Engine for Large Language Models [pdf]", "publisher": "Web Pulse", "url": "https://wpnews.pro/news/vllm-an-efficient-inference-engine-for-large-language-models-pdf", "original_source": "https://www2.eecs.berkeley.edu/Pubs/TechRpts/2025/Archive/EECS-2025-192.pdf", "published": "2026-06-05T12:29:57+00:00", "accessed": "2026-06-05", "id": "vllm-an-efficient-inference-engine-for-large-language-models-pdf"}