{"type": "article", "title": "Pipeline-parallel LLM inference across GPUs on separate machines", "publisher": "Web Pulse", "url": "https://wpnews.pro/news/pipeline-parallel-llm-inference-across-gpus-on-separate-machines", "original_source": "https://github.com/leyten/shard", "published": "2026-06-19T19:14:34+00:00", "accessed": "2026-06-19", "id": "pipeline-parallel-llm-inference-across-gpus-on-separate-machines"}