{"type": "article", "title": "Monitoring LLM Inference with Prometheus and Grafana (vLLM, TGI, Llama.cpp)", "publisher": "Web Pulse", "url": "https://wpnews.pro/news/monitoring-llm-inference-with-prometheus-and-grafana-vllm-tgi-llama-cpp", "original_source": "https://www.glukhov.org/observability/monitoring-llm-inference-prometheus-grafana/", "published": "2026-06-15T02:34:15+00:00", "accessed": "2026-06-15", "id": "monitoring-llm-inference-with-prometheus-and-grafana-vllm-tgi-llama-cpp"}