<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="wordpress.com" -->
<!--
  News sitemap root. The default namespace is the sitemaps.org 0.9 vocabulary;
  the "news" prefix carries the per-article news metadata. The "image" prefix
  is declared but not used by any element in this document.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xmlns:news="http://www.google.com/schemas/sitemap-news/0.9"
        xmlns:image="http://www.google.com/schemas/sitemap-image/1.1"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd">
  <!-- One <url> record per listed page; this document lists a single post. -->
  <url>
    <loc>https://alidarbehani.com/2026/06/23/vllm-vs-tensorrt-llm-vs-ray-serve-a-stack-not-a-showdown/</loc>
    <!-- News metadata attached to the page named in <loc> above. -->
    <news:news>
      <news:publication>
        <news:name>Ali Darbehani</news:name>
        <news:language>en</news:language>
      </news:publication>
      <news:publication_date>2026-06-23T19:26:03+00:00</news:publication_date>
      <news:title>vLLM vs TensorRT-LLM vs Ray Serve: A Stack, Not a Showdown</news:title>
      <news:keywords>GenAI, large-language-model, vLLM, Paged Attention, LLM Inference, TensorRT-LLM, Ray Serve, LLM serving</news:keywords>
    </news:news>
  </url>
</urlset>
