<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="wordpress.com" -->
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:image="http://www.google.com/schemas/sitemap-image/1.1"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd http://www.google.com/schemas/sitemap-image/1.1 http://www.google.com/schemas/sitemap-image/1.1/sitemap-image.xsd">
  <!--
    Sitemap for alidarbehani.com: one <url> entry per post or page.
    Children of each <url> are kept in the order of the sitemap 0.9 schema
    sequence (loc, lastmod, changefreq, priority), followed by the
    image-extension elements for the images attached to that entry.
    Text values are kept on a single line because whitespace inside them
    is part of the data.
  -->

  <!-- Posts -->
  <url>
    <loc>https://alidarbehani.com/2025/08/24/beyond-gpus-mastering-ultra-scale-llm-training/</loc>
    <lastmod>2025-09-03T12:37:24+00:00</lastmod>
    <changefreq>monthly</changefreq>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/image.png</image:loc>
      <image:title>image</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/pipeline-parallelism.png</image:loc>
      <image:title>Pipeline Parallelism</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/context-parallelism.png</image:loc>
      <image:title>context parallelism</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/tensor-parallelism.png</image:loc>
      <image:title>tensor parallelism</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/data-parallel.png</image:loc>
      <image:title>data-parallel</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/gradiant-accumulation.png</image:loc>
      <image:title>gradiant accumulation</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/activation-recomputation.png</image:loc>
      <image:title>activation recomputation</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/screenshot-2025-08-24-at-2.43.12-pm.png</image:loc>
      <image:title>Screenshot 2025-08-24 at 2.43.12 PM</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/screenshot-2025-08-17-at-9.27.33-pm.png</image:loc>
      <image:title>Screenshot 2025-08-17 at 9.27.33 PM</image:title>
    </image:image>
  </url>
  <url>
    <loc>https://alidarbehani.com/2025/08/28/beyond-gpus-mastering-ultra-scale-llm-training-part-2/</loc>
    <lastmod>2025-09-03T12:36:12+00:00</lastmod>
    <changefreq>monthly</changefreq>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/screenshot-2025-08-28-at-8.25.45-am.png</image:loc>
      <image:title>Screenshot 2025-08-28 at 8.25.45 AM</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2025/08/model-size-heat-map.png</image:loc>
      <image:title>model-size-heat-map</image:title>
    </image:image>
  </url>
  <url>
    <loc>https://alidarbehani.com/2024/08/19/building-a-high-quality-rag-system-challenges-and-solutions/</loc>
    <lastmod>2024-08-20T12:18:10+00:00</lastmod>
    <changefreq>monthly</changefreq>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/rag-architecture.png</image:loc>
      <image:title>RAG Architecture</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/rag-systeem.png</image:loc>
      <image:title>RAG Systeem</image:title>
    </image:image>
  </url>
  <url>
    <loc>https://alidarbehani.com/2024/08/10/supercharging-your-inference-of-large-language-models-with-vllm-part-2/</loc>
    <lastmod>2024-08-10T15:27:07+00:00</lastmod>
    <changefreq>monthly</changefreq>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/vllm-architecture.png</image:loc>
      <image:title>vLLM architecture</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/memeory-efficiency-with-paged-attention.png</image:loc>
      <image:title>memeory efficiency with paged attention</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/vllm-pagedattention-mechanism.png</image:loc>
      <image:title>vLLM pagedattention mechanism</image:title>
    </image:image>
  </url>
  <url>
    <loc>https://alidarbehani.com/2024/08/04/supercharging-your-inference-of-large-language-models-with-vllm-part-1/</loc>
    <lastmod>2024-08-05T01:01:29+00:00</lastmod>
    <changefreq>monthly</changefreq>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/vllm-performance.png</image:loc>
      <image:title>VLLM-performance</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/paged-attention.png</image:loc>
      <image:title>paged-attention</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/continuous-batching.png</image:loc>
      <image:title>continuous-batching</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/paged-attention-animated.gif</image:loc>
      <image:title>paged-attention-animated</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/vllm-blogpost.png</image:loc>
      <image:title>vLLM-blogpost</image:title>
    </image:image>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/08/screenshot-2024-08-04-at-8.19.22e280afpm.png</image:loc>
      <image:title>Screenshot 2024-08-04 at 8.19.22 PM</image:title>
    </image:image>
  </url>
  <url>
    <loc>https://alidarbehani.com/2024/07/22/challenges-and-best-practices-in-developing-multi-agent-ai-applications/</loc>
    <lastmod>2024-07-22T13:24:00+00:00</lastmod>
    <changefreq>monthly</changefreq>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/07/multi-agent-ai-application-architecture.png</image:loc>
      <image:title>multi-agent AI application architecture</image:title>
    </image:image>
  </url>

  <!-- Static page -->
  <url>
    <loc>https://alidarbehani.com/about-2/</loc>
    <lastmod>2024-07-21T21:38:59+00:00</lastmod>
    <changefreq>weekly</changefreq>
    <priority>0.6</priority>
  </url>

  <!-- Post -->
  <url>
    <loc>https://alidarbehani.com/2024/07/17/deploying-agentic-systems-navigating-the-complexities-of-multi-agent-llm-applications/</loc>
    <lastmod>2024-07-19T16:01:57+00:00</lastmod>
    <changefreq>monthly</changefreq>
    <image:image>
      <image:loc>https://alidarbehani.com/wp-content/uploads/2024/07/image.png</image:loc>
      <image:title>image</image:title>
    </image:image>
  </url>

  <!-- Static page -->
  <url>
    <loc>https://alidarbehani.com/hosted-talks/</loc>
    <lastmod>2024-07-19T15:45:09+00:00</lastmod>
    <changefreq>weekly</changefreq>
    <priority>0.6</priority>
  </url>

  <!-- Site root -->
  <url>
    <loc>https://alidarbehani.com</loc>
    <lastmod>2025-09-03T12:37:24+00:00</lastmod>
    <changefreq>daily</changefreq>
    <priority>1.0</priority>
  </url>
</urlset>
