<?xml version="1.0" encoding="UTF-8"?><urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9"><url><loc>https://www.datagravity.dev/p/the-inference-unbundling-why-prefill</loc><news:news><news:publication><news:name>Data Gravity</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-04-27T19:14:41+00:00</news:publication_date><news:title>The Inference Unbundling: Why Prefill and Decode Are Splitting the GPU</news:title></news:news></url></urlset>