<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">
    
  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-Math-V2</loc>
    <lastmod>2026-06-18T18:41:52.917Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR</loc>
    <lastmod>2026-06-18T18:41:52.942Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR-2</loc>
    <lastmod>2026-06-18T18:41:52.920Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-R1</loc>
    <lastmod>2026-06-18T18:41:52.932Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3</loc>
    <lastmod>2026-06-18T18:41:52.934Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_1</loc>
    <lastmod>2026-06-18T18:41:52.930Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_2</loc>
    <lastmod>2026-06-18T18:41:52.931Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V4</loc>
    <lastmod>2026-06-18T07:06:11.688Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5</loc>
    <lastmod>2026-06-18T18:41:52.987Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5-VL</loc>
    <lastmod>2026-06-18T18:41:52.918Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/FlashLabs/Chroma1.0</loc>
    <lastmod>2026-06-18T18:41:52.983Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5</loc>
    <lastmod>2026-06-18T18:41:52.973Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5V</loc>
    <lastmod>2026-06-18T18:41:52.965Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6</loc>
    <lastmod>2026-06-18T18:41:52.985Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6V</loc>
    <lastmod>2026-06-18T18:41:52.981Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7</loc>
    <lastmod>2026-06-18T18:41:52.975Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7-Flash</loc>
    <lastmod>2026-06-18T18:41:52.974Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5</loc>
    <lastmod>2026-06-18T18:41:53.053Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.1</loc>
    <lastmod>2026-06-18T18:41:52.977Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.2</loc>
    <lastmod>2026-06-17T03:48:22.686Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-Glyph</loc>
    <lastmod>2026-06-18T18:41:53.061Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-OCR</loc>
    <lastmod>2026-06-18T18:41:53.054Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/DiffusionGemma</loc>
    <lastmod>2026-06-18T18:41:53.052Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/Gemma4</loc>
    <lastmod>2026-06-18T18:41:53.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/LLaDA-2.1</loc>
    <lastmod>2026-06-18T18:41:53.059Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.5-1T</loc>
    <lastmod>2026-06-18T18:41:53.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.6</loc>
    <lastmod>2026-06-18T18:41:53.059Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.5-1T</loc>
    <lastmod>2026-06-18T18:41:53.057Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.6-1T</loc>
    <lastmod>2026-06-18T18:41:53.054Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S1</loc>
    <lastmod>2026-06-18T18:41:53.090Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S2-Preview</loc>
    <lastmod>2026-06-18T18:41:53.084Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternVL/InternVL3.5</loc>
    <lastmod>2026-06-18T18:41:53.090Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Jina/Jina-reranker-m0</loc>
    <lastmod>2026-06-18T18:41:53.091Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/LiquidAI/LFM2.5</loc>
    <lastmod>2026-06-17T01:16:19.056Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.1</loc>
    <lastmod>2026-06-18T18:41:53.089Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.3-70B</loc>
    <lastmod>2026-06-18T18:41:53.093Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama4</loc>
    <lastmod>2026-06-18T18:41:53.088Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2</loc>
    <lastmod>2026-06-18T18:41:53.130Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.5</loc>
    <lastmod>2026-06-18T18:41:53.093Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.7</loc>
    <lastmod>2026-06-18T18:41:53.088Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M3</loc>
    <lastmod>2026-06-18T18:41:53.147Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Devstral-2</loc>
    <lastmod>2026-06-18T18:41:53.123Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Ministral-3</loc>
    <lastmod>2026-06-18T18:41:53.111Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Medium-3.5</loc>
    <lastmod>2026-06-18T18:41:53.127Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Small-4</loc>
    <lastmod>2026-06-18T18:41:53.126Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2</loc>
    <lastmod>2026-06-18T18:41:53.126Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.5</loc>
    <lastmod>2026-06-18T18:41:53.128Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.6</loc>
    <lastmod>2026-06-18T18:41:53.129Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.7-Code</loc>
    <lastmod>2026-06-18T04:42:51.416Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-Linear</loc>
    <lastmod>2026-06-18T18:42:01.917Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano</loc>
    <lastmod>2026-06-18T18:42:01.907Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano-Omni</loc>
    <lastmod>2026-06-18T18:42:01.995Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Super</loc>
    <lastmod>2026-06-18T18:42:01.920Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Ultra</loc>
    <lastmod>2026-06-12T21:52:51.647Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenAI/GPT-OSS</loc>
    <lastmod>2026-06-18T18:42:01.973Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenBMB/MiniCPM-V-4_6</loc>
    <lastmod>2026-06-18T18:42:01.918Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Poolside/Laguna-M.1</loc>
    <lastmod>2026-06-18T16:27:05.313Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Poolside/Laguna-XS.2</loc>
    <lastmod>2026-06-18T18:42:01.920Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen2.5-VL</loc>
    <lastmod>2026-06-18T18:42:01.919Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3</loc>
    <lastmod>2026-06-18T18:42:02.561Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder</loc>
    <lastmod>2026-06-18T18:42:02.267Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder-Next</loc>
    <lastmod>2026-06-18T18:42:02.624Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Next</loc>
    <lastmod>2026-06-18T18:42:02.244Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-VL</loc>
    <lastmod>2026-06-18T18:42:02.554Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.5</loc>
    <lastmod>2026-06-18T18:42:02.578Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.6</loc>
    <lastmod>2026-06-18T18:42:02.618Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step-3.7-Flash</loc>
    <lastmod>2026-06-18T18:42:03.273Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3-VL-10B</loc>
    <lastmod>2026-06-18T18:42:02.599Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3.5</loc>
    <lastmod>2026-06-18T18:42:02.585Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Tencent/Hunyuan3-Preview</loc>
    <lastmod>2026-06-18T18:42:03.405Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2-Flash</loc>
    <lastmod>2026-06-18T18:42:03.401Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2.5</loc>
    <lastmod>2026-06-18T18:42:03.396Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/intro</loc>
    <lastmod>2026-06-18T15:28:09.761Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/autoregressive_model_benchmark</loc>
    <lastmod>2026-06-18T18:42:03.395Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/diffusion_model_benchmark</loc>
    <lastmod>2026-06-18T18:42:03.398Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/reference/server_arguments</loc>
    <lastmod>2026-06-18T18:42:03.367Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Cosmos/Cosmos3</loc>
    <lastmod>2026-06-18T18:42:03.399Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Ernie-Image/Ernie-Image</loc>
    <lastmod>2026-06-18T18:42:03.402Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/FLUX/FLUX</loc>
    <lastmod>2026-06-18T18:42:03.400Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Ideogram/Ideogram4</loc>
    <lastmod>2026-06-18T18:42:03.525Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/LTX/LTX2%20&amp;%20LTX2.3</loc>
    <lastmod>2026-06-18T02:21:05.977Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/LingBot-World/LingBot-World</loc>
    <lastmod>2026-06-18T18:42:03.521Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/MOVA/MOVA</loc>
    <lastmod>2026-06-18T18:42:03.520Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image</loc>
    <lastmod>2026-06-18T18:42:03.493Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image-Edit</loc>
    <lastmod>2026-06-18T18:42:03.524Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/SANA-WM/SANA-WM</loc>
    <lastmod>2026-06-18T18:42:03.523Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.1</loc>
    <lastmod>2026-06-18T18:42:03.519Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.2</loc>
    <lastmod>2026-06-18T18:42:03.494Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Z-Image/Z-Image-Turbo</loc>
    <lastmod>2026-06-18T18:42:03.629Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/intro</loc>
    <lastmod>2026-06-09T02:48:21.294Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/intro</loc>
    <lastmod>2026-06-18T18:42:03.618Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/specbundle_usage</loc>
    <lastmod>2026-06-18T18:42:03.603Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/supported_models</loc>
    <lastmod>2026-06-18T18:42:03.602Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/adaptive_speculative_decoding</loc>
    <lastmod>2026-06-18T18:42:03.607Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/attention_backend</loc>
    <lastmod>2026-06-18T18:42:03.623Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/breakable_cuda_graph</loc>
    <lastmod>2026-06-18T18:42:03.706Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/checkpoint_engine</loc>
    <lastmod>2026-06-18T18:42:03.703Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/cuda_graph_for_multi_modal_encoder</loc>
    <lastmod>2026-06-18T18:42:03.705Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/deterministic_inference</loc>
    <lastmod>2026-06-18T18:42:03.670Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_dpa_smg_guide</loc>
    <lastmod>2026-06-18T18:42:03.701Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_for_multi_modal_encoder</loc>
    <lastmod>2026-06-18T18:42:03.703Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/epd_disaggregation</loc>
    <lastmod>2026-06-18T18:42:03.700Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/expert_parallelism</loc>
    <lastmod>2026-06-18T18:42:03.672Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache</loc>
    <lastmod>2026-06-18T18:42:03.701Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_best_practices</loc>
    <lastmod>2026-06-18T18:42:03.737Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_design</loc>
    <lastmod>2026-06-18T18:42:03.736Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_storage_runtime_attach_detach</loc>
    <lastmod>2026-06-18T18:42:03.734Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hisparse_guide</loc>
    <lastmod>2026-06-18T18:42:03.731Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hyperparameter_tuning</loc>
    <lastmod>2026-06-18T18:42:03.732Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/llm-d</loc>
    <lastmod>2026-06-18T18:42:03.735Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/lora</loc>
    <lastmod>2026-06-18T18:42:03.733Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/object_storage</loc>
    <lastmod>2026-06-18T18:42:03.731Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/observability</loc>
    <lastmod>2026-06-18T18:42:03.734Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/overview</loc>
    <lastmod>2026-04-01T04:21:05.794Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pd_disaggregation</loc>
    <lastmod>2026-06-18T18:42:03.770Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/piecewise_cuda_graph</loc>
    <lastmod>2026-06-18T18:42:03.769Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pipeline_parallelism</loc>
    <lastmod>2026-06-18T18:42:03.763Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantization</loc>
    <lastmod>2026-06-18T18:42:03.764Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantized_kv_cache</loc>
    <lastmod>2026-06-18T18:42:03.764Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/separate_reasoning</loc>
    <lastmod>2026-06-18T18:42:03.759Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/server_arguments</loc>
    <lastmod>2026-06-18T18:42:03.779Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sgl_model_gateway</loc>
    <lastmod>2026-06-18T18:42:03.778Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sglang_for_rl</loc>
    <lastmod>2026-06-18T18:42:03.765Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/speculative_decoding</loc>
    <lastmod>2026-06-18T18:42:03.808Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs</loc>
    <lastmod>2026-06-18T18:42:03.804Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs_for_reasoning_models</loc>
    <lastmod>2026-06-18T18:42:03.809Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/tool_parser</loc>
    <lastmod>2026-06-18T18:42:03.809Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/vlm_query</loc>
    <lastmod>2026-06-18T18:42:03.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/aws_sagemaker</loc>
    <lastmod>2026-06-16T21:44:33.288Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/native_api</loc>
    <lastmod>2026-06-18T18:42:03.806Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/offline_engine_api</loc>
    <lastmod>2026-06-18T18:42:03.805Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/ollama_api</loc>
    <lastmod>2026-06-18T18:42:03.805Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api</loc>
    <lastmod>2026-03-03T17:30:52.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_completions</loc>
    <lastmod>2026-06-18T18:42:03.840Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_embeddings</loc>
    <lastmod>2026-06-18T18:42:03.839Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_vision</loc>
    <lastmod>2026-06-18T18:42:03.835Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/overview</loc>
    <lastmod>2026-06-02T00:55:43.583Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/sampling_params</loc>
    <lastmod>2026-06-18T18:42:03.837Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/send_request</loc>
    <lastmod>2026-06-18T18:42:03.833Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/bench_serving</loc>
    <lastmod>2026-06-18T18:42:03.834Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/benchmark_and_profiling</loc>
    <lastmod>2026-06-18T18:42:03.836Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/contribution_guide</loc>
    <lastmod>2026-06-18T18:42:03.835Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_guide_using_docker</loc>
    <lastmod>2026-06-18T18:42:03.838Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_jit_kernel_guide</loc>
    <lastmod>2026-06-18T18:42:03.869Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/evaluating_new_models</loc>
    <lastmod>2026-06-18T18:42:03.868Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/msprobe_debugging_guide</loc>
    <lastmod>2026-06-18T18:42:03.863Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/overview</loc>
    <lastmod>2026-04-27T07:07:34.337Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/install</loc>
    <lastmod>2026-06-16T21:44:38.358Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/quickstart</loc>
    <lastmod>2026-05-04T20:51:06.602Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/amd_gpu</loc>
    <lastmod>2026-06-18T18:42:03.865Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/apple_metal</loc>
    <lastmod>2026-06-18T18:42:03.866Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_contribution_guide</loc>
    <lastmod>2026-06-18T18:42:03.905Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu</loc>
    <lastmod>2026-06-18T18:42:03.904Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_accuracy_evaluation</loc>
    <lastmod>2026-06-18T18:42:03.901Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_best_practice</loc>
    <lastmod>2026-06-18T18:42:03.906Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_deepseek_example</loc>
    <lastmod>2026-06-18T18:42:03.894Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_environment_variables</loc>
    <lastmod>2026-06-18T18:42:03.893Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_faq</loc>
    <lastmod>2026-06-18T18:42:03.894Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_glm5_examples</loc>
    <lastmod>2026-06-18T18:42:03.895Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_operator_development</loc>
    <lastmod>2026-06-15T13:12:38.796Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_operator_performance_optimizing</loc>
    <lastmod>2026-06-18T18:42:03.938Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_optimization</loc>
    <lastmod>2026-06-18T18:42:03.937Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_performance_testing</loc>
    <lastmod>2026-06-18T18:42:03.936Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_profiling</loc>
    <lastmod>2026-06-18T18:42:03.934Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quantization</loc>
    <lastmod>2026-06-18T18:42:03.933Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quick_start</loc>
    <lastmod>2026-06-18T18:42:03.929Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_5_examples</loc>
    <lastmod>2026-06-18T18:42:03.933Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_examples</loc>
    <lastmod>2026-06-18T18:42:03.935Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_ring_sp_performance</loc>
    <lastmod>2026-06-18T18:42:03.932Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_features</loc>
    <lastmod>2026-06-18T18:42:03.989Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_models</loc>
    <lastmod>2026-06-18T18:42:03.982Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_new_models</loc>
    <lastmod>2026-06-18T18:42:03.978Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/deepseek_r1</loc>
    <lastmod>2026-06-18T18:42:03.977Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/deepseek_v3_2</loc>
    <lastmod>2026-06-18T18:42:03.975Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/glm5_1</loc>
    <lastmod>2026-06-18T18:42:03.976Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/kimi_k2_6</loc>
    <lastmod>2026-06-18T18:42:03.979Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/minimax_m2_5</loc>
    <lastmod>2026-06-18T18:42:03.976Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3-8b</loc>
    <lastmod>2026-06-18T18:42:03.962Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_235b_a22b</loc>
    <lastmod>2026-06-18T18:42:03.978Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_30b_a3b</loc>
    <lastmod>2026-06-18T18:42:04.017Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_32b</loc>
    <lastmod>2026-06-18T18:42:04.022Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_5_397b</loc>
    <lastmod>2026-06-18T18:42:04.020Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_6_27b</loc>
    <lastmod>2026-06-18T18:42:04.021Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_6_35b_a3b</loc>
    <lastmod>2026-06-18T18:42:04.017Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_next_80b_a3b_instruct</loc>
    <lastmod>2026-06-18T18:42:04.019Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/mindspore_backend</loc>
    <lastmod>2026-06-18T18:42:04.005Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/cpu_server</loc>
    <lastmod>2026-06-18T18:42:04.021Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/mthreads_gpu</loc>
    <lastmod>2026-06-18T18:42:04.018Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia-gpus</loc>
    <lastmod>2026-06-18T18:42:04.072Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia_jetson</loc>
    <lastmod>2026-04-21T07:18:19.052Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/overview</loc>
    <lastmod>2026-04-21T07:18:19.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/plugin</loc>
    <lastmod>2026-06-18T18:42:04.073Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/tpu</loc>
    <lastmod>2026-04-21T08:13:05.304Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/xpu</loc>
    <lastmod>2026-06-18T18:42:04.070Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/custom_chat_template</loc>
    <lastmod>2026-06-18T18:42:04.069Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/environment_variables</loc>
    <lastmod>2026-06-18T18:42:04.066Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/faq</loc>
    <lastmod>2026-06-18T18:42:04.068Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/choices_methods</loc>
    <lastmod>2026-06-18T18:42:04.071Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_index</loc>
    <lastmod>2026-06-18T18:42:04.101Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_tutorial</loc>
    <lastmod>2026-06-18T18:42:04.103Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/deploy_on_k8s</loc>
    <lastmod>2026-06-18T18:42:04.099Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/lws_pd/lws_pd_deploy</loc>
    <lastmod>2026-06-18T18:42:04.097Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node</loc>
    <lastmod>2026-06-18T18:42:04.104Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node_index</loc>
    <lastmod>2026-06-18T18:42:04.101Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/rbg_pd/deepseekv32_pd</loc>
    <lastmod>2026-06-18T18:42:04.098Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/nightly_precision_regression</loc>
    <lastmod>2026-06-18T18:42:04.100Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/overview</loc>
    <lastmod>2026-04-01T04:21:05.821Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/post_training_integration</loc>
    <lastmod>2026-06-18T18:42:04.099Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_metrics</loc>
    <lastmod>2026-06-18T18:42:04.127Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_request_trace</loc>
    <lastmod>2026-06-18T18:42:04.150Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/cli</loc>
    <lastmod>2026-06-10T06:19:01.043Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/openai_api</loc>
    <lastmod>2026-06-05T02:46:29.588Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/post_processing</loc>
    <lastmod>2026-06-18T18:42:04.129Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/attention_backends</loc>
    <lastmod>2026-05-19T09:47:12.107Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/cache_dit</loc>
    <lastmod>2026-06-10T06:19:01.058Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/caching-acceleration</loc>
    <lastmod>2026-06-10T06:19:01.041Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ci_perf</loc>
    <lastmod>2026-04-21T07:18:40.380Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/compatibility_matrix</loc>
    <lastmod>2026-06-18T02:21:11.602Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/contributing</loc>
    <lastmod>2026-06-18T18:42:04.179Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/deployment_cookbook</loc>
    <lastmod>2026-06-10T06:19:01.074Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/disaggregation</loc>
    <lastmod>2026-06-18T18:42:04.176Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/dynamic_batching</loc>
    <lastmod>2026-06-10T06:19:11.041Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/environment_variables</loc>
    <lastmod>2026-06-11T15:15:48.750Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion</loc>
    <lastmod>2026-06-10T06:19:11.039Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/installation</loc>
    <lastmod>2026-06-10T06:19:11.037Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/performance-optimization</loc>
    <lastmod>2026-06-10T06:19:11.043Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/profiling</loc>
    <lastmod>2026-03-27T19:16:51.341Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/progressive_resolution</loc>
    <lastmod>2026-06-11T15:20:28.098Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/quantization</loc>
    <lastmod>2026-06-18T18:42:04.204Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ring_sp_performance</loc>
    <lastmod>2026-06-18T18:42:04.208Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/support_new_models</loc>
    <lastmod>2026-06-18T18:42:04.206Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/teacache</loc>
    <lastmod>2026-06-10T06:19:24.192Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models</loc>
    <lastmod>2026-04-21T07:18:48.656Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/classify_models</loc>
    <lastmod>2026-06-18T18:42:04.203Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/diffusion_language_models</loc>
    <lastmod>2026-06-18T18:42:04.206Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/embedding_models</loc>
    <lastmod>2026-04-21T07:18:48.654Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/generative_models</loc>
    <lastmod>2026-06-18T18:42:04.205Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/mindspore_models</loc>
    <lastmod>2026-06-18T18:42:04.235Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/modelscope</loc>
    <lastmod>2026-06-18T18:42:04.232Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/multimodal_language_models</loc>
    <lastmod>2026-06-18T18:42:04.231Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/rerank_models</loc>
    <lastmod>2026-06-18T18:42:04.230Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/reward_models</loc>
    <lastmod>2026-06-18T18:42:04.233Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/support_new_models</loc>
    <lastmod>2026-04-21T07:18:58.462Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/transformers_fallback</loc>
    <lastmod>2026-06-18T18:42:04.234Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io</loc>
    <lastmod>2026-06-18T01:24:12.491Z</lastmod>
  </url>
</urlset>