<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">
    
  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-Math-V2</loc>
    <lastmod>2026-06-16T13:51:08.776Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR</loc>
    <lastmod>2026-06-16T13:51:08.774Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR-2</loc>
    <lastmod>2026-06-16T13:51:08.772Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-R1</loc>
    <lastmod>2026-06-16T13:51:08.773Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3</loc>
    <lastmod>2026-06-16T13:51:08.775Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_1</loc>
    <lastmod>2026-06-16T13:51:08.771Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_2</loc>
    <lastmod>2026-06-16T13:51:08.782Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V4</loc>
    <lastmod>2026-06-15T22:53:52.133Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5</loc>
    <lastmod>2026-06-16T13:51:08.820Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5-VL</loc>
    <lastmod>2026-06-16T13:51:08.778Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/FlashLabs/Chroma1.0</loc>
    <lastmod>2026-06-16T13:51:08.820Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5</loc>
    <lastmod>2026-06-16T13:51:08.815Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5V</loc>
    <lastmod>2026-06-16T13:51:08.814Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6</loc>
    <lastmod>2026-06-16T13:51:08.809Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6V</loc>
    <lastmod>2026-06-16T13:51:08.812Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7</loc>
    <lastmod>2026-06-16T13:51:08.845Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7-Flash</loc>
    <lastmod>2026-06-16T13:51:08.810Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5</loc>
    <lastmod>2026-06-16T13:51:23.090Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.1</loc>
    <lastmod>2026-06-16T13:51:08.819Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.2</loc>
    <lastmod>2026-06-16T13:51:08.815Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-Glyph</loc>
    <lastmod>2026-06-16T13:51:23.091Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-OCR</loc>
    <lastmod>2026-06-16T13:51:23.093Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/DiffusionGemma</loc>
    <lastmod>2026-06-16T13:51:23.096Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/Gemma4</loc>
    <lastmod>2026-06-16T13:51:23.098Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/LLaDA-2.1</loc>
    <lastmod>2026-06-16T13:51:23.092Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.5-1T</loc>
    <lastmod>2026-06-16T13:51:23.094Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.6</loc>
    <lastmod>2026-06-16T13:51:23.089Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.5-1T</loc>
    <lastmod>2026-06-16T13:51:23.090Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.6-1T</loc>
    <lastmod>2026-06-16T13:51:23.093Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S1</loc>
    <lastmod>2026-06-16T13:51:23.125Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S2-Preview</loc>
    <lastmod>2026-06-16T13:51:23.132Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternVL/InternVL3.5</loc>
    <lastmod>2026-06-16T13:51:23.126Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Jina/Jina-reranker-m0</loc>
    <lastmod>2026-06-16T13:51:23.131Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/LiquidAI/LFM2.5</loc>
    <lastmod>2026-06-15T22:53:52.268Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.1</loc>
    <lastmod>2026-06-16T13:51:23.121Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.3-70B</loc>
    <lastmod>2026-06-16T13:51:23.124Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama4</loc>
    <lastmod>2026-06-16T13:51:23.123Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2</loc>
    <lastmod>2026-06-16T13:51:23.166Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.5</loc>
    <lastmod>2026-06-16T13:51:23.122Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.7</loc>
    <lastmod>2026-06-16T13:51:23.125Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M3</loc>
    <lastmod>2026-06-15T22:54:00.936Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Devstral-2</loc>
    <lastmod>2026-06-16T13:51:23.153Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Ministral-3</loc>
    <lastmod>2026-06-16T13:51:23.158Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Medium-3.5</loc>
    <lastmod>2026-06-16T13:51:23.157Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Small-4</loc>
    <lastmod>2026-06-16T13:51:23.160Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2</loc>
    <lastmod>2026-06-16T13:51:23.154Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.5</loc>
    <lastmod>2026-06-16T13:51:23.165Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.6</loc>
    <lastmod>2026-06-16T13:51:23.154Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.7-Code</loc>
    <lastmod>2026-06-12T18:20:22.088Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-Linear</loc>
    <lastmod>2026-06-16T13:51:23.195Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano</loc>
    <lastmod>2026-06-16T13:51:23.194Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano-Omni</loc>
    <lastmod>2026-06-16T13:51:23.197Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Super</loc>
    <lastmod>2026-06-16T13:51:23.197Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Ultra</loc>
    <lastmod>2026-06-12T21:52:51.647Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenAI/GPT-OSS</loc>
    <lastmod>2026-06-16T13:51:23.195Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenBMB/MiniCPM-V-4_6</loc>
    <lastmod>2026-06-16T13:51:23.193Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Poolside/Laguna-XS.2</loc>
    <lastmod>2026-06-16T13:51:23.191Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen2.5-VL</loc>
    <lastmod>2026-06-16T13:51:23.192Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3</loc>
    <lastmod>2026-06-16T13:51:23.222Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder</loc>
    <lastmod>2026-06-16T13:51:23.228Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder-Next</loc>
    <lastmod>2026-06-16T13:51:23.192Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Next</loc>
    <lastmod>2026-06-16T13:51:23.228Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-VL</loc>
    <lastmod>2026-06-16T13:51:23.226Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.5</loc>
    <lastmod>2026-06-16T13:51:23.226Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.6</loc>
    <lastmod>2026-06-16T13:51:23.225Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step-3.7-Flash</loc>
    <lastmod>2026-06-16T13:51:23.223Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3-VL-10B</loc>
    <lastmod>2026-06-16T13:51:23.224Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3.5</loc>
    <lastmod>2026-06-16T13:51:23.223Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Tencent/Hunyuan3-Preview</loc>
    <lastmod>2026-06-16T13:51:23.225Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2-Flash</loc>
    <lastmod>2026-06-16T13:51:23.258Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2.5</loc>
    <lastmod>2026-06-16T13:51:23.255Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/intro</loc>
    <lastmod>2026-06-16T13:51:23.256Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/autoregressive_model_benchmark</loc>
    <lastmod>2026-06-16T13:51:23.251Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/diffusion_model_benchmark</loc>
    <lastmod>2026-06-16T13:51:23.254Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/reference/server_arguments</loc>
    <lastmod>2026-06-16T13:51:23.252Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Cosmos/Cosmos3</loc>
    <lastmod>2026-06-16T13:51:23.250Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Ernie-Image/Ernie-Image</loc>
    <lastmod>2026-06-16T13:51:23.249Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/FLUX/FLUX</loc>
    <lastmod>2026-06-16T13:51:23.251Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Ideogram/Ideogram4</loc>
    <lastmod>2026-06-16T13:51:23.249Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/LTX/LTX2%20&amp;%20LTX2.3</loc>
    <lastmod>2026-05-11T05:42:51.096Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/LingBot-World/LingBot-World</loc>
    <lastmod>2026-06-16T13:51:30.303Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/MOVA/MOVA</loc>
    <lastmod>2026-06-16T13:51:30.304Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image</loc>
    <lastmod>2026-06-16T13:51:30.297Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image-Edit</loc>
    <lastmod>2026-06-16T13:51:30.301Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/SANA-WM/SANA-WM</loc>
    <lastmod>2026-06-16T13:51:30.298Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.1</loc>
    <lastmod>2026-06-16T13:51:30.301Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.2</loc>
    <lastmod>2026-06-16T13:51:30.299Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Z-Image/Z-Image-Turbo</loc>
    <lastmod>2026-06-16T13:51:30.300Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/intro</loc>
    <lastmod>2026-06-09T02:48:21.294Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/intro</loc>
    <lastmod>2026-06-16T13:51:30.331Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/specbundle_usage</loc>
    <lastmod>2026-06-16T13:51:30.326Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/supported_models</loc>
    <lastmod>2026-06-16T13:51:30.355Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/adaptive_speculative_decoding</loc>
    <lastmod>2026-06-16T13:51:30.325Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/attention_backend</loc>
    <lastmod>2026-06-16T13:51:30.354Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/breakable_cuda_graph</loc>
    <lastmod>2026-06-16T13:51:30.329Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/checkpoint_engine</loc>
    <lastmod>2026-06-16T13:51:30.910Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/cuda_graph_for_multi_modal_encoder</loc>
    <lastmod>2026-06-16T13:51:30.949Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/deterministic_inference</loc>
    <lastmod>2026-06-16T13:51:30.870Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_dpa_smg_guide</loc>
    <lastmod>2026-06-16T13:51:30.916Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_for_multi_modal_encoder</loc>
    <lastmod>2026-06-16T13:51:30.640Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/epd_disaggregation</loc>
    <lastmod>2026-06-16T13:51:30.885Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/expert_parallelism</loc>
    <lastmod>2026-06-16T13:51:30.955Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache</loc>
    <lastmod>2026-06-16T13:51:30.646Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_best_practices</loc>
    <lastmod>2026-06-16T13:51:30.680Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_design</loc>
    <lastmod>2026-06-16T13:51:31.381Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_storage_runtime_attach_detach</loc>
    <lastmod>2026-06-16T13:51:31.670Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hisparse_guide</loc>
    <lastmod>2026-06-16T13:51:31.620Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hyperparameter_tuning</loc>
    <lastmod>2026-06-16T13:51:31.600Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/llm-d</loc>
    <lastmod>2026-06-16T13:51:31.562Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/lora</loc>
    <lastmod>2026-06-16T13:51:31.590Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/object_storage</loc>
    <lastmod>2026-06-16T13:51:31.388Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/observability</loc>
    <lastmod>2026-06-16T13:51:31.626Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/overview</loc>
    <lastmod>2026-04-01T04:21:05.794Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pd_disaggregation</loc>
    <lastmod>2026-06-16T13:51:31.363Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/piecewise_cuda_graph</loc>
    <lastmod>2026-06-16T13:51:32.325Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pipeline_parallelism</loc>
    <lastmod>2026-06-16T13:51:32.120Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantization</loc>
    <lastmod>2026-06-16T13:51:32.204Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantized_kv_cache</loc>
    <lastmod>2026-06-16T13:51:32.198Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/separate_reasoning</loc>
    <lastmod>2026-06-16T13:51:32.156Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/server_arguments</loc>
    <lastmod>2026-06-16T13:51:32.397Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sgl_model_gateway</loc>
    <lastmod>2026-06-16T13:51:32.136Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sglang_for_rl</loc>
    <lastmod>2026-06-16T13:51:32.087Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/speculative_decoding</loc>
    <lastmod>2026-06-16T13:51:32.126Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs</loc>
    <lastmod>2026-06-16T13:51:32.445Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs_for_reasoning_models</loc>
    <lastmod>2026-06-16T13:51:32.475Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/tool_parser</loc>
    <lastmod>2026-06-16T13:51:32.473Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/vlm_query</loc>
    <lastmod>2026-06-16T13:51:32.474Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/native_api</loc>
    <lastmod>2026-06-16T13:51:32.470Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/offline_engine_api</loc>
    <lastmod>2026-06-16T13:51:32.450Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/ollama_api</loc>
    <lastmod>2026-06-16T13:51:32.449Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api</loc>
    <lastmod>2026-03-03T17:30:52.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_completions</loc>
    <lastmod>2026-06-16T13:51:32.448Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_embeddings</loc>
    <lastmod>2026-06-16T13:51:32.446Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_vision</loc>
    <lastmod>2026-06-16T13:51:32.554Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/overview</loc>
    <lastmod>2026-06-02T00:55:43.583Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/sampling_params</loc>
    <lastmod>2026-06-16T13:51:32.558Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/send_request</loc>
    <lastmod>2026-06-16T13:51:32.553Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/bench_serving</loc>
    <lastmod>2026-06-16T13:51:32.557Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/benchmark_and_profiling</loc>
    <lastmod>2026-06-16T13:51:32.546Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/contribution_guide</loc>
    <lastmod>2026-06-16T13:51:32.545Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_guide_using_docker</loc>
    <lastmod>2026-06-16T13:51:32.555Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_jit_kernel_guide</loc>
    <lastmod>2026-06-16T13:51:32.547Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/evaluating_new_models</loc>
    <lastmod>2026-06-16T13:51:32.547Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/msprobe_debugging_guide</loc>
    <lastmod>2026-06-16T13:51:32.627Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/overview</loc>
    <lastmod>2026-04-27T07:07:34.337Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/install</loc>
    <lastmod>2026-05-26T05:28:41.054Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/quickstart</loc>
    <lastmod>2026-05-04T20:51:06.602Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/amd_gpu</loc>
    <lastmod>2026-06-16T13:51:32.614Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/apple_metal</loc>
    <lastmod>2026-06-16T13:51:32.613Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_contribution_guide</loc>
    <lastmod>2026-06-16T13:51:32.615Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu</loc>
    <lastmod>2026-06-16T13:51:32.616Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_accuracy_evaluation</loc>
    <lastmod>2026-06-16T13:51:32.729Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_best_practice</loc>
    <lastmod>2026-06-16T13:51:32.745Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_deepseek_example</loc>
    <lastmod>2026-06-16T13:51:32.689Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_environment_variables</loc>
    <lastmod>2026-06-16T13:51:32.705Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_faq</loc>
    <lastmod>2026-06-16T13:51:32.704Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_glm5_examples</loc>
    <lastmod>2026-06-16T13:51:32.707Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_operator_development</loc>
    <lastmod>2026-06-15T13:12:38.796Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_operator_performance_optimizing</loc>
    <lastmod>2026-06-16T13:51:32.706Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_optimization</loc>
    <lastmod>2026-06-16T13:51:32.705Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_performance_testing</loc>
    <lastmod>2026-06-16T13:51:32.820Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_profiling</loc>
    <lastmod>2026-06-16T13:51:32.819Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quantization</loc>
    <lastmod>2026-06-16T13:51:32.800Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quick_start</loc>
    <lastmod>2026-06-16T13:51:32.804Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_5_examples</loc>
    <lastmod>2026-06-16T13:51:32.816Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_examples</loc>
    <lastmod>2026-06-16T13:51:32.803Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_ring_sp_performance</loc>
    <lastmod>2026-06-16T13:51:32.802Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_features</loc>
    <lastmod>2026-06-16T13:51:32.831Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_models</loc>
    <lastmod>2026-06-16T13:51:32.804Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_new_models</loc>
    <lastmod>2026-06-16T13:51:32.801Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/deepseek_r1</loc>
    <lastmod>2026-06-16T13:51:32.900Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/deepseek_v3_2</loc>
    <lastmod>2026-06-16T13:51:32.912Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/glm5_1</loc>
    <lastmod>2026-06-16T13:51:32.913Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/kimi_k2_6</loc>
    <lastmod>2026-06-16T13:51:32.898Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/minimax_m2_5</loc>
    <lastmod>2026-06-16T13:51:32.899Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3-8b</loc>
    <lastmod>2026-06-16T13:51:32.874Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_235b_a22b</loc>
    <lastmod>2026-06-16T13:51:32.874Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_30b_a3b</loc>
    <lastmod>2026-06-16T13:51:32.876Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_32b</loc>
    <lastmod>2026-06-16T13:51:32.875Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_5_397b</loc>
    <lastmod>2026-06-16T13:51:32.873Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_6_27b</loc>
    <lastmod>2026-06-16T13:51:32.954Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_6_35b_a3b</loc>
    <lastmod>2026-06-16T13:51:32.953Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_next_80b_a3b_instruct</loc>
    <lastmod>2026-06-16T13:51:32.954Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/mindspore_backend</loc>
    <lastmod>2026-06-16T13:51:32.951Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/cpu_server</loc>
    <lastmod>2026-06-16T13:51:32.952Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/mthreads_gpu</loc>
    <lastmod>2026-06-16T13:51:32.944Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia-gpus</loc>
    <lastmod>2026-06-16T13:51:32.943Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia_jetson</loc>
    <lastmod>2026-04-21T07:18:19.052Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/overview</loc>
    <lastmod>2026-04-21T07:18:19.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/plugin</loc>
    <lastmod>2026-06-16T13:51:32.984Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/tpu</loc>
    <lastmod>2026-04-21T08:13:05.304Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/xpu</loc>
    <lastmod>2026-06-16T13:51:32.983Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/custom_chat_template</loc>
    <lastmod>2026-06-16T13:51:32.980Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/environment_variables</loc>
    <lastmod>2026-06-16T13:51:32.982Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/faq</loc>
    <lastmod>2026-06-16T13:51:32.977Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/choices_methods</loc>
    <lastmod>2026-06-16T13:51:32.976Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_index</loc>
    <lastmod>2026-06-16T13:51:32.974Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_tutorial</loc>
    <lastmod>2026-06-16T13:51:32.976Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/deploy_on_k8s</loc>
    <lastmod>2026-06-16T13:51:32.975Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/lws_pd/lws_pd_deploy</loc>
    <lastmod>2026-06-16T13:51:33.011Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node</loc>
    <lastmod>2026-06-16T13:51:33.009Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node_index</loc>
    <lastmod>2026-06-16T13:51:33.008Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/rbg_pd/deepseekv32_pd</loc>
    <lastmod>2026-06-16T13:51:33.006Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/nightly_precision_regression</loc>
    <lastmod>2026-06-16T13:51:33.011Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/overview</loc>
    <lastmod>2026-04-01T04:21:05.821Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/post_training_integration</loc>
    <lastmod>2026-06-16T13:51:33.006Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_metrics</loc>
    <lastmod>2026-06-16T13:51:33.007Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_request_trace</loc>
    <lastmod>2026-06-16T13:51:33.009Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/cli</loc>
    <lastmod>2026-06-10T06:19:01.043Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/openai_api</loc>
    <lastmod>2026-06-05T02:46:29.588Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/post_processing</loc>
    <lastmod>2026-06-16T13:51:33.035Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/attention_backends</loc>
    <lastmod>2026-05-19T09:47:12.107Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/cache_dit</loc>
    <lastmod>2026-06-10T06:19:01.058Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/caching-acceleration</loc>
    <lastmod>2026-06-10T06:19:01.041Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ci_perf</loc>
    <lastmod>2026-04-21T07:18:40.380Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/compatibility_matrix</loc>
    <lastmod>2026-06-10T06:19:01.040Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/contributing</loc>
    <lastmod>2026-06-16T13:51:33.031Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/deployment_cookbook</loc>
    <lastmod>2026-06-10T06:19:01.074Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/disaggregation</loc>
    <lastmod>2026-06-16T13:51:33.072Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/dynamic_batching</loc>
    <lastmod>2026-06-10T06:19:11.041Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/environment_variables</loc>
    <lastmod>2026-06-11T15:15:48.750Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion</loc>
    <lastmod>2026-06-10T06:19:11.039Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/installation</loc>
    <lastmod>2026-06-10T06:19:11.037Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/performance-optimization</loc>
    <lastmod>2026-06-10T06:19:11.043Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/profiling</loc>
    <lastmod>2026-03-27T19:16:51.341Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/progressive_resolution</loc>
    <lastmod>2026-06-11T15:20:28.098Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/quantization</loc>
    <lastmod>2026-06-16T13:51:33.067Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ring_sp_performance</loc>
    <lastmod>2026-06-16T13:51:33.067Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/support_new_models</loc>
    <lastmod>2026-06-16T13:51:33.099Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/teacache</loc>
    <lastmod>2026-06-10T06:19:24.192Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models</loc>
    <lastmod>2026-04-21T07:18:48.656Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/classify_models</loc>
    <lastmod>2026-06-16T13:51:33.099Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/diffusion_language_models</loc>
    <lastmod>2026-06-16T13:51:33.097Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/embedding_models</loc>
    <lastmod>2026-04-21T07:18:48.654Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/generative_models</loc>
    <lastmod>2026-06-16T13:51:33.093Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/mindspore_models</loc>
    <lastmod>2026-06-16T13:51:33.096Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/modelscope</loc>
    <lastmod>2026-06-16T13:51:33.092Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/multimodal_language_models</loc>
    <lastmod>2026-06-16T13:51:33.091Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/rerank_models</loc>
    <lastmod>2026-06-16T13:51:33.118Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/reward_models</loc>
    <lastmod>2026-06-16T13:51:33.117Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/support_new_models</loc>
    <lastmod>2026-04-21T07:18:58.462Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/transformers_fallback</loc>
    <lastmod>2026-06-16T13:51:33.116Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io</loc>
    <lastmod>2026-06-16T01:30:28.072Z</lastmod>
  </url>
</urlset>