<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">
    
  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-Math-V2</loc>
    <lastmod>2026-06-15T07:16:26.044Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR</loc>
    <lastmod>2026-06-15T07:16:26.020Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR-2</loc>
    <lastmod>2026-06-15T07:16:26.045Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-R1</loc>
    <lastmod>2026-06-15T07:16:26.047Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3</loc>
    <lastmod>2026-06-15T07:16:26.050Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_1</loc>
    <lastmod>2026-06-15T07:16:26.049Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_2</loc>
    <lastmod>2026-06-15T07:16:26.046Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V4</loc>
    <lastmod>2026-06-13T18:47:28.252Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5</loc>
    <lastmod>2026-06-15T07:16:26.081Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5-VL</loc>
    <lastmod>2026-06-15T07:16:26.022Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/FlashLabs/Chroma1.0</loc>
    <lastmod>2026-06-15T07:16:26.078Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5</loc>
    <lastmod>2026-06-15T07:16:26.077Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5V</loc>
    <lastmod>2026-06-15T07:16:26.078Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6</loc>
    <lastmod>2026-06-15T07:16:26.075Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6V</loc>
    <lastmod>2026-06-15T07:16:26.079Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7</loc>
    <lastmod>2026-06-15T07:16:26.076Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7-Flash</loc>
    <lastmod>2026-06-15T07:16:26.068Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5</loc>
    <lastmod>2026-06-15T07:16:26.080Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.1</loc>
    <lastmod>2026-06-15T07:16:26.075Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-Glyph</loc>
    <lastmod>2026-06-15T07:16:26.121Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-OCR</loc>
    <lastmod>2026-06-15T07:16:26.107Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/DiffusionGemma</loc>
    <lastmod>2026-06-15T07:16:26.095Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/Gemma4</loc>
    <lastmod>2026-06-15T07:16:26.122Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/LLaDA-2.1</loc>
    <lastmod>2026-06-15T07:16:26.112Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.5-1T</loc>
    <lastmod>2026-06-15T07:16:26.106Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.6</loc>
    <lastmod>2026-06-15T07:16:26.108Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.5-1T</loc>
    <lastmod>2026-06-15T07:16:26.096Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.6-1T</loc>
    <lastmod>2026-06-15T07:16:26.106Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S1</loc>
    <lastmod>2026-06-15T07:16:26.105Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S2-Preview</loc>
    <lastmod>2026-06-15T07:16:26.155Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternVL/InternVL3.5</loc>
    <lastmod>2026-06-15T07:16:26.149Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Jina/Jina-reranker-m0</loc>
    <lastmod>2026-06-15T07:16:26.153Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/LiquidAI/LFM2.5</loc>
    <lastmod>2026-06-13T18:47:37.317Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.1</loc>
    <lastmod>2026-06-15T07:16:26.152Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.3-70B</loc>
    <lastmod>2026-06-15T07:16:26.151Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama4</loc>
    <lastmod>2026-06-15T07:16:26.154Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2</loc>
    <lastmod>2026-06-15T07:16:26.152Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.5</loc>
    <lastmod>2026-06-15T07:16:26.150Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.7</loc>
    <lastmod>2026-06-15T07:16:26.149Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M3</loc>
    <lastmod>2026-06-15T07:16:26.196Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Devstral-2</loc>
    <lastmod>2026-06-15T07:16:26.184Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Ministral-3</loc>
    <lastmod>2026-06-15T07:16:26.182Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Medium-3.5</loc>
    <lastmod>2026-06-15T07:16:26.187Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Small-4</loc>
    <lastmod>2026-06-15T07:16:26.180Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2</loc>
    <lastmod>2026-06-15T07:16:26.178Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.5</loc>
    <lastmod>2026-06-15T07:16:26.181Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.6</loc>
    <lastmod>2026-06-15T07:16:26.182Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.7-Code</loc>
    <lastmod>2026-06-12T18:20:22.088Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-Linear</loc>
    <lastmod>2026-06-15T07:16:26.180Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano</loc>
    <lastmod>2026-06-15T07:16:35.429Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano-Omni</loc>
    <lastmod>2026-06-15T07:16:35.418Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Super</loc>
    <lastmod>2026-06-15T07:16:35.430Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Ultra</loc>
    <lastmod>2026-06-12T21:52:51.647Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenAI/GPT-OSS</loc>
    <lastmod>2026-06-15T07:16:35.423Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenBMB/MiniCPM-V-4_6</loc>
    <lastmod>2026-06-15T07:16:35.421Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Poolside/Laguna-XS.2</loc>
    <lastmod>2026-06-15T07:16:35.420Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen2.5-VL</loc>
    <lastmod>2026-06-15T07:16:35.424Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3</loc>
    <lastmod>2026-06-15T07:16:35.457Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder</loc>
    <lastmod>2026-06-15T07:16:35.420Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder-Next</loc>
    <lastmod>2026-06-15T07:16:35.417Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Next</loc>
    <lastmod>2026-06-15T07:16:35.464Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-VL</loc>
    <lastmod>2026-06-15T07:16:35.464Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.5</loc>
    <lastmod>2026-06-15T07:16:35.463Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.6</loc>
    <lastmod>2026-06-15T07:16:35.460Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step-3.7-Flash</loc>
    <lastmod>2026-06-15T07:16:35.455Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3-VL-10B</loc>
    <lastmod>2026-06-15T07:16:35.448Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3.5</loc>
    <lastmod>2026-06-15T07:16:35.461Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Tencent/Hunyuan3-Preview</loc>
    <lastmod>2026-06-15T07:16:35.449Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2-Flash</loc>
    <lastmod>2026-06-15T07:16:35.453Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2.5</loc>
    <lastmod>2026-06-15T07:16:35.497Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/intro</loc>
    <lastmod>2026-06-12T18:20:22.180Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/autoregressive_model_benchmark</loc>
    <lastmod>2026-06-15T07:16:35.500Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/diffusion_model_benchmark</loc>
    <lastmod>2026-06-15T07:16:35.498Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/reference/server_arguments</loc>
    <lastmod>2026-06-15T07:16:35.496Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Cosmos/Cosmos3</loc>
    <lastmod>2026-06-15T07:16:35.479Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Ernie-Image/Ernie-Image</loc>
    <lastmod>2026-06-15T07:16:35.499Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/FLUX/FLUX</loc>
    <lastmod>2026-06-15T07:16:35.495Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Ideogram/Ideogram4</loc>
    <lastmod>2026-06-15T07:16:35.478Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/LTX/LTX2%20&amp;%20LTX2.3</loc>
    <lastmod>2026-05-11T05:42:51.096Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/LingBot-World/LingBot-World</loc>
    <lastmod>2026-06-15T07:16:35.534Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/MOVA/MOVA</loc>
    <lastmod>2026-06-15T07:16:35.535Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image</loc>
    <lastmod>2026-06-15T07:16:35.540Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image-Edit</loc>
    <lastmod>2026-06-15T07:16:35.543Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/SANA-WM/SANA-WM</loc>
    <lastmod>2026-06-15T07:16:35.545Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.1</loc>
    <lastmod>2026-06-15T07:16:35.543Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.2</loc>
    <lastmod>2026-06-15T07:16:35.536Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Z-Image/Z-Image-Turbo</loc>
    <lastmod>2026-06-15T07:16:35.538Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/intro</loc>
    <lastmod>2026-06-09T02:48:21.294Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/intro</loc>
    <lastmod>2026-06-15T07:16:35.572Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/specbundle_usage</loc>
    <lastmod>2026-06-15T07:16:35.567Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/supported_models</loc>
    <lastmod>2026-06-15T07:16:35.571Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/adaptive_speculative_decoding</loc>
    <lastmod>2026-06-15T07:16:35.568Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/attention_backend</loc>
    <lastmod>2026-06-15T07:16:35.570Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/breakable_cuda_graph</loc>
    <lastmod>2026-06-15T07:16:35.569Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/checkpoint_engine</loc>
    <lastmod>2026-06-15T07:16:35.560Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/cuda_graph_for_multi_modal_encoder</loc>
    <lastmod>2026-06-15T07:16:35.619Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/deterministic_inference</loc>
    <lastmod>2026-06-15T07:16:35.617Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_dpa_smg_guide</loc>
    <lastmod>2026-06-15T07:16:35.607Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_for_multi_modal_encoder</loc>
    <lastmod>2026-06-15T07:16:35.606Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/epd_disaggregation</loc>
    <lastmod>2026-06-15T07:16:35.614Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/expert_parallelism</loc>
    <lastmod>2026-06-15T07:16:35.610Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache</loc>
    <lastmod>2026-06-15T07:16:35.609Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_best_practices</loc>
    <lastmod>2026-06-15T07:16:35.618Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_design</loc>
    <lastmod>2026-06-15T07:16:35.613Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_storage_runtime_attach_detach</loc>
    <lastmod>2026-06-15T07:16:35.649Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hisparse_guide</loc>
    <lastmod>2026-06-15T07:16:35.648Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hyperparameter_tuning</loc>
    <lastmod>2026-06-15T07:16:35.646Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/llm-d</loc>
    <lastmod>2026-06-15T07:16:35.645Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/lora</loc>
    <lastmod>2026-06-15T07:16:35.647Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/object_storage</loc>
    <lastmod>2026-06-15T07:16:35.645Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/observability</loc>
    <lastmod>2026-06-15T07:16:35.633Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/overview</loc>
    <lastmod>2026-04-01T04:21:05.794Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pd_disaggregation</loc>
    <lastmod>2026-06-15T07:16:35.644Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/piecewise_cuda_graph</loc>
    <lastmod>2026-06-15T07:16:35.643Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pipeline_parallelism</loc>
    <lastmod>2026-06-15T07:16:35.681Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantization</loc>
    <lastmod>2026-06-15T07:16:35.680Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantized_kv_cache</loc>
    <lastmod>2026-06-15T07:16:35.676Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/separate_reasoning</loc>
    <lastmod>2026-06-15T07:16:35.674Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/server_arguments</loc>
    <lastmod>2026-06-15T07:16:35.706Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sgl_model_gateway</loc>
    <lastmod>2026-06-15T07:16:35.678Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sglang_for_rl</loc>
    <lastmod>2026-06-15T07:16:35.672Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/speculative_decoding</loc>
    <lastmod>2026-06-15T07:16:35.673Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs</loc>
    <lastmod>2026-06-15T07:16:35.675Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs_for_reasoning_models</loc>
    <lastmod>2026-06-15T07:16:35.735Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/tool_parser</loc>
    <lastmod>2026-06-15T07:16:35.738Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/vlm_query</loc>
    <lastmod>2026-06-15T07:16:35.738Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/native_api</loc>
    <lastmod>2026-06-15T07:16:35.733Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/offline_engine_api</loc>
    <lastmod>2026-06-15T07:16:35.737Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/ollama_api</loc>
    <lastmod>2026-06-15T07:16:35.741Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api</loc>
    <lastmod>2026-03-03T17:30:52.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_completions</loc>
    <lastmod>2026-06-15T07:16:35.735Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_embeddings</loc>
    <lastmod>2026-06-15T07:16:35.734Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_vision</loc>
    <lastmod>2026-06-15T07:16:35.736Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/overview</loc>
    <lastmod>2026-06-02T00:55:43.583Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/sampling_params</loc>
    <lastmod>2026-06-15T07:16:35.769Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/send_request</loc>
    <lastmod>2026-06-15T07:16:35.768Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/bench_serving</loc>
    <lastmod>2026-06-15T07:16:35.766Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/benchmark_and_profiling</loc>
    <lastmod>2026-06-15T07:16:35.770Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/contribution_guide</loc>
    <lastmod>2026-06-15T07:16:35.773Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_guide_using_docker</loc>
    <lastmod>2026-06-15T07:16:35.764Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_jit_kernel_guide</loc>
    <lastmod>2026-06-15T07:16:35.767Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/evaluating_new_models</loc>
    <lastmod>2026-06-15T07:16:35.765Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/msprobe_debugging_guide</loc>
    <lastmod>2026-06-15T07:16:35.768Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/overview</loc>
    <lastmod>2026-04-27T07:07:34.337Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/install</loc>
    <lastmod>2026-05-26T05:28:41.054Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/quickstart</loc>
    <lastmod>2026-05-04T20:51:06.602Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/amd_gpu</loc>
    <lastmod>2026-06-15T07:16:35.797Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/apple_metal</loc>
    <lastmod>2026-06-15T07:16:35.815Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_contribution_guide</loc>
    <lastmod>2026-06-15T07:16:35.798Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu</loc>
    <lastmod>2026-06-15T07:16:35.796Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_accuracy_evaluation</loc>
    <lastmod>2026-06-15T07:16:35.796Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_best_practice</loc>
    <lastmod>2026-06-15T07:16:35.856Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_deepseek_example</loc>
    <lastmod>2026-06-15T07:16:35.845Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_environment_variables</loc>
    <lastmod>2026-06-15T07:16:35.846Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_faq</loc>
    <lastmod>2026-06-15T07:16:35.843Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_glm5_examples</loc>
    <lastmod>2026-06-15T07:16:35.844Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_operator_development</loc>
    <lastmod>2026-05-21T09:33:14.499Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_operator_performance_optimizing</loc>
    <lastmod>2026-06-15T07:16:35.842Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_optimization</loc>
    <lastmod>2026-06-15T07:16:35.850Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_performance_testing</loc>
    <lastmod>2026-06-15T07:16:35.844Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_profiling</loc>
    <lastmod>2026-06-15T07:16:35.886Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quantization</loc>
    <lastmod>2026-06-15T07:16:35.883Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quick_start</loc>
    <lastmod>2026-06-15T07:16:35.871Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_5_examples</loc>
    <lastmod>2026-06-15T07:16:35.884Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_examples</loc>
    <lastmod>2026-06-15T07:16:35.885Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_ring_sp_performance</loc>
    <lastmod>2026-06-15T07:16:35.882Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_features</loc>
    <lastmod>2026-06-15T07:16:35.892Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_models</loc>
    <lastmod>2026-06-15T07:16:35.883Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_new_models</loc>
    <lastmod>2026-04-27T09:13:38.997Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/deepseek_r1</loc>
    <lastmod>2026-06-15T07:16:35.881Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/deepseek_v3_2</loc>
    <lastmod>2026-06-15T07:16:35.929Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/glm5_1</loc>
    <lastmod>2026-06-15T07:16:35.938Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/kimi_k2_6</loc>
    <lastmod>2026-06-15T07:16:35.935Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/minimax_m2_5</loc>
    <lastmod>2026-06-15T07:16:35.937Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3-8b</loc>
    <lastmod>2026-06-15T07:16:35.930Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_235b_a22b</loc>
    <lastmod>2026-06-15T07:16:35.933Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_30b_a3b</loc>
    <lastmod>2026-06-15T07:16:35.932Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_32b</loc>
    <lastmod>2026-06-15T07:16:35.930Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_5_397b</loc>
    <lastmod>2026-06-15T07:16:35.931Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_6_27b</loc>
    <lastmod>2026-06-15T07:16:35.934Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_6_35b_a3b</loc>
    <lastmod>2026-06-15T07:16:35.975Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/best_practice/qwen3_next_80b_a3b_instruct</loc>
    <lastmod>2026-06-15T07:16:35.972Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/mindspore_backend</loc>
    <lastmod>2026-06-15T07:16:35.959Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/cpu_server</loc>
    <lastmod>2026-06-15T07:16:35.973Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/mthreads_gpu</loc>
    <lastmod>2026-06-15T07:16:35.962Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia-gpus</loc>
    <lastmod>2026-06-15T07:16:35.958Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia_jetson</loc>
    <lastmod>2026-04-21T07:18:19.052Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/overview</loc>
    <lastmod>2026-04-21T07:18:19.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/plugin</loc>
    <lastmod>2026-06-15T07:16:35.961Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/tpu</loc>
    <lastmod>2026-04-21T08:13:05.304Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/xpu</loc>
    <lastmod>2026-06-15T07:16:36.004Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/custom_chat_template</loc>
    <lastmod>2026-06-15T07:16:36.005Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/environment_variables</loc>
    <lastmod>2026-06-15T07:16:36.048Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/faq</loc>
    <lastmod>2026-06-15T07:16:36.004Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/choices_methods</loc>
    <lastmod>2026-06-15T07:16:36.006Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_index</loc>
    <lastmod>2026-06-15T07:16:36.002Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_tutorial</loc>
    <lastmod>2026-06-15T07:16:36.001Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/deploy_on_k8s</loc>
    <lastmod>2026-06-15T07:16:36.005Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/lws_pd/lws_pd_deploy</loc>
    <lastmod>2026-06-15T07:16:36.003Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node</loc>
    <lastmod>2026-06-15T07:16:36.079Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node_index</loc>
    <lastmod>2026-06-15T07:16:36.082Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/rbg_pd/deepseekv32_pd</loc>
    <lastmod>2026-06-15T07:16:36.076Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/nightly_precision_regression</loc>
    <lastmod>2026-06-15T07:16:36.081Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/overview</loc>
    <lastmod>2026-04-01T04:21:05.821Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/post_training_integration</loc>
    <lastmod>2026-06-15T07:16:36.078Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_metrics</loc>
    <lastmod>2026-06-15T07:16:36.077Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_request_trace</loc>
    <lastmod>2026-06-15T07:16:36.079Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/cli</loc>
    <lastmod>2026-06-10T06:19:01.043Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/openai_api</loc>
    <lastmod>2026-06-05T02:46:29.588Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/post_processing</loc>
    <lastmod>2026-06-15T07:16:36.108Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/attention_backends</loc>
    <lastmod>2026-05-19T09:47:12.107Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/cache_dit</loc>
    <lastmod>2026-06-10T06:19:01.058Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/caching-acceleration</loc>
    <lastmod>2026-06-10T06:19:01.041Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ci_perf</loc>
    <lastmod>2026-04-21T07:18:40.380Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/compatibility_matrix</loc>
    <lastmod>2026-06-10T06:19:01.040Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/contributing</loc>
    <lastmod>2026-06-15T07:16:36.109Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/deployment_cookbook</loc>
    <lastmod>2026-06-10T06:19:01.074Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/disaggregation</loc>
    <lastmod>2026-06-15T07:16:36.101Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/dynamic_batching</loc>
    <lastmod>2026-06-10T06:19:11.041Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/environment_variables</loc>
    <lastmod>2026-06-11T15:15:48.750Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion</loc>
    <lastmod>2026-06-10T06:19:11.039Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/installation</loc>
    <lastmod>2026-06-10T06:19:11.037Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/performance-optimization</loc>
    <lastmod>2026-06-10T06:19:11.043Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/profiling</loc>
    <lastmod>2026-03-27T19:16:51.341Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/progressive_resolution</loc>
    <lastmod>2026-06-11T15:20:28.098Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/quantization</loc>
    <lastmod>2026-06-15T07:16:36.130Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ring_sp_performance</loc>
    <lastmod>2026-06-15T07:16:36.131Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/support_new_models</loc>
    <lastmod>2026-06-15T07:16:36.132Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/teacache</loc>
    <lastmod>2026-06-10T06:19:24.192Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models</loc>
    <lastmod>2026-04-21T07:18:48.656Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/classify_models</loc>
    <lastmod>2026-06-15T07:16:36.155Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/diffusion_language_models</loc>
    <lastmod>2026-06-15T07:16:36.171Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/embedding_models</loc>
    <lastmod>2026-04-21T07:18:48.654Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/generative_models</loc>
    <lastmod>2026-06-15T07:16:36.156Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/mindspore_models</loc>
    <lastmod>2026-06-15T07:16:36.158Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/modelscope</loc>
    <lastmod>2026-06-15T07:16:36.158Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/multimodal_language_models</loc>
    <lastmod>2026-06-15T07:16:36.157Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/rerank_models</loc>
    <lastmod>2026-06-15T07:16:36.156Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/reward_models</loc>
    <lastmod>2026-06-15T07:16:36.191Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/support_new_models</loc>
    <lastmod>2026-04-21T07:18:58.462Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/transformers_fallback</loc>
    <lastmod>2026-06-15T07:16:36.188Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io</loc>
    <lastmod>2026-06-08T20:31:45.847Z</lastmod>
  </url>
</urlset>