<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">
    
  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-Math-V2</loc>
    <lastmod>2026-05-15T18:48:00.010Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR</loc>
    <lastmod>2026-05-15T18:47:59.996Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR-2</loc>
    <lastmod>2026-05-15T18:47:59.999Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-R1</loc>
    <lastmod>2026-05-15T18:48:00.011Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3</loc>
    <lastmod>2026-05-15T18:48:00.002Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_1</loc>
    <lastmod>2026-05-15T18:48:00.012Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_2</loc>
    <lastmod>2026-05-15T18:47:59.995Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V4</loc>
    <lastmod>2026-05-15T18:47:59.994Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5</loc>
    <lastmod>2026-05-15T18:48:00.064Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5-VL</loc>
    <lastmod>2026-05-15T18:47:59.993Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/FlashLabs/Chroma1.0</loc>
    <lastmod>2026-05-15T18:48:00.048Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5</loc>
    <lastmod>2026-05-15T18:48:00.046Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5V</loc>
    <lastmod>2026-05-15T18:48:00.042Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6</loc>
    <lastmod>2026-05-15T18:48:00.045Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6V</loc>
    <lastmod>2026-05-15T18:48:00.051Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7</loc>
    <lastmod>2026-05-15T18:48:00.044Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7-Flash</loc>
    <lastmod>2026-05-15T18:48:00.053Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5</loc>
    <lastmod>2026-05-15T18:48:00.063Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.1</loc>
    <lastmod>2026-05-15T18:48:00.041Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-Glyph</loc>
    <lastmod>2026-05-15T18:48:00.107Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-OCR</loc>
    <lastmod>2026-05-15T18:48:00.109Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/Gemma4</loc>
    <lastmod>2026-05-15T18:48:00.108Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/LLaDA-2.1</loc>
    <lastmod>2026-05-15T18:48:00.106Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.5-1T</loc>
    <lastmod>2026-05-15T18:48:00.095Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.6</loc>
    <lastmod>2026-05-15T18:48:00.099Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.5-1T</loc>
    <lastmod>2026-05-15T18:48:00.105Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.6-1T</loc>
    <lastmod>2026-05-15T18:48:00.104Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S1</loc>
    <lastmod>2026-05-15T18:48:00.100Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S2-Preview</loc>
    <lastmod>2026-05-15T18:48:00.096Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternVL/InternVL3.5</loc>
    <lastmod>2026-05-15T18:48:03.258Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Jina/Jina-reranker-m0</loc>
    <lastmod>2026-05-15T18:48:03.256Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.1</loc>
    <lastmod>2026-05-15T18:48:03.259Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.3-70B</loc>
    <lastmod>2026-05-15T18:48:03.256Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama4</loc>
    <lastmod>2026-05-15T18:48:03.262Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2</loc>
    <lastmod>2026-05-15T18:48:03.257Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.5</loc>
    <lastmod>2026-05-15T18:48:03.261Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.7</loc>
    <lastmod>2026-05-15T18:48:03.260Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Devstral-2</loc>
    <lastmod>2026-05-15T18:48:03.255Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Ministral-3</loc>
    <lastmod>2026-05-15T18:48:03.259Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Medium-3.5</loc>
    <lastmod>2026-05-15T18:48:03.293Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Small-4</loc>
    <lastmod>2026-05-15T18:48:03.296Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2</loc>
    <lastmod>2026-05-15T18:48:03.286Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.5</loc>
    <lastmod>2026-05-15T18:48:03.298Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.6</loc>
    <lastmod>2026-05-15T18:48:03.297Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-Linear</loc>
    <lastmod>2026-05-15T18:48:03.292Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano</loc>
    <lastmod>2026-05-15T18:48:03.284Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano-Omni</loc>
    <lastmod>2026-05-15T18:48:03.289Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Super</loc>
    <lastmod>2026-05-15T18:48:03.300Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenAI/GPT-OSS</loc>
    <lastmod>2026-05-15T18:48:03.291Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenBMB/MiniCPM-V-4_6</loc>
    <lastmod>2026-05-15T18:48:03.327Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Poolside/Laguna-XS.2</loc>
    <lastmod>2026-05-15T18:48:03.329Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen2.5-VL</loc>
    <lastmod>2026-05-15T18:48:03.330Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3</loc>
    <lastmod>2026-05-15T18:48:03.331Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder</loc>
    <lastmod>2026-05-15T18:48:03.329Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder-Next</loc>
    <lastmod>2026-05-15T18:48:03.332Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Next</loc>
    <lastmod>2026-05-15T18:48:03.340Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-VL</loc>
    <lastmod>2026-05-15T18:48:03.327Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.5</loc>
    <lastmod>2026-05-15T18:48:03.328Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.6</loc>
    <lastmod>2026-05-15T18:48:03.326Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3-VL-10B</loc>
    <lastmod>2026-05-15T18:48:03.393Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3.5</loc>
    <lastmod>2026-05-15T18:48:03.392Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Tencent/Hunyuan3-Preview</loc>
    <lastmod>2026-05-15T18:48:03.375Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2-Flash</loc>
    <lastmod>2026-05-15T18:48:03.361Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2.5</loc>
    <lastmod>2026-05-15T18:48:03.363Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/intro</loc>
    <lastmod>2026-05-13T05:43:05.519Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/autoregressive_model_benchmark</loc>
    <lastmod>2026-05-15T18:48:03.377Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/diffusion_model_benchmark</loc>
    <lastmod>2026-05-15T18:48:03.378Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/reference/server_arguments</loc>
    <lastmod>2026-05-15T18:48:03.364Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/FLUX/FLUX</loc>
    <lastmod>2026-05-15T18:48:03.388Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/LTX/LTX2%20&amp;%20LTX2.3</loc>
    <lastmod>2026-05-11T05:42:51.096Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/MOVA/MOVA</loc>
    <lastmod>2026-05-15T18:48:03.426Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image</loc>
    <lastmod>2026-05-15T18:48:03.431Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image-Edit</loc>
    <lastmod>2026-05-15T18:48:03.429Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.1</loc>
    <lastmod>2026-05-15T18:48:03.428Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.2</loc>
    <lastmod>2026-05-15T18:48:03.427Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Z-Image/Z-Image-Turbo</loc>
    <lastmod>2026-05-15T18:48:03.421Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/intro</loc>
    <lastmod>2026-05-08T10:39:40.762Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/intro</loc>
    <lastmod>2026-05-15T18:48:03.457Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/specbundle_usage</loc>
    <lastmod>2026-05-15T18:48:03.456Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/supported_models</loc>
    <lastmod>2026-05-15T18:48:03.460Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/adaptive_speculative_decoding</loc>
    <lastmod>2026-05-15T18:48:03.454Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/attention_backend</loc>
    <lastmod>2026-05-15T18:48:03.454Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/breakable_cuda_graph</loc>
    <lastmod>2026-05-15T18:48:03.453Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/checkpoint_engine</loc>
    <lastmod>2026-05-15T18:48:03.460Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/cuda_graph_for_multi_modal_encoder</loc>
    <lastmod>2026-05-15T18:48:03.458Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/deterministic_inference</loc>
    <lastmod>2026-05-15T18:48:03.488Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_dpa_smg_guide</loc>
    <lastmod>2026-05-15T18:48:03.493Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_for_multi_modal_encoder</loc>
    <lastmod>2026-05-15T18:48:03.493Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/epd_disaggregation</loc>
    <lastmod>2026-05-15T18:48:03.492Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/expert_parallelism</loc>
    <lastmod>2026-05-15T18:48:03.489Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache</loc>
    <lastmod>2026-05-15T18:48:03.490Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_best_practices</loc>
    <lastmod>2026-05-15T18:48:03.495Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_design</loc>
    <lastmod>2026-05-15T18:48:03.491Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_storage_runtime_attach_detach</loc>
    <lastmod>2026-05-15T18:48:03.495Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hisparse_guide</loc>
    <lastmod>2026-05-15T18:48:03.535Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hyperparameter_tuning</loc>
    <lastmod>2026-05-15T18:48:03.528Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/lora</loc>
    <lastmod>2026-05-15T18:48:03.527Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/object_storage</loc>
    <lastmod>2026-05-15T18:48:03.534Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/observability</loc>
    <lastmod>2026-05-15T18:48:03.533Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/overview</loc>
    <lastmod>2026-04-01T04:21:05.794Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pd_disaggregation</loc>
    <lastmod>2026-05-15T18:48:03.530Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/piecewise_cuda_graph</loc>
    <lastmod>2026-05-15T18:48:03.531Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pipeline_parallelism</loc>
    <lastmod>2026-05-15T18:48:03.532Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantization</loc>
    <lastmod>2026-05-15T18:48:03.538Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantized_kv_cache</loc>
    <lastmod>2026-05-15T18:48:03.574Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/separate_reasoning</loc>
    <lastmod>2026-05-15T18:48:03.572Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/server_arguments</loc>
    <lastmod>2026-05-15T18:48:03.586Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sgl_model_gateway</loc>
    <lastmod>2026-05-15T18:48:03.576Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sglang_for_rl</loc>
    <lastmod>2026-05-15T18:48:03.571Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/speculative_decoding</loc>
    <lastmod>2026-05-15T18:48:03.569Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs</loc>
    <lastmod>2026-05-15T18:48:03.572Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs_for_reasoning_models</loc>
    <lastmod>2026-05-15T18:48:03.566Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/tool_parser</loc>
    <lastmod>2026-05-15T18:48:03.574Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/vlm_query</loc>
    <lastmod>2026-05-15T18:48:03.610Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/deepseek_ocr</loc>
    <lastmod>2026-05-15T18:48:03.613Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/deepseek_v3</loc>
    <lastmod>2026-05-15T18:48:03.612Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/deepseek_v32</loc>
    <lastmod>2026-05-15T18:48:03.615Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/glm45</loc>
    <lastmod>2026-05-15T18:48:03.612Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/glmv</loc>
    <lastmod>2026-05-15T18:48:03.614Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/gpt_oss</loc>
    <lastmod>2026-05-15T18:48:03.610Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/kimi_k2_5</loc>
    <lastmod>2026-05-15T18:48:03.611Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/llama4</loc>
    <lastmod>2026-05-15T18:48:03.609Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/minimax_m2</loc>
    <lastmod>2026-05-15T18:48:03.608Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/native_api</loc>
    <lastmod>2026-05-15T18:48:03.644Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/offline_engine_api</loc>
    <lastmod>2026-05-15T18:48:03.641Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/ollama_api</loc>
    <lastmod>2026-05-15T18:48:03.641Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api</loc>
    <lastmod>2026-03-03T17:30:52.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_completions</loc>
    <lastmod>2026-05-15T18:48:03.644Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_embeddings</loc>
    <lastmod>2026-05-15T18:48:03.640Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_vision</loc>
    <lastmod>2026-05-15T18:48:03.642Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/overview</loc>
    <lastmod>2026-04-01T04:21:05.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/popular_model_usage</loc>
    <lastmod>2026-04-21T07:17:40.729Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/qwen3</loc>
    <lastmod>2026-05-15T18:48:03.643Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/qwen3_5</loc>
    <lastmod>2026-05-15T18:48:03.674Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/qwen3_vl</loc>
    <lastmod>2026-05-15T18:48:03.673Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/sampling_params</loc>
    <lastmod>2026-05-15T18:48:03.678Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/send_request</loc>
    <lastmod>2026-05-15T18:48:03.676Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/bench_serving</loc>
    <lastmod>2026-05-15T18:48:03.675Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/benchmark_and_profiling</loc>
    <lastmod>2026-05-15T18:48:03.678Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/contribution_guide</loc>
    <lastmod>2026-05-15T18:48:03.676Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_guide_using_docker</loc>
    <lastmod>2026-05-15T18:48:03.671Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_jit_kernel_guide</loc>
    <lastmod>2026-05-15T18:48:03.671Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/evaluating_new_models</loc>
    <lastmod>2026-05-15T18:48:03.672Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/msprobe_debugging_guide</loc>
    <lastmod>2026-05-15T18:48:03.718Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/overview</loc>
    <lastmod>2026-04-27T07:07:34.337Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/install</loc>
    <lastmod>2026-05-06T09:37:38.151Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/quickstart</loc>
    <lastmod>2026-05-04T20:51:06.602Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/amd_gpu</loc>
    <lastmod>2026-05-15T18:48:03.719Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/apple_metal</loc>
    <lastmod>2026-05-15T18:48:03.716Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_contribution_guide</loc>
    <lastmod>2026-05-15T18:48:03.716Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu</loc>
    <lastmod>2026-05-15T18:48:03.717Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_accuracy_evaluation</loc>
    <lastmod>2026-05-15T18:48:03.742Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_best_practice</loc>
    <lastmod>2026-05-15T18:48:03.753Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_deepseek_example</loc>
    <lastmod>2026-05-15T18:48:03.740Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_environment_variables</loc>
    <lastmod>2026-05-15T18:48:03.746Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_faq</loc>
    <lastmod>2026-05-15T18:48:03.742Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_glm5_examples</loc>
    <lastmod>2026-05-15T18:48:03.743Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_optimization</loc>
    <lastmod>2026-05-15T18:48:03.750Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_performance_testing</loc>
    <lastmod>2026-05-15T18:48:03.754Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quantization</loc>
    <lastmod>2026-05-15T18:48:03.741Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quick_start</loc>
    <lastmod>2026-05-15T18:48:03.750Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_5_examples</loc>
    <lastmod>2026-05-15T18:48:03.779Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_examples</loc>
    <lastmod>2026-05-15T18:48:03.781Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_ring_sp_performance</loc>
    <lastmod>2026-05-15T18:48:03.779Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_features</loc>
    <lastmod>2026-05-15T18:48:03.786Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_models</loc>
    <lastmod>2026-05-15T18:48:03.777Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_new_models</loc>
    <lastmod>2026-04-27T09:13:38.997Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/mindspore_backend</loc>
    <lastmod>2026-05-15T18:48:03.782Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/cpu_server</loc>
    <lastmod>2026-05-15T18:48:03.778Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/mthreads_gpu</loc>
    <lastmod>2026-05-15T18:48:03.780Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia-gpus</loc>
    <lastmod>2026-05-15T18:48:03.783Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia_jetson</loc>
    <lastmod>2026-04-21T07:18:19.052Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/overview</loc>
    <lastmod>2026-04-21T07:18:19.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/plugin</loc>
    <lastmod>2026-05-15T18:48:03.812Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/tpu</loc>
    <lastmod>2026-04-21T08:13:05.304Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/xpu</loc>
    <lastmod>2026-05-15T18:48:03.810Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/custom_chat_template</loc>
    <lastmod>2026-05-15T18:48:03.814Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/environment_variables</loc>
    <lastmod>2026-05-15T18:48:03.815Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/faq</loc>
    <lastmod>2026-05-15T18:48:03.813Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/choices_methods</loc>
    <lastmod>2026-05-15T18:48:03.811Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_index</loc>
    <lastmod>2026-05-15T18:48:03.809Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_tutorial</loc>
    <lastmod>2026-05-15T18:48:03.844Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/deploy_on_k8s</loc>
    <lastmod>2026-05-15T18:48:03.840Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/lws_pd/lws_pd_deploy</loc>
    <lastmod>2026-05-15T18:48:03.845Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node</loc>
    <lastmod>2026-05-15T18:48:03.845Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node_index</loc>
    <lastmod>2026-05-15T18:48:03.841Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/rbg_pd/deepseekv32_pd</loc>
    <lastmod>2026-05-15T18:48:03.849Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/overview</loc>
    <lastmod>2026-04-01T04:21:05.821Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/post_training_integration</loc>
    <lastmod>2026-05-15T18:48:03.847Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_metrics</loc>
    <lastmod>2026-05-15T18:48:03.848Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_request_trace</loc>
    <lastmod>2026-05-15T18:48:03.842Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/cli</loc>
    <lastmod>2026-05-05T00:39:42.994Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/openai_api</loc>
    <lastmod>2026-04-21T07:18:32.425Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/post_processing</loc>
    <lastmod>2026-05-15T18:48:03.880Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/attention_backends</loc>
    <lastmod>2026-05-12T02:51:08.265Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/cache_dit</loc>
    <lastmod>2026-04-21T07:18:32.422Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/caching-acceleration</loc>
    <lastmod>2026-04-21T07:18:32.423Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ci_perf</loc>
    <lastmod>2026-04-21T07:18:40.380Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/compatibility_matrix</loc>
    <lastmod>2026-04-24T06:18:35.608Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/contributing</loc>
    <lastmod>2026-05-15T18:48:03.879Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/disaggregation</loc>
    <lastmod>2026-05-15T18:48:03.952Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/dynamic_batching</loc>
    <lastmod>2026-05-03T16:45:25.187Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/environment_variables</loc>
    <lastmod>2026-04-21T07:18:40.386Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion</loc>
    <lastmod>2026-05-03T16:45:25.184Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/installation</loc>
    <lastmod>2026-05-12T00:54:42.423Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/performance-optimization</loc>
    <lastmod>2026-05-03T16:45:25.185Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/profiling</loc>
    <lastmod>2026-03-27T19:16:51.341Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/quantization</loc>
    <lastmod>2026-05-15T18:48:03.953Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ring_sp_performance</loc>
    <lastmod>2026-05-15T18:48:03.942Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/support_new_models</loc>
    <lastmod>2026-05-15T18:48:03.951Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/teacache</loc>
    <lastmod>2026-04-21T07:18:48.653Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models</loc>
    <lastmod>2026-04-21T07:18:48.656Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/classify_models</loc>
    <lastmod>2026-05-15T18:48:03.977Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/diffusion_language_models</loc>
    <lastmod>2026-05-15T18:48:03.975Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/embedding_models</loc>
    <lastmod>2026-04-21T07:18:48.654Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/generative_models</loc>
    <lastmod>2026-05-15T18:48:03.975Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/mindspore_models</loc>
    <lastmod>2026-05-15T18:48:03.976Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/modelscope</loc>
    <lastmod>2026-05-15T18:48:03.974Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/multimodal_language_models</loc>
    <lastmod>2026-05-15T18:48:03.972Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/rerank_models</loc>
    <lastmod>2026-05-15T18:48:03.973Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/reward_models</loc>
    <lastmod>2026-05-15T18:48:03.998Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/support_new_models</loc>
    <lastmod>2026-04-21T07:18:58.462Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/transformers_fallback</loc>
    <lastmod>2026-05-15T18:48:03.997Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io</loc>
    <lastmod>2026-05-12T15:07:31.354Z</lastmod>
  </url>
</urlset>