<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">
    
  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-Math-V2</loc>
    <lastmod>2026-04-21T08:06:30.106Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR</loc>
    <lastmod>2026-04-21T08:06:30.097Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-OCR-2</loc>
    <lastmod>2026-04-21T08:06:30.099Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-R1</loc>
    <lastmod>2026-04-21T08:06:30.136Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3</loc>
    <lastmod>2026-04-21T08:06:30.092Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_1</loc>
    <lastmod>2026-04-21T08:06:30.129Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/DeepSeek/DeepSeek-V3_2</loc>
    <lastmod>2026-04-21T08:06:30.137Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5</loc>
    <lastmod>2026-04-21T08:06:30.112Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Ernie/Ernie4.5-VL</loc>
    <lastmod>2026-04-21T08:06:30.113Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/FlashLabs/Chroma1.0</loc>
    <lastmod>2026-04-21T08:06:30.183Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5</loc>
    <lastmod>2026-04-21T08:06:30.184Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.5V</loc>
    <lastmod>2026-04-21T08:06:30.186Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6</loc>
    <lastmod>2026-04-21T08:06:30.181Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.6V</loc>
    <lastmod>2026-04-21T08:06:30.174Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7</loc>
    <lastmod>2026-04-21T08:06:30.185Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-4.7-Flash</loc>
    <lastmod>2026-04-21T08:06:30.169Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5</loc>
    <lastmod>2026-04-21T08:06:30.170Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.1</loc>
    <lastmod>2026-04-21T08:06:30.173Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-Glyph</loc>
    <lastmod>2026-04-21T08:06:30.173Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-OCR</loc>
    <lastmod>2026-04-21T08:06:30.223Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Google/Gemma4</loc>
    <lastmod>2026-04-21T08:06:30.232Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/LLaDA-2.1</loc>
    <lastmod>2026-04-21T08:06:30.229Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ling-2.5-1T</loc>
    <lastmod>2026-04-21T08:06:30.230Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InclusionAI/Ring-2.5-1T</loc>
    <lastmod>2026-04-21T08:06:30.216Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternLM/Intern-S1</loc>
    <lastmod>2026-04-21T08:06:30.217Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/InternVL/InternVL3.5</loc>
    <lastmod>2026-04-21T08:06:30.215Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Jina/Jina-reranker-m0</loc>
    <lastmod>2026-04-21T08:06:30.218Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.1</loc>
    <lastmod>2026-04-21T08:06:30.224Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama3.3-70B</loc>
    <lastmod>2026-04-21T08:06:30.225Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Llama/Llama4</loc>
    <lastmod>2026-04-21T08:06:30.264Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2</loc>
    <lastmod>2026-04-21T08:06:30.268Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.5</loc>
    <lastmod>2026-04-21T08:06:30.285Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/MiniMax/MiniMax-M2.7</loc>
    <lastmod>2026-04-21T08:06:30.287Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Devstral-2</loc>
    <lastmod>2026-04-21T08:06:30.258Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Ministral-3</loc>
    <lastmod>2026-04-21T08:06:30.289Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Mistral/Mistral-Small-4</loc>
    <lastmod>2026-04-21T08:06:30.259Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2</loc>
    <lastmod>2026-04-21T08:06:30.262Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.5</loc>
    <lastmod>2026-04-21T08:06:30.263Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-K2.6</loc>
    <lastmod>2026-04-21T08:06:30.282Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Moonshotai/Kimi-Linear</loc>
    <lastmod>2026-04-21T08:06:30.335Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Nano</loc>
    <lastmod>2026-04-21T08:06:30.328Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/NVIDIA/Nemotron3-Super</loc>
    <lastmod>2026-04-21T08:06:30.326Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/OpenAI/GPT-OSS</loc>
    <lastmod>2026-04-21T08:06:30.332Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen2.5-VL</loc>
    <lastmod>2026-04-21T08:06:30.329Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3</loc>
    <lastmod>2026-04-21T08:06:30.372Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder</loc>
    <lastmod>2026-04-21T08:06:30.322Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Coder-Next</loc>
    <lastmod>2026-04-21T08:06:30.327Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-Next</loc>
    <lastmod>2026-04-21T08:06:30.323Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3-VL</loc>
    <lastmod>2026-04-21T08:06:30.324Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.5</loc>
    <lastmod>2026-04-21T08:06:30.330Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Qwen/Qwen3.6</loc>
    <lastmod>2026-04-21T08:06:30.376Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3-VL-10B</loc>
    <lastmod>2026-04-21T08:06:30.374Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/StepFun/Step3.5</loc>
    <lastmod>2026-04-21T08:06:30.371Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/Xiaomi/MiMo-V2-Flash</loc>
    <lastmod>2026-04-21T08:06:30.370Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/autoregressive/intro</loc>
    <lastmod>2026-04-20T20:38:16.230Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/autoregressive_model_benchmark</loc>
    <lastmod>2026-04-21T08:06:30.371Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/benchmarks/diffusion_model_benchmark</loc>
    <lastmod>2026-04-21T08:06:30.367Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/base/reference/server_arguments</loc>
    <lastmod>2026-04-21T08:06:30.366Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/FLUX/FLUX</loc>
    <lastmod>2026-04-21T08:06:30.367Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/MOVA/MOVA</loc>
    <lastmod>2026-04-21T08:06:30.422Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image</loc>
    <lastmod>2026-04-21T08:06:30.411Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Qwen-Image/Qwen-Image-Edit</loc>
    <lastmod>2026-04-21T08:06:30.421Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.1</loc>
    <lastmod>2026-04-21T08:06:30.417Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Wan/Wan2.2</loc>
    <lastmod>2026-04-21T08:06:30.415Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/Z-Image/Z-Image-Turbo</loc>
    <lastmod>2026-04-21T08:06:30.414Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/diffusion/intro</loc>
    <lastmod>2026-04-17T05:34:26.937Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/intro</loc>
    <lastmod>2026-04-21T08:06:30.412Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/specbundle_usage</loc>
    <lastmod>2026-04-21T08:06:30.463Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/cookbook/specbundle/supported_models</loc>
    <lastmod>2026-04-21T08:06:30.462Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/adaptive_speculative_decoding</loc>
    <lastmod>2026-04-21T08:06:30.458Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/attention_backend</loc>
    <lastmod>2026-04-21T08:06:30.459Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/breakable_cuda_graph</loc>
    <lastmod>2026-04-21T08:06:30.459Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/checkpoint_engine</loc>
    <lastmod>2026-04-21T08:06:30.460Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/cuda_graph_for_multi_modal_encoder</loc>
    <lastmod>2026-04-21T08:06:30.457Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/deterministic_inference</loc>
    <lastmod>2026-04-21T08:06:30.465Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_dpa_smg_guide</loc>
    <lastmod>2026-04-21T08:06:30.504Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/dp_for_multi_modal_encoder</loc>
    <lastmod>2026-04-21T08:06:30.503Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/epd_disaggregation</loc>
    <lastmod>2026-04-21T08:06:30.517Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/expert_parallelism</loc>
    <lastmod>2026-04-21T08:06:30.505Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache</loc>
    <lastmod>2026-04-21T08:06:30.499Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_best_practices</loc>
    <lastmod>2026-04-21T08:06:30.500Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_design</loc>
    <lastmod>2026-04-21T08:06:30.518Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hicache_storage_runtime_attach_detach</loc>
    <lastmod>2026-04-21T08:06:30.501Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hisparse_guide</loc>
    <lastmod>2026-04-21T08:06:30.498Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/hyperparameter_tuning</loc>
    <lastmod>2026-04-21T08:06:30.551Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/lora</loc>
    <lastmod>2026-04-21T08:06:30.551Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/object_storage</loc>
    <lastmod>2026-04-21T08:06:30.549Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/observability</loc>
    <lastmod>2026-04-21T08:06:30.548Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/overview</loc>
    <lastmod>2026-04-01T04:21:05.794Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pd_disaggregation</loc>
    <lastmod>2026-04-21T08:06:30.545Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/piecewise_cuda_graph</loc>
    <lastmod>2026-04-21T08:06:30.546Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/pipeline_parallelism</loc>
    <lastmod>2026-04-21T08:06:30.544Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantization</loc>
    <lastmod>2026-04-21T08:06:30.547Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/quantized_kv_cache</loc>
    <lastmod>2026-04-21T08:06:30.543Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/separate_reasoning</loc>
    <lastmod>2026-04-21T08:06:30.590Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/server_arguments</loc>
    <lastmod>2026-04-21T08:06:30.580Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sgl_model_gateway</loc>
    <lastmod>2026-04-21T08:06:30.597Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/sglang_for_rl</loc>
    <lastmod>2026-04-21T08:06:30.581Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/speculative_decoding</loc>
    <lastmod>2026-04-21T08:06:30.582Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs</loc>
    <lastmod>2026-04-21T08:06:30.583Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/structured_outputs_for_reasoning_models</loc>
    <lastmod>2026-04-21T08:06:30.584Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/tool_parser</loc>
    <lastmod>2026-04-21T08:06:30.585Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/advanced_features/vlm_query</loc>
    <lastmod>2026-04-21T08:06:30.591Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/deepseek_ocr</loc>
    <lastmod>2026-04-21T08:06:30.648Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/deepseek_v3</loc>
    <lastmod>2026-04-21T08:06:30.649Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/deepseek_v32</loc>
    <lastmod>2026-04-21T08:06:30.651Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/glm45</loc>
    <lastmod>2026-04-21T08:06:30.643Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/glmv</loc>
    <lastmod>2026-04-21T08:06:30.652Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/gpt_oss</loc>
    <lastmod>2026-04-21T08:06:30.644Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/kimi_k2_5</loc>
    <lastmod>2026-04-21T08:06:30.647Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/llama4</loc>
    <lastmod>2026-04-21T08:06:30.646Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/minimax_m2</loc>
    <lastmod>2026-04-21T08:06:30.645Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/native_api</loc>
    <lastmod>2026-04-21T08:06:30.644Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/offline_engine_api</loc>
    <lastmod>2026-04-21T08:06:30.685Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/ollama_api</loc>
    <lastmod>2026-04-21T08:06:30.689Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api</loc>
    <lastmod>2026-03-03T17:30:52.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_completions</loc>
    <lastmod>2026-04-21T08:06:30.688Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_embeddings</loc>
    <lastmod>2026-04-21T08:06:30.681Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/openai_api_vision</loc>
    <lastmod>2026-04-21T08:06:30.682Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/overview</loc>
    <lastmod>2026-04-01T04:21:05.807Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/popular_model_usage</loc>
    <lastmod>2026-04-21T07:17:40.729Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/qwen3</loc>
    <lastmod>2026-04-21T08:06:30.686Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/qwen3_5</loc>
    <lastmod>2026-04-21T08:06:30.680Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/qwen3_vl</loc>
    <lastmod>2026-04-21T08:06:30.718Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/sampling_params</loc>
    <lastmod>2026-04-21T08:06:30.717Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/basic_usage/send_request</loc>
    <lastmod>2026-04-21T08:06:30.723Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/bench_serving</loc>
    <lastmod>2026-04-21T08:06:30.722Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/benchmark_and_profiling</loc>
    <lastmod>2026-04-21T08:06:30.727Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/contribution_guide</loc>
    <lastmod>2026-04-21T08:06:30.719Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_guide_using_docker</loc>
    <lastmod>2026-04-21T08:06:30.716Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/development_jit_kernel_guide</loc>
    <lastmod>2026-04-21T08:06:30.729Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/evaluating_new_models</loc>
    <lastmod>2026-04-21T08:06:30.721Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/developer_guide/overview</loc>
    <lastmod>2026-04-21T07:17:44.367Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/install</loc>
    <lastmod>2026-04-21T08:13:05.299Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/get-started/quickstart</loc>
    <lastmod>2026-04-21T07:17:52.071Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/amd_gpu</loc>
    <lastmod>2026-04-21T08:06:30.771Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/apple_metal</loc>
    <lastmod>2026-04-21T08:06:30.769Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_contribution_guide</loc>
    <lastmod>2026-04-21T08:06:30.782Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu</loc>
    <lastmod>2026-04-21T08:06:30.780Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_best_practice</loc>
    <lastmod>2026-04-21T08:06:30.787Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_deepseek_example</loc>
    <lastmod>2026-04-21T08:06:30.770Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_environment_variables</loc>
    <lastmod>2026-04-21T08:06:30.822Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_glm5_examples</loc>
    <lastmod>2026-04-21T08:06:30.820Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quantization</loc>
    <lastmod>2026-04-21T08:06:30.824Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_quick_start</loc>
    <lastmod>2026-04-21T08:06:30.804Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_5_examples</loc>
    <lastmod>2026-04-21T08:06:30.821Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_qwen3_examples</loc>
    <lastmod>2026-04-21T08:06:30.819Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_ring_sp_performance</loc>
    <lastmod>2026-04-21T08:06:30.819Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_features</loc>
    <lastmod>2026-04-21T08:06:30.836Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/ascend_npu_support_models</loc>
    <lastmod>2026-04-21T08:06:30.824Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/ascend-npus/mindspore_backend</loc>
    <lastmod>2026-04-21T08:06:30.818Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/cpu_server</loc>
    <lastmod>2026-04-21T08:06:30.873Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/mthreads_gpu</loc>
    <lastmod>2026-04-21T08:06:30.877Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia-gpus</loc>
    <lastmod>2026-04-21T08:06:30.875Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/nvidia_jetson</loc>
    <lastmod>2026-04-21T07:18:19.052Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/overview</loc>
    <lastmod>2026-04-21T07:18:19.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/plugin</loc>
    <lastmod>2026-04-21T08:06:30.881Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/tpu</loc>
    <lastmod>2026-04-21T08:13:05.304Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/hardware-platforms/xpu</loc>
    <lastmod>2026-04-21T08:06:30.874Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/custom_chat_template</loc>
    <lastmod>2026-04-21T08:06:30.876Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/environment_variables</loc>
    <lastmod>2026-04-21T08:06:30.871Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/faq</loc>
    <lastmod>2026-04-21T08:06:30.929Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/choices_methods</loc>
    <lastmod>2026-04-21T08:06:30.925Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_index</loc>
    <lastmod>2026-04-21T08:06:30.926Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/frontend/frontend_tutorial</loc>
    <lastmod>2026-04-21T08:06:30.933Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/deploy_on_k8s</loc>
    <lastmod>2026-04-21T08:06:30.934Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/lws_pd/lws_pd_deploy</loc>
    <lastmod>2026-04-21T08:06:30.917Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node</loc>
    <lastmod>2026-04-21T08:06:30.927Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/multi_node_index</loc>
    <lastmod>2026-04-21T08:06:30.930Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/multi_node_deployment/rbg_pd/deepseekv32_pd</loc>
    <lastmod>2026-04-21T08:06:30.916Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/overview</loc>
    <lastmod>2026-04-01T04:21:05.821Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/post_training_integration</loc>
    <lastmod>2026-04-21T08:06:30.965Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_metrics</loc>
    <lastmod>2026-04-21T08:06:30.968Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/references/production_request_trace</loc>
    <lastmod>2026-04-21T08:06:30.966Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/cli</loc>
    <lastmod>2026-04-21T07:18:32.428Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/openai_api</loc>
    <lastmod>2026-04-21T07:18:32.425Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/api/post_processing</loc>
    <lastmod>2026-04-21T08:06:30.963Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/attention_backends</loc>
    <lastmod>2026-04-21T07:18:32.424Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/cache_dit</loc>
    <lastmod>2026-04-21T07:18:32.422Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/caching-acceleration</loc>
    <lastmod>2026-04-21T07:18:32.423Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ci_perf</loc>
    <lastmod>2026-04-21T07:18:40.380Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/compatibility_matrix</loc>
    <lastmod>2026-04-21T07:18:40.381Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/contributing</loc>
    <lastmod>2026-04-21T08:06:31.003Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/disaggregation</loc>
    <lastmod>2026-04-21T08:06:31.015Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/environment_variables</loc>
    <lastmod>2026-04-21T07:18:40.386Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion</loc>
    <lastmod>2026-04-21T07:18:40.397Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/installation</loc>
    <lastmod>2026-04-21T07:18:40.396Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/performance-optimization</loc>
    <lastmod>2026-04-21T07:18:40.389Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/profiling</loc>
    <lastmod>2026-03-27T19:16:51.341Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/quantization</loc>
    <lastmod>2026-04-21T08:06:31.000Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/ring_sp_performance</loc>
    <lastmod>2026-04-21T08:06:31.058Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/support_new_models</loc>
    <lastmod>2026-04-21T08:06:31.055Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/sglang-diffusion/teacache</loc>
    <lastmod>2026-04-21T07:18:48.653Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models</loc>
    <lastmod>2026-04-21T07:18:48.656Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/classify_models</loc>
    <lastmod>2026-04-21T08:06:31.052Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/diffusion_language_models</loc>
    <lastmod>2026-04-21T08:06:31.057Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/embedding_models</loc>
    <lastmod>2026-04-21T07:18:48.654Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/generative_models</loc>
    <lastmod>2026-04-21T08:06:31.051Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/mindspore_models</loc>
    <lastmod>2026-04-21T08:06:31.050Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/modelscope</loc>
    <lastmod>2026-04-21T08:06:31.054Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/multimodal_language_models</loc>
    <lastmod>2026-04-21T08:06:31.137Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/rerank_models</loc>
    <lastmod>2026-04-21T08:06:31.131Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/reward_models</loc>
    <lastmod>2026-04-21T08:06:31.135Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/support_new_models</loc>
    <lastmod>2026-04-21T07:18:58.462Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io/docs/supported-models/transformers_fallback</loc>
    <lastmod>2026-04-21T08:06:31.130Z</lastmod>
  </url>

  <url>
    <loc>https://docs.sglang.io</loc>
    <lastmod>2026-04-21T07:18:58.464Z</lastmod>
  </url>
</urlset>