<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
    <url>
         <loc>https://docs.vllm.ai/en/latest/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/benchmarking/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/benchmarking/cli/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/benchmarking/dashboard/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/benchmarking/sweeps/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/chat/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/complete/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/run-batch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/latency/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/mm_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/throughput/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/sweep/plot/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/sweep/plot_pareto/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/sweep/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/bench/sweep/serve_workload/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/cli/launch/render/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/community/contact_us/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/community/meetups/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/community/sponsors/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/configuration/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/configuration/conserving_memory/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/configuration/engine_args/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/configuration/env_vars/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/configuration/model_resolution/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/configuration/optimization/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/configuration/serve_args/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/deprecation_policy/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/editing-agent-instructions/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/incremental_build/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/profiling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/vulnerability_management/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/ci/failures/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/ci/nightly_builds/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/ci/update_pytorch_version/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/dockerfile/dockerfile/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/model/basic/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/model/multimodal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/model/registration/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/model/tests/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/contributing/model/transcription/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/docker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/k8s/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/nginx/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/anyscale/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/anything-llm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/autogen/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/bentoml/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/cerebrium/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/chatbox/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/dify/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/dstack/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/haystack/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/helm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/hf_inference_endpoints/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/litellm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/lobe-chat/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/lws/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/modal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/open-webui/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/retrieval_augmented_generation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/runpod/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/skypilot/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/streamlit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/frameworks/triton/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/aibrix/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/dynamo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/kaito/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/kserve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/kthena/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/kubeai/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/kuberay/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/llamastack/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/llm-d/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/llmaz/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/deployment/integrations/production-stack/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/arch_overview/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/attention_backends/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/cuda_graphs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/cuda_graphs_multimodal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/custom_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/dbo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/debug_vllm_compile/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/fused_moe_modular_kernel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/fusions/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/huggingface_integration/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/hybrid_kv_cache_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/io_processor_plugins/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/logits_processors/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/lora_resolver_plugins/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/mm_processing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/model_runner_v2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/moe_kernel_features/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/multiprocessing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/nixl_kv_cache_lease/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/optimization_levels/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/p2p_nccl_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/paged_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/plugin_system/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/prefix_caching/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/torch_compile/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/torch_compile_multimodal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/design/vllm_ir/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/applications/chatbot/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/applications/rag/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/basic/offline_inference/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/basic/online_serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/deployment/async_llm_streaming/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/deployment/chart-helm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/deployment/llm_engine_example/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/deployment/sagemaker-entrypoint/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/disaggregated_encoder/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/disaggregated_prefill/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/disaggregated_serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/ec_both_encoder/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/example_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/flexkv_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/kv_load_failure_recovery_offline/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/lmcache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/mooncake_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/disaggregated/p2p_nccl_xpyd/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/automatic_prefix_caching/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/batch_invariance/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/context_extension/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/data_parallel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/kv_events/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/logging_configuration/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/logits_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/lora/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/openai_batch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/pause_resume/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/profiling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/prompt_embed/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/reset_kv/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/sharded_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/speculative_decoding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/structured_outputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/tensorize_vllm_model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/features/torchrun/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/generate/batched_chat_completions_online/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/generate/multimodal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/generate/qwen_1m_offline/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/generate/token_generation_client/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/observability/dashboards/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/observability/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/observability/opentelemetry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/observability/prometheus_grafana/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/pooling/classify/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/pooling/embed/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/pooling/plugin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/pooling/reward/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/pooling/score/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/pooling/token_classify/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/pooling/token_embed/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/ray_serving/batch_llm_inference/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/ray_serving/elastic_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/ray_serving/multi-node-serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/ray_serving/ray_serve_deepseek/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/ray_serving/run_cluster/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/reasoning/openai_chat_completion_tool_calls_with_reasoning/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/reasoning/openai_chat_completion_with_reasoning/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/reasoning/openai_chat_completion_with_reasoning_streaming/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/reasoning/openai_responses_client/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_async_new_apis/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_http_ipc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_http_nccl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_ipc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_ipc_fsdp_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_nccl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_nccl_fsdp_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/rlhf_sparse_nccl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/routed_experts_e2e/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/rl/skip_loading_weights_in_engine_init/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/speech_to_text/lid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/speech_to_text/openai/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/speech_to_text/realtime/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/tool_calling/chat_with_tools_offline/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/tool_calling/openai_chat_completion_client_with_tools/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/tool_calling/openai_chat_completion_client_with_tools_required/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/tool_calling/openai_chat_completion_client_with_tools_xlam/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/tool_calling/openai_chat_completion_client_with_tools_xlam_streaming/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/tool_calling/openai_responses_client_with_mcp_tools/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/examples/tool_calling/openai_responses_client_with_tools/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/automatic_prefix_caching/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/batch_invariance/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/context_extension/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/custom_arguments/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/custom_logitsprocs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/disagg_encoder/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/disagg_prefill/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/index_cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/interleaved_thinking/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/lora/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/mooncake_connector_usage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/mooncake_store_connector_usage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/moriio_connector_usage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/multimodal_inputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/nixl_connector_compatibility/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/nixl_connector_usage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/prompt_embeds/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/reasoning_outputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/sleep_mode/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/structured_outputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/tool_calling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/auto_awq/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/bnb/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/fp8_vit_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/gguf/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/gptqmodel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/inc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/int4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/llm_compressor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/modelopt/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/online/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/quantized_kvcache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/quark/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/quantization/torchao/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/draft_model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/extract_hidden_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/mlp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/n_gram/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/parallel_draft_model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/speculators/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/features/speculative_decoding/suffix/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/getting_started/quickstart/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/getting_started/installation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/getting_started/installation/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/getting_started/installation/gpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/governance/collaboration/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/governance/committers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/governance/process/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/generative_models/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/supported_models/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/extensions/fastsafetensor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/extensions/instanttensor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/extensions/runai_model_streamer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/extensions/tensorizer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/hardware_supported_models/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/hardware_supported_models/xpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/classify/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/embed/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/reward/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/scoring/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/specific_models/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/token_classify/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/models/pooling_models/token_embed/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/context_parallel_deployment/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/data_parallel_deployment/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/distributed_troubleshooting/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/expert_parallel_deployment/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/offline_inference/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/parallelism_scaling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/integrations/claude_code/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/integrations/codex/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/integrations/langchain/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/integrations/llamaindex/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/online_serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/online_serving/generative_scoring/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/online_serving/openai_compatible_server/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/online_serving/renderer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/serving/online_serving/speech_to_text/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/async_rl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/layerwise/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/rlhf/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/trl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/weight_transfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/weight_transfer/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/weight_transfer/ipc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/training/weight_transfer/nccl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/faq/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/reproducibility/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/security/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/troubleshooting/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/usage_stats/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/usage/v1_guide/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/assets/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/assets/audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/assets/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/assets/image/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/assets/video/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/datasets/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/datasets/create_txt_slices_dataset/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/datasets/datasets/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/datasets/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/latency/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/lib/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/lib/endpoint_request_func/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/lib/ready_checker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/lib/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/mm_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/plot/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/startup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/cli/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/param_sweep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/plot/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/plot_pareto/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/serve_workload/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/server/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/startup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/sweep/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/benchmarks/throughput/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/collect_env/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/backends/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/base_static_graph/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/breakable_cudagraph/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/caching/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/codegen/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/compiler_interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/counter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/cuda_graph/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/decorators/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/monitor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/partition_rules/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/act_quant_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/allreduce_rms_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/attn_quant_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/collective_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/matcher_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/mla_attn_quant_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/mla_rope_kvcache_cat_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/qk_norm_rope_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/rms_quant_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/rocm_aiter_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/rope_kvcache_fusion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fusion/sequence_parallelism/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/fx_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/inductor_pass/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/ir/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/ir/clone_elimination/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/ir/inplace_functionalization/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/ir/lowering_pass/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/ir/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/pass_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/utility/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/utility/fix_functionalization/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/utility/noop_elimination/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/utility/post_cleanup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/utility/scatter_split_replace/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/utility/split_coalescing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/passes/vllm_inductor_pass/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/piecewise_backend/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/compilation/wrapper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/compilation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/device/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/ec_transfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/kernel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/kv_events/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/kv_transfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/load/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/lora/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/mamba/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/model_arch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/multimodal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/observability/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/offload/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/parallel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/pooler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/profiler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/quantization/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/reasoning/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/scheduler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/speculative/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/speech_to_text/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/structured_outputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/vllm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/config/weight_transfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/connections/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/cute_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/cute_utils/cvt/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/device_allocator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/device_allocator/cumem/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/communication_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/all2all/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/all_reduce_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/base_device_communicator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/cpu_communicator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/cuda_communicator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/cuda_wrapper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/custom_all_reduce/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/flashinfer_all_reduce/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/mnnvl_compat/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/pynccl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/pynccl_allocator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/pynccl_wrapper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/quick_all_reduce/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/ray_communicator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/shm_broadcast/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/shm_object_storage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/symm_mem/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/device_communicators/xpu_communicator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/ec_transfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/ec_transfer/ec_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/ec_transfer/ec_connector/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/ec_transfer/ec_connector/example_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/ec_transfer/ec_connector/factory/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/ec_transfer/ec_transfer_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/elastic_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/elastic_ep/elastic_execute/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/elastic_ep/elastic_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/elastic_ep/standby_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/async_worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/eplb_communicator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/eplb_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/eplb_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/policy/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/policy/abstract/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/policy/default/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/eplb/rebalance_execute/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_events/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/factory/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/decode_bench_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/example_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/example_hidden_states_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/flexkv_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/hf3fs_client/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/hf3fs_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/hf3fs_metadata_server/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/utils/common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/utils/gather_scatter_helper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/hf3fs/utils/hf3fs_mock_client/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/multi_process_adapter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/vllm_v1_adapter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_mp_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/rdma_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/stats/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/coordinator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/data/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/scheduler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/store/worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/moriio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/moriio/moriio_common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/moriio/moriio_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/moriio/moriio_engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/multi_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/metadata/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/scheduler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/stats/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/tp_mapping/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/nixl/worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/offloading/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/offloading/common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/offloading/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/offloading/scheduler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/offloading/worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/offloading_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/p2p/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/p2p/p2p_nccl_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/p2p/p2p_nccl_engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/p2p/tensor_memory_pool/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/simple_cpu_offload_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_connector/v1/ssm_conv_transfer_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/kv_transfer/kv_transfer_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/nixl_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/parallel_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/stateless_coordinator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/weight_transfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/weight_transfer/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/weight_transfer/factory/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/weight_transfer/ipc_engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/weight_transfer/nccl_engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/distributed/weight_transfer/packed_tensor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/engine/arg_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/engine/async_llm_engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/engine/llm_engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/engine/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/anthropic/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/anthropic/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/anthropic/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/anthropic/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/api_server/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/chat_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/latency/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/main/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/mm_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/startup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/sweep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/benchmark/throughput/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/collect_env/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/launch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/main/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/openai/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/run_batch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/cli/types/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/constants/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/beam_search/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/beam_search/offline/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/beam_search/online/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/beam_search/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/factories/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/generative_scoring/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/generative_scoring/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/generate/generative_scoring/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/grpc_server/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/launcher/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/llm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/logger/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/mcp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/mcp/tool/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/mcp/tool_server/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/offline_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/api_server/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/chat_completion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/chat_completion/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/chat_completion/batch_serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/chat_completion/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/chat_completion/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/chat_completion/stream_harmony/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/cli_args/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/completion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/completion/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/completion/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/completion/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/dp_supervisor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/engine/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/engine/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/fingerprint/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/models/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/models/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/models/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/models/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/orca_metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/parser/harmony_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/parser/responses_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/context/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/harmony/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/streaming_events/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/responses/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/run_batch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/server_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/openai/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/base/io_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/base/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/base/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/classify/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/classify/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/classify/io_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/classify/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/classify/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/embed/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/embed/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/embed/io_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/embed/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/embed/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/factories/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/offline/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/pooling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/pooling/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/pooling/io_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/pooling/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/pooling/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/scoring/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/scoring/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/scoring/io_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/scoring/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/scoring/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/scoring/typing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/scoring/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/typing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/pooling/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/sagemaker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/sagemaker/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/cache/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/rlhf/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/rlhf/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/rpc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/rpc/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/server_info/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/server_info/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/sleep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/dev/sleep/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/disagg/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/disagg/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/disagg/mm_serde/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/disagg/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/disagg/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/elastic_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/elastic_ep/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/elastic_ep/middleware/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/instrumentator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/instrumentator/basic/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/instrumentator/health/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/instrumentator/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/instrumentator/offline_docs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/lora/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/lora/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/lora/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/profile/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/profile/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/render/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/render/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/render/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/tokenize/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/tokenize/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/tokenize/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/serve/tokenize/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/base/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/base/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/factories/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/realtime/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/realtime/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/realtime/connection/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/realtime/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/realtime/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/realtime/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/transcription/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/transcription/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/transcription/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/transcription/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/translation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/translation/api_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/translation/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/speech_to_text/translation/serving/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/ssl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/entrypoints/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/env_override/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/envs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/exceptions/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/forward_context/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/inputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/inputs/engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/inputs/llm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/inputs/preprocess/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ir/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ir/op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ir/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ir/ops/layernorm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ir/tolerances/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ir/util/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/aiter_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/helion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/helion/case_key/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/helion/config_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/helion/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/helion/ops/silu_mul_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/helion/register/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/helion/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/oink_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/triton/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/triton/qkv_padded_fp8_quant/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/vllm_c/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/kernels/xpu_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logger/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logging_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logging_utils/access_log_filter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logging_utils/dump_input/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logging_utils/formatter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logging_utils/lazy/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logging_utils/log_time/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logging_utils/torch_tensor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logits_process/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/logprobs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/base_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/column_parallel_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/fused_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/logits_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/replicated_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/row_parallel_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/layers/vocal_parallel_embedding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/lora_model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/lora_weights/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/model_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/torch_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/torch_ops/lora_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/fp8_kernel_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/fused_moe_lora_fp8_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/fused_moe_lora_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/kernel_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/lora_expand_fp8_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/lora_expand_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/lora_kernel_metadata/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/lora_shrink_fp8_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/lora_shrink_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/triton_ops/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/xpu_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/ops/xpu_ops/lora_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/peft_helper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/punica_wrapper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/punica_wrapper/punica_base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/punica_wrapper/punica_cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/punica_wrapper/punica_gpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/punica_wrapper/punica_selector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/punica_wrapper/punica_xpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/punica_wrapper/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/request/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/resolver/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/lora/worker_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/custom_op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/MPLinearKernel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/allspark/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/conch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/cutlass/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/dynamic_4bit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/exllama/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/machete/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/marlin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/rdna3_w4a16/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/triton_w4a16/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/xpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mixed_precision/zentorch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp4/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp4/flashinfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp4/marlin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp4/xpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp8/Mxfp8LinearKernel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp8/emulation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp8/flashinfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp8/marlin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/mxfp8/xpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/nvfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/nvfp4/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/nvfp4/cutlass/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/nvfp4/emulation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/nvfp4/fbgemm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/nvfp4/flashinfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/nvfp4/marlin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/BlockScaledMMLinearKernel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/ScaledMMLinearKernel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/aiter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/cutlass/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/deep_gemm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/flashinfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/marlin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/pytorch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/rocm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/triton/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/xpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/scaled_mm/zentorch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/linear/zentorch_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/mhc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/mhc/aiter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/mhc/tilelang/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/mhc/tilelang_kernels/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/mhc/torch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/kernels/mhc/triton/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/activation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/chunked_local_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/cross_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/encoder_only_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/kv_transfer_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/mla_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/mm_encoder_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention/static_sink_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/attention_layer_base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/batch_invariant/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/conv/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/chunk/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/chunk_delta_h/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/chunk_o/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/chunk_scaled_dot_kkt/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/cumsum/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/fused_gdn_prefill_post_conv/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/fused_recurrent/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/fused_sigmoid_gating/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/index_py/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/kda/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/l2norm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/layernorm_guard/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/op/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/solve_tril/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fla/ops/wy_fast/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/activation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/all2all_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/config/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/cpu_fused_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/deep_gemm_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/eep_reconfigure/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/expert_map_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/aiter_mxfp4_w4a8_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/batched_deep_gemm_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/cpu_int4_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/cpu_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/cutlass_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/deep_gemm_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/fallback/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/flashinfer_b12x_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/flashinfer_cutedsl_batched_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/flashinfer_cutedsl_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/flashinfer_cutlass_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/fused_batched_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/fused_humming_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/gpt_oss_triton_kernels_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/lora_context/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/lora_experts_mixin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/marlin_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/nvfp4_emulation_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/ocp_mx_emulation_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/rocm_aiter_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/triton_cutlass_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/triton_deep_gemm_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/triton_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/trtllm_bf16_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/trtllm_fp8_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/trtllm_mxfp4_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/trtllm_mxint4_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/trtllm_nvfp4_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/experts/xpu_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/fused_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/fused_moe_method_base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/fused_moe_modular_method/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/layer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/modular_kernel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/moe_align_block_size/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/moe_fused_mul_sum/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/moe_permute_unpermute/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/int_wna16/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/mxfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/mxfp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/nvfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/unquantized/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/w4a8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/oracle/w4a8_int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/batched/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/deepep_ht/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/deepep_ll/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/flashinfer_nvlink_one_sided/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/flashinfer_nvlink_two_sided/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/mori/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/naive_dp_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/nixl_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/prepare_finalize/no_dp_ep/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/routed_experts_capturer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/aiter_shared_routed_fused_moe_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/base_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/custom_routing_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/fused_moe_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/fused_topk_bias_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/fused_topk_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/gate_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/grouped_topk_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/router_factory/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/routing_simulator_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/router/zero_expert_router/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/runner/moe_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/runner/moe_runner_interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/runner/shared_experts/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/topk_weight_and_reduce/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/unquantized_fused_moe_method/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/fused_moe/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/layernorm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/lightning_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/logits_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/abstract/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/gdn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/gdn/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/gdn/kimi_gdn_linear_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/gdn/olmo_gdn_linear_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/gdn/qwen_gdn_linear_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/linear_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/mamba_mixer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/mamba_mixer2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/mamba_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/causal_conv1d/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/cpu/causal_conv1d/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/cpu/gdn_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/gdn_chunk_cutedsl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/gdn_chunk_cutedsl/kernel_h/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/gdn_chunk_cutedsl/kernel_kkt_inv_uw/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/gdn_chunk_cutedsl/kernel_o/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/layernorm_gated/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/mamba_ssm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/ssd_bmm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/ssd_chunk_scan/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/ssd_chunk_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/ssd_combined/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/ssd_state_passing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/ssu_dispatch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/ops/triton_helpers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mamba/short_conv/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mhc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/minimax_rms_norm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/minimax_rms_norm/lamport_workspace/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/minimax_rms_norm/rms_norm_tp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/abstract/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/activations/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/seqwise/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/seqwise/heads/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/seqwise/methods/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/seqwise/poolers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/special/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/tokwise/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/tokwise/heads/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/tokwise/methods/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/pooler/tokwise/poolers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/auto_gptq/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/awq/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/awq_marlin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/awq_triton/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/base_config/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/bitsandbytes/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_w4a4_mxfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_w4a4_nvfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_w4a8_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_w4a8_int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_w8a8_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_w8a8_int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_w8a8_mxfp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_wna16/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe/compressed_tensors_moe_wna16_marlin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_scheme/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a16_nvfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a4_mxfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a4_nvfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a8_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a8_int/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_mxfp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/transform/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/transform/linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/transform/module/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/transform/schemes/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/transform/schemes/linear_qutlass_nvfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/transform/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/triton_scaled_mm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/compressed_tensors/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/experts_int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/fbgemm_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/fp_quant/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/gguf/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/humming/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/inc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/input_quant_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/kv_cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/modelopt/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/moe_wna16/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/mxfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/online/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/online/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/online/fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/online/int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/online/moe_base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/online/mxfp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/quark/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/quark_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/schemes/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/schemes/quark_nvfp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/schemes/quark_ocp_mx/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/schemes/quark_scheme/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/schemes/quark_w4a8_mxfp4_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/schemes/quark_w8a8_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/schemes/quark_w8a8_int8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/quark/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/qutlass_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/torchao/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/turboquant/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/turboquant/centroids/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/turboquant/config/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/allspark_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/flashinfer_fp4_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/flashinfer_mxint4_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/flashinfer_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/fp8_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/gptq_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/humming_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/int8_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/layer_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/machete_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/marlin_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/marlin_utils_fp4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/marlin_utils_fp8/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/marlin_utils_test/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/mxfp4_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/mxfp6_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/mxfp8_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/nvfp4_emulation_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/nvfp4_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/ocp_mx_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/quant_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/quantization/utils/w8a8_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/resampler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/deepseek_scaling_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/dual_chunk_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/dynamic_ntk_alpha_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/dynamic_ntk_scaling_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/ernie45_vl_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/fope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/gemma4_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/linear_scaling_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/llama3_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/llama4_vision_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/mrope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/mrope_interleaved/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/ntk_scaling_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/phi3_long_rope_scaled_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/telechat3_scaling_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/xdrope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/rotary_embedding/yarn_scaling_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/sparse_attn_indexer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/layers/vocab_parallel_embedding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/base_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/bitsandbytes_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/default_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/dummy_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/ep_weight_filter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/gguf_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/modelexpress_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/reload/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/reload/layerwise/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/reload/meta/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/reload/sanitize/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/reload/torchao_decorator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/reload/types/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/reload/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/runai_streamer_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/sharded_state_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/tensorizer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/tensorizer_loader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/model_loader/weight_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/AXK1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/adapters/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/afmoe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/aimv2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/apertus/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/arcee/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/arctic/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/aria/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/audioflamingo3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/aya_vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bagel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/baichuan/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bailing_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bailing_moe_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bamba/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bee/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bert/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bert_with_rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/blip/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/blip2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/bloom/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/chameleon/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/chatglm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/cheers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/clip/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/cohere2_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/cohere2_vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/cohere_asr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/cohere_eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/colbert/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/colmodernvbert/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/colpali/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/colqwen3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/colqwen3_5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/commandr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/config/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/conformer_encoder/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/cosmos3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/dbrx/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepencoder/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepencoder2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepseek_eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepseek_eagle3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepseek_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepseek_ocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepseek_ocr2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepseek_v2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/deepseek_vl2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/dots1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/dots_ocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/eagle2_5_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ernie/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ernie45/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ernie45_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ernie45_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ernie45_vl_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ernie_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/exaone/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/exaone4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/exaone4_5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/exaone4_5_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/exaone_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/exaone_moe_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/extract_hidden_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/fairseq2_llama/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/falcon/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/falcon_h1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/fireredasr2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/fireredlid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/flex_olmo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/funasr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/funaudiochat/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/fuyu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma3_mm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma3n/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma3n_audio_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma3n_mm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma4_mm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma4_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gemma4_unified/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm4_1v/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm4_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm4_moe_lite/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm4_moe_lite_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm4_moe_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm4v/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm_ocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glm_ocr_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glmasr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/glmasr_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gpt2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gpt_bigcode/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gpt_j/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gpt_neox/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gpt_oss/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/granite/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/granite4_vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/granite_speech/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/granitemoe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/granitemoehybrid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/granitemoeshared/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/gritlm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/grok1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/h2ovl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/hunyuan_v1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/hunyuan_vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/hy_v3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/hy_v3_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/hyperclovax/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/hyperclovax_vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/hyperclovax_vision_v2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/idefics2_vision_model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/idefics3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/interfaces/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/interfaces_base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/intern_vit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/internlm2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/internlm2_ve/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/interns1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/interns1_pro/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/interns1_vit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/interns2_preview/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/internvl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/iquest_loopcoder/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/isaac/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/jais2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/jamba/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/jina/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/jina_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/kanana_v/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/keye/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/keye_vl1_5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/kimi_audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/kimi_k25/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/kimi_k25_vit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/kimi_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/kimi_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/laguna/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/lfm2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/lfm2_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/lfm2_siglip2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/lfm2_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/lightonocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llama/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llama4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llama4_eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llama_eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llama_eagle3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llava/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llava_next/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llava_next_video/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/llava_onevision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/longcat_flash/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/longcat_flash_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mamba/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mamba2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/medusa/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mellum/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/midashenglm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mimo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mimo_audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mimo_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mimo_v2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mimo_v2_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mimo_v2_omni/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minicpm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minicpm3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minicpm_eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minicpmo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minicpmv/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minicpmv4_6/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minimax_m2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minimax_text_01/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/minimax_vl_01/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mistral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mistral3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mistral_eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mistral_large_3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mistral_large_3_eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mixtral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mllama4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mlp_speculator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/modernbert/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/module_mapping/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/molmo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/molmo2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/moondream3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/moonvit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/mpt/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/musicflamingo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nano_nemotron_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nemotron/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nemotron_h/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nemotron_h_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nemotron_nas/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nemotron_parse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nemotron_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/nvlm_d/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/olmo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/olmo2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/olmo_hybrid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/olmoe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/opencua/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/openpangu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/openpangu_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/openpangu_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/openvla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/opt/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/orion/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ouro/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ovis/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ovis2_5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/paddleocr_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/paligemma/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/parakeet/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/param2moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/persimmon/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phi/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phi3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phi3v/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phi4mm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phi4mm_audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phi4mm_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phi4siglip/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/phimoe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/pixtral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/plamo2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/plamo3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qianfan_ocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen2_5_omni_thinker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen2_5_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen2_audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen2_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen2_rm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen2_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_5_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_asr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_asr_forced_aligner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_asr_realtime/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_dflash/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_next/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_next_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_omni_moe_thinker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen3_vl_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/qwen_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/radio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/rnj1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/roberta/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/rvl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/sarvam/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/seed_oss/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/siglip/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/siglip2navit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/skyworkr1v/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/smolvlm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/solar/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/stablelm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/starcoder2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/step1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/step3_text/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/step3_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/step3p5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/step3p5_mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/step3p7/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/step_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/tarsier/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/telechat2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/teleflm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/terratorch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/causal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/legacy/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/multimodal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/pooling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/transformers/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/ultravox/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/voxtral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/voxtral_realtime/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/voyage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/whisper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/whisper_causal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/whisper_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/models/zamba2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/offloader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/offloader/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/offloader/prefetch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/offloader/prefetch_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/offloader/uva/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/parameter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/warmup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/warmup/deep_gemm_warmup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_executor/warmup/kernel_warmup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/model_inspection/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/amd/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/amd/model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/amd/mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/amd/rocm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/cache_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/fused_compress_quant_cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/fused_indexer_q/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/fused_inv_rope_fp8_quant/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/fused_mtp_input_rmsnorm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/fused_qk_rmsnorm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/ops/save_partial_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/common/rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/compressor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/flashmla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/mtp/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/ops/dequant_gather_k_cutedsl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/ops/fused_indexer_q_cutedsl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/ops/prepare_megamoe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/nvidia/ops/sparse_attn_compress_cutedsl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/models/deepseek_v4/quant_config/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/encoder_budget/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/evs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/hasher/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/image/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/inputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/media/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/media/audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/media/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/media/connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/media/image/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/media/video/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/parse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/processing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/processing/context/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/processing/dummy_inputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/processing/inputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/processing/processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/multimodal/video/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/outputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/parser/abstract_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/parser/parser_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/cuda/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/rocm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/tpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/xpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/platforms/zen_cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/plugins/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/plugins/io_processors/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/plugins/io_processors/interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/plugins/lora_resolvers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/plugins/lora_resolvers/filesystem_resolver/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/plugins/lora_resolvers/hf_hub_resolver/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/pooling_params/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/profiler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/profiler/layerwise_profile/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/profiler/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/profiler/wrapper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ray/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ray/lazy_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/ray/ray_env/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/abs_reasoning_parsers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/basic_parsers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/cohere_command_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/deepseek_r1_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/deepseek_v3_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/ernie45_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/gemma4_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/gemma4_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/gptoss_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/granite_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/hunyuan_a13b_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/hy_v3_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/identity_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/kimi_k2_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/minimax_m2_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/mistral_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/nemotron_v3_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/olmo3_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/poolside_v1_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/qwen3_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/seedoss_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/step3_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/reasoning/step3p5_reasoning_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/deepseek_v32/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/deepseek_v4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/embed_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/grok2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/hf/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/inputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/inputs/preprocess/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/inputs/tokenize/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/mistral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/params/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/renderers/terratorch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/sampling_params/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/scalar_type/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/scripts/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/sequence/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tasks/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/deepseek_v32/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/deepseek_v32_encoding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/deepseek_v4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/deepseek_v4_encoding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/detokenizer_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/fastokens/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/grok2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/hf/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/kimi_audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/mistral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/protocol/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/qwen_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tokenizers/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/abstract_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/apertus_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/cohere_command_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/deepseekv31_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/deepseekv32_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/deepseekv3_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/deepseekv4_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/ernie45_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/functiongemma_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/gemma4_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/gemma4_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/gigachat3_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/glm47_moe_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/glm4_moe_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/granite4_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/granite_20b_fc_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/granite_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/hermes_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/hunyuan_a13b_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/hy_v3_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/internlm2_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/jamba_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/kimi_k2_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/lfm2_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/llama4_pythonic_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/llama_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/longcat_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/minicpm5xml_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/minimax_m2_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/minimax_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/mistral_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/olmo3_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/openai_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/phi4mini_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/poolside_v1_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/pythonic_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/qwen3coder_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/qwen3xml_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/seed_oss_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/step3_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/step3p5_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/streaming/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/structural_tag_registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tool_parsers/xlam_tool_parser/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tracing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tracing/otel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/tracing/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/chat_templates/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/chat_templates/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/config/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/config_parser_base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/AXK1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/afmoe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/arctic/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/bagel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/chatglm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/cheers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/colmodernvbert/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/colpali/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/colqwen3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/cosmos3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/deepseek_v4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/deepseek_vl2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/dotsocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/extract_hidden_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/falcon/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/fireredlid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/flex_olmo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/funaudiochat/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/granite4_vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/hunyuan_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/hy_v3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/hyperclovax/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/isaac/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/kimi_k25/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/kimi_linear/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/kimi_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/laguna/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/lfm2_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/medusa/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/mellum/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/midashenglm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/mimo_v2_omni/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/mistral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/mlp_speculator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/moondream3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/moonvit/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/nemotron/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/nemotron_h/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/olmo_hybrid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/openvla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/ovis/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/parakeet/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/qianfan_ocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/qwen3_5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/qwen3_5_moe/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/qwen3_asr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/qwen3_next/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/radio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/speculators/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/speculators/algos/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/speculators/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/step3_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/step3p5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/tarsier2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/configs/ultravox/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/dynamic_module/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/gguf_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/model_arch_config_convertor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/bagel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/cheers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/cohere_asr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/deepseek_ocr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/deepseek_vl2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/fireredasr2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/fireredlid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/funasr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/glm4v/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/granite4_vision/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/h2ovl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/hunyuan_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/hunyuan_vl_image/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/internvl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/isaac/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/kimi_audio/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/kimi_k25/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/mimo_v2_omni/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/minicpmo/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/minicpmv/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/moondream3/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/nano_nemotron_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/nemotron_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/nvlm_d/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/openvla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/ovis/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/ovis2_5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/pixtral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/qwen3_asr/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/qwen_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/step3_vl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/processors/voxtral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/repo_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/runai_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/s3_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/transformers_utils/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/triton_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/triton_utils/allocation/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/triton_utils/importing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/triton_utils/jit_monitor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/usage/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/usage/usage_lib/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/argparse_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/async_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/collection_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/counter/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/cpu_resource_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/cpu_triton_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/deep_gemm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/flashinfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/func_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/gc_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/hashing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/import_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/jsontree/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/math_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/mem_constants/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/mem_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/mistral/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/multi_stream_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/nccl/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/network_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/numa_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/nvtx_pytorch_hooks/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/ompmultiprocessing/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/platform_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/print_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/serial_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/system_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/tensor_schema/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/torch_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/utils/tqdm_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backend/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/cpu_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/fa_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/flash_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/flash_attn_diffkv/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/flashinfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/flex_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/gdn_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/linear_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mamba1_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mamba2_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mamba_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/aiter_triton_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/compressor_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/cutlass_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/flashattn_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/flashinfer_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/flashinfer_mla_sparse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/flashmla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/flashmla_sparse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/indexer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/flash_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/flashinfer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/selector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/tokenspeed_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/prefill/trtllm_ragged/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/rocm_aiter_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/rocm_aiter_mla_sparse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/sparse_swa/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/sparse_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/tokenspeed_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/triton_mla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/mla/xpu_mla_sparse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/rocm_aiter_fa/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/rocm_aiter_unified_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/rocm_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/short_conv_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/triton_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/turboquant_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/backends/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/chunked_prefill_paged_decode/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/dcp_alltoall/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/flashmla/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/merge_attn_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/paged_attn/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/prefix_prefill/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/rocm_aiter_mla_sparse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_attention_helpers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_decode_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_merge_attn_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_prefill_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_reshape_and_cache_flash/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_turboquant_decode/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_turboquant_store/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/triton_unified_attention/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/vit_attn_wrappers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/ops/xpu_mla_sparse/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/attention/selector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/block_pool/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/encoder_cache_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/kv_cache_coordinator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/kv_cache_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/kv_cache_metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/kv_cache_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/sched/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/sched/async_scheduler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/sched/interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/sched/output/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/sched/request_queue/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/sched/scheduler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/sched/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/core/single_type_kv_cache_manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/cudagraph_dispatcher/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/async_llm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/coordinator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/core/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/core_client/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/detokenizer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/exceptions/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/input_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/llm_engine/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/logprobs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/output_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/parallel_sampling/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/tensor_ipc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/engine/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/abstract/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/multiproc_executor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/ray_env_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/ray_executor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/ray_executor_v2/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/ray_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/uniproc_executor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/executor/vllm_net_devices/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_cache_interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_cache_spec_registry/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/common/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/gpu_worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/policies/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/policies/arc/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/policies/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/policies/lru/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/shared_offload_region/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/spec/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/cpu/swap_blocks_triton/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/factory/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/file_mapper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/example/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/example/manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/factory/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/fs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/fs/io/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/fs/manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/fs/thread_pool/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/tiering/spec/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/kv_offload/worker/worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/loggers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/perf/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/prometheus/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/ray_wrappers/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/reader/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/stats/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/metrics/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/outputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/pool/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/pool/late_interaction/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/pool/metadata/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/request/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/logits_processor/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/logits_processor/builtin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/logits_processor/interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/logits_processor/state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/metadata/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/ops/bad_words/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/ops/logprobs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/ops/penalties/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/ops/topk_topp_sampler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/ops/topk_topp_triton/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/rejection_sampler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/sampler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/sample/thinking_budget_state/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/serial_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/simple_kv_offload/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/simple_kv_offload/copy_backend/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/simple_kv_offload/cuda_mem_ops/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/simple_kv_offload/manager/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/simple_kv_offload/metadata/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/simple_kv_offload/worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/custom_class_proposer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/dflash/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/draft_model/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/extract_hidden_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/gemma4/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/llm_base_proposer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/medusa/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/metadata/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/ngram_proposer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/ngram_proposer_gpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/step3p5/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/suffix_decoding/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/spec_decode/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/backend_guidance/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/backend_lm_format_enforcer/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/backend_outlines/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/backend_types/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/backend_xgrammar/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/request/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/structured_output/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/block_table/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/cp_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/cpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/cpu/buffer_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/cpu/model_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/cpu/shm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/cpu_model_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/cpu_worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/dp_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/ec_connector_model_runner_mixin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/encoder_cudagraph/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/encoder_cudagraph_defs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/async_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/attn_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/block_table/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/buffer_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/cp_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/cudagraph_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/dp_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/eplb_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/input_batch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/kv_connector/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/lora_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/metrics/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/metrics/logits/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/mm/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/mm/encoder_cache/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/mm/encoder_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/mm/rope/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/model_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/model_states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/model_states/default/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/model_states/interface/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/model_states/mamba_hybrid/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/model_states/whisper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/pool/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/pool/late_interaction_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/pool/pooling_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/pp_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/bad_words/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/gumbel/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/logit_bias/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/logprob/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/min_p/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/output/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/penalties/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/prompt_logprob/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/sampler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/sample/states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/shutdown/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/eagle/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/eagle/cudagraph/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/eagle/eagle3_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/eagle/speculator/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/eagle/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/rejection_sampler/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/rejection_sampler_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/spec_decode/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/states/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/structured_outputs/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu/warmup/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu_input_batch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu_model_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu_ubatch_wrapper/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/gpu_worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/kv_connector_model_runner_mixin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/lora_model_runner_mixin/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/mamba_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/tpu_input_batch/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/ubatch_utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/ubatching/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/utils/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/worker_base/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/workspace/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/xpu_model_runner/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/v1/worker/xpu_worker/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
    <url>
         <loc>https://docs.vllm.ai/en/latest/api/vllm/version/</loc>
         <lastmod>2026-06-03</lastmod>
    </url>
</urlset>