Index A | B | C | D | E | F | G | H | I | K | L | M | N | O | P | R | S | T | U | V | W A abort() (vllm.AsyncLLMEngine method) abort_request() (vllm.LLMEngine method) add_lora() (vllm.AsyncLLMEngine method) add_request() (vllm.LLMEngine method) additional_data (vllm.PoolingParams attribute) apply() (vllm.multimodal.processing.BaseMultiModalProcessor method) (vllm.multimodal.processing.EncDecMultiModalProcessor method) apply_model() (vllm.LLM method) apply_text_matches() (in module vllm.multimodal.processing) apply_token_matches() (in module vllm.multimodal.processing) as_classification_model() (in module vllm.model_executor.models.adapters) as_embedding_model() (in module vllm.model_executor.models.adapters) as_reward_model() (in module vllm.model_executor.models.adapters) AsyncLLMEngine (class in vllm) AudioEmbeddingItems (class in vllm.multimodal.parse) AudioProcessorItems (class in vllm.multimodal.parse) B BaseDummyInputsBuilder (class in vllm.multimodal.profiling) BaseMultiModalProcessor (class in vllm.multimodal.processing) BaseProcessingInfo (class in vllm.multimodal.processing) batch() (vllm.multimodal.inputs.MultiModalKwargs static method) batched() (vllm.multimodal.inputs.MultiModalFieldConfig static method) beam_search() (vllm.LLM method) BoundPromptUpdate (class in vllm.multimodal.processing) C chat() (vllm.LLM method) check_health() (vllm.AsyncLLMEngine method) classify() (vllm.LLM method) clone() (vllm.PoolingParams method) (vllm.SamplingParams method) collective_rpc() (vllm.LLM method) compute_logits() (vllm.model_executor.models.interfaces_base.VllmModelForTextGeneration method) content (vllm.multimodal.processing.BoundPromptUpdate property) (vllm.multimodal.processing.PromptInsertion property) (vllm.multimodal.processing.PromptReplacement property) (vllm.multimodal.processing.PromptUpdate property) create_decoder_prompt() (vllm.multimodal.processing.EncDecMultiModalProcessor method) create_encoder_prompt() (vllm.multimodal.processing.EncDecMultiModalProcessor method) create_input_mapper() (vllm.multimodal.registry.MultiModalRegistry method) create_processor() (vllm.multimodal.registry.MultiModalRegistry method) D data (vllm.multimodal.inputs.MultiModalFieldElem attribute) DEPRECATE_INIT_POSARGS (vllm.LLM attribute) DEPRECATE_LEGACY (vllm.LLM attribute) DictEmbeddingItems (class in vllm.multimodal.parse) do_log_stats() (vllm.LLMEngine method) DO_VALIDATE_OUTPUT (vllm.LLMEngine attribute) DummyDecoderData (class in vllm.multimodal.profiling) DummyEncoderData (class in vllm.multimodal.profiling) DummyInputsBuilderFactory (class in vllm.multimodal.registry) E embed() (vllm.LLM method) EmbeddingItems (class in vllm.multimodal.parse) EncDecMultiModalProcessor (class in vllm.multimodal.processing) encode() (vllm.AsyncLLMEngine method) (vllm.LLM method) engine_step() (vllm.AsyncLLMEngine method) F features (vllm.multimodal.processing.PromptUpdateDetails attribute) field (vllm.multimodal.inputs.MultiModalFieldElem attribute) find_text_matches() (in module vllm.multimodal.processing) find_token_matches() (in module vllm.multimodal.processing) flat() (vllm.multimodal.inputs.MultiModalFieldConfig static method) flat_from_sizes() (vllm.multimodal.inputs.MultiModalFieldConfig static method) forward() (vllm.model_executor.models.interfaces.SupportsPP method) from_engine_args() (vllm.AsyncLLMEngine class method) (vllm.LLMEngine class method) from_items() (vllm.multimodal.inputs.MultiModalKwargs static method) from_vllm_config() (vllm.AsyncLLMEngine class method) full (vllm.multimodal.processing.PromptUpdateDetails attribute) full_groupby_modality() (in module vllm.multimodal.processing) G generate() (vllm.AsyncLLMEngine method) (vllm.LLM method) get() (vllm.multimodal.parse.DictEmbeddingItems method) (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_all() (vllm.multimodal.parse.ModalityDataItems method) get_all_counts() (vllm.multimodal.parse.MultiModalDataItems method) get_content() (vllm.multimodal.processing.BoundPromptUpdate method) get_count() (vllm.multimodal.parse.DictEmbeddingItems method) (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.MultiModalDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_decoder_dummy_data() (vllm.multimodal.registry.MultiModalRegistry method) get_decoding_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_dummy_processor_inputs() (vllm.multimodal.profiling.BaseDummyInputsBuilder method) get_encoder_dummy_data() (vllm.multimodal.registry.MultiModalRegistry method) get_hf_processor() (vllm.multimodal.processing.BaseProcessingInfo method) get_input_embeddings() (vllm.model_executor.models.interfaces.SupportsMultiModal method) get_input_preprocessor() (vllm.AsyncLLMEngine method) get_item() (vllm.multimodal.inputs.MultiModalKwargs method) get_item_count() (vllm.multimodal.inputs.MultiModalKwargs method) get_items() (vllm.multimodal.inputs.MultiModalKwargs method) (vllm.multimodal.parse.MultiModalDataItems method) get_lora_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_max_multimodal_tokens() (vllm.multimodal.registry.MultiModalRegistry method) get_max_tokens_by_modality() (vllm.multimodal.registry.MultiModalRegistry method) get_max_tokens_per_item_by_modality() (vllm.multimodal.registry.MultiModalRegistry method) get_max_tokens_per_item_by_nonzero_modality() (vllm.multimodal.registry.MultiModalRegistry method) get_mm_limits_per_prompt() (vllm.multimodal.registry.MultiModalRegistry method) get_mm_max_tokens_per_item() (vllm.multimodal.processing.BaseProcessingInfo method) get_model_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_multimodal_embeddings() (vllm.model_executor.models.interfaces.SupportsMultiModal method) get_num_unfinished_requests() (vllm.LLMEngine method) get_parallel_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_passthrough_data() (vllm.multimodal.parse.DictEmbeddingItems method) (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_processor_data() (vllm.multimodal.parse.DictEmbeddingItems method) (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_scheduler_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_supported_mm_limits() (vllm.multimodal.processing.BaseProcessingInfo method) get_tokenizer() (vllm.AsyncLLMEngine method) H has_inner_state (vllm.model_executor.models.interfaces.HasInnerState attribute) has_processor() (vllm.multimodal.registry.MultiModalRegistry method) has_unfinished_requests() (vllm.LLMEngine method) has_unfinished_requests_for_virtual_engine() (vllm.LLMEngine method) HasInnerState (class in vllm.model_executor.models.interfaces) HasNoOps (class in vllm.model_executor.models.interfaces) height (vllm.multimodal.parse.ImageSize attribute) I ImageEmbeddingItems (class in vllm.multimodal.parse) ImageProcessorItems (class in vllm.multimodal.parse) ImageSize (class in vllm.multimodal.parse) init_mm_limits_per_prompt() (vllm.multimodal.registry.MultiModalRegistry method) insertion (vllm.multimodal.processing.PromptInsertion attribute) is_attention_free (vllm.model_executor.models.interfaces.IsAttentionFree attribute) is_hybrid (vllm.model_executor.models.interfaces.IsHybrid attribute) is_sleeping() (vllm.AsyncLLMEngine method) IsAttentionFree (class in vllm.model_executor.models.interfaces) IsHybrid (class in vllm.model_executor.models.interfaces) iter_token_matches() (in module vllm.multimodal.processing) K key (vllm.multimodal.inputs.MultiModalFieldElem attribute) L length (vllm.multimodal.inputs.PlaceholderRange attribute) LLM (class in vllm) LLMEngine (class in vllm) M make_empty_intermediate_tensors() (vllm.model_executor.models.interfaces.SupportsPP method) map_input() (vllm.multimodal.registry.MultiModalRegistry method) mm_hashes (vllm.multimodal.inputs.MultiModalInputs attribute) mm_kwargs (vllm.multimodal.inputs.MultiModalInputs attribute) mm_placeholders (vllm.multimodal.inputs.MultiModalInputs attribute) mm_processor_kwargs (vllm.inputs.TextPrompt attribute) (vllm.inputs.TokensPrompt attribute) modality (vllm.multimodal.inputs.MultiModalFieldElem attribute) (vllm.multimodal.processing.PromptUpdate attribute) ModalityDataItems (class in vllm.multimodal.parse) mode (vllm.multimodal.processing.BoundPromptUpdate property) (vllm.multimodal.processing.PromptInsertion property) (vllm.multimodal.processing.PromptReplacement property) (vllm.multimodal.processing.PromptUpdate property) module vllm.engine vllm.model_executor.models.adapters vllm.model_executor.models.interfaces vllm.model_executor.models.interfaces_base vllm.multimodal.parse vllm.multimodal.processing vllm.multimodal.profiling vllm.multimodal.registry multi_modal_data (vllm.inputs.TextPrompt attribute) (vllm.inputs.TokensPrompt attribute) (vllm.multimodal.profiling.DummyDecoderData attribute) multi_modal_placeholders (vllm.multimodal.profiling.DummyDecoderData attribute) MULTIMODAL_REGISTRY (in module vllm.multimodal) MultiModalDataDict (in module vllm.multimodal.inputs) MultiModalDataItems (class in vllm.multimodal.parse) MultiModalDataParser (class in vllm.multimodal.parse) MultiModalEmbeddings (in module vllm.model_executor.models.interfaces) MultiModalFieldConfig (class in vllm.multimodal.inputs) MultiModalFieldElem (class in vllm.multimodal.inputs) MultiModalInputs (class in vllm.multimodal.inputs) MultiModalKwargs (class in vllm.multimodal.inputs) MultiModalKwargsItem (class in vllm.multimodal.inputs) MultiModalProcessorFactory (class in vllm.multimodal.registry) MultiModalProfiler (class in vllm.multimodal.profiling) MultiModalRegistry (class in vllm.multimodal.registry) N NestedTensors (in module vllm.multimodal.inputs) O offset (vllm.multimodal.inputs.PlaceholderRange attribute) P PlaceholderFeaturesInfo (class in vllm.multimodal.processing) PlaceholderRange (class in vllm.multimodal.inputs) pooler() (vllm.model_executor.models.interfaces_base.VllmModelForPooling method) PoolingParams (class in vllm) ProcessingInfoFactory (class in vllm.multimodal.registry) ProcessorBatchItems (class in vllm.multimodal.parse) ProcessorInputs (class in vllm.multimodal.profiling) prompt (vllm.inputs.TextPrompt attribute) (vllm.multimodal.inputs.MultiModalInputs attribute) prompt_token_ids (vllm.inputs.TokensPrompt attribute) (vllm.multimodal.inputs.MultiModalInputs attribute) (vllm.multimodal.profiling.DummyDecoderData attribute) (vllm.multimodal.profiling.DummyEncoderData attribute) PromptIndex (class in vllm.multimodal.processing) PromptInsertion (class in vllm.multimodal.processing) PromptReplacement (class in vllm.multimodal.processing) PromptSeq (in module vllm.multimodal.processing) PromptTarget (in module vllm.multimodal.processing) PromptTargetMatch (class in vllm.multimodal.processing) PromptType (in module vllm.inputs) PromptUpdate (class in vllm.multimodal.processing) PromptUpdateContent (in module vllm.multimodal.processing) PromptUpdateDetails (class in vllm.multimodal.processing) PromptUpdateInfo (in module vllm.multimodal.processing) R register_image_input_mapper() (vllm.multimodal.registry.MultiModalRegistry method) register_input_mapper() (vllm.multimodal.registry.MultiModalRegistry method) register_max_image_tokens() (vllm.multimodal.registry.MultiModalRegistry method) register_max_multimodal_tokens() (vllm.multimodal.registry.MultiModalRegistry method) register_plugin() (vllm.multimodal.registry.MultiModalRegistry method) register_processor() (vllm.multimodal.registry.MultiModalRegistry method) replace_token_matches() (in module vllm.multimodal.processing) replacement (vllm.multimodal.processing.PromptReplacement attribute) reset_prefix_cache() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) run_engine_loop() (vllm.AsyncLLMEngine static method) S sample() (vllm.model_executor.models.interfaces_base.VllmModelForTextGeneration method) SamplingParams (class in vllm) score() (vllm.LLM method) shared() (vllm.multimodal.inputs.MultiModalFieldConfig static method) shutdown_background_loop() (vllm.AsyncLLMEngine method) sleep() (vllm.AsyncLLMEngine method) (vllm.LLM method) start_background_loop() (vllm.AsyncLLMEngine method) start_profile() (vllm.AsyncLLMEngine method) step() (vllm.LLMEngine method) stop_profile() (vllm.AsyncLLMEngine method) supports_lora (vllm.model_executor.models.interfaces.SupportsLoRA attribute) supports_multimodal (vllm.model_executor.models.interfaces.SupportsMultiModal attribute) supports_pp (vllm.model_executor.models.interfaces.SupportsPP attribute) SupportsCrossEncoding (class in vllm.model_executor.models.interfaces) SupportsLoRA (class in vllm.model_executor.models.interfaces) SupportsMultiModal (class in vllm.model_executor.models.interfaces) SupportsPP (class in vllm.model_executor.models.interfaces) SupportsQuant (class in vllm.model_executor.models.interfaces) SupportsTranscription (class in vllm.model_executor.models.interfaces) SupportsV0Only (class in vllm.model_executor.models.interfaces) T target (vllm.multimodal.processing.BoundPromptUpdate property) (vllm.multimodal.processing.PromptUpdate attribute) TextPrompt (class in vllm.inputs) token_type_ids (vllm.inputs.TokensPrompt attribute) (vllm.multimodal.inputs.MultiModalInputs attribute) TokensPrompt (class in vllm.inputs) type (vllm.multimodal.inputs.MultiModalInputs attribute) U update_from_generation_config() (vllm.SamplingParams method) UpdateMode (class in vllm.multimodal.processing) V VideoEmbeddingItems (class in vllm.multimodal.parse) VideoProcessorItems (class in vllm.multimodal.parse) vllm.engine module vllm.model_executor.models.adapters module vllm.model_executor.models.interfaces module vllm.model_executor.models.interfaces_base module vllm.multimodal.parse module vllm.multimodal.processing module vllm.multimodal.profiling module vllm.multimodal.registry module VllmModel (class in vllm.model_executor.models.interfaces_base) VllmModelForPooling (class in vllm.model_executor.models.interfaces_base) VllmModelForTextGeneration (class in vllm.model_executor.models.interfaces_base) W wake_up() (vllm.AsyncLLMEngine method) (vllm.LLM method) width (vllm.multimodal.parse.ImageSize attribute)