Index A | B | C | D | E | F | G | H | I | L | M | N | O | P | R | S | T | U | V | W A abort() (vllm.AsyncLLMEngine method) abort_request() (vllm.LLMEngine method) add_lora() (vllm.AsyncLLMEngine method) add_request() (vllm.LLMEngine method) additional_data (vllm.PoolingParams attribute) apply() (vllm.multimodal.processing.BaseMultiModalProcessor method) apply_model() (vllm.LLM method) as_classification_model() (in module vllm.model_executor.models.adapters) as_embedding_model() (in module vllm.model_executor.models.adapters) as_reward_model() (in module vllm.model_executor.models.adapters) AsyncLLMEngine (class in vllm) AudioEmbeddingItems (class in vllm.multimodal.parse) AudioProcessorItems (class in vllm.multimodal.parse) B BaseDummyInputsBuilder (class in vllm.multimodal.profiling) BaseMultiModalProcessor (class in vllm.multimodal.processing) BaseProcessingInfo (class in vllm.multimodal.processing) batch() (vllm.multimodal.inputs.MultiModalKwargs static method) beam_search() (vllm.LLM method) BoundPromptReplacement (class in vllm.multimodal.processing) C chat() (vllm.LLM method) check_health() (vllm.AsyncLLMEngine method) classify() (vllm.LLM method) clone() (vllm.PoolingParams method) (vllm.SamplingParams method) collective_rpc() (vllm.LLM method) compute_logits() (vllm.model_executor.models.interfaces_base.VllmModelForTextGeneration method) create_input_mapper() (vllm.multimodal.registry.MultiModalRegistry method) create_processor() (vllm.multimodal.registry.MultiModalRegistry method) D DEPRECATE_INIT_POSARGS (vllm.LLM attribute) DEPRECATE_LEGACY (vllm.LLM attribute) do_log_stats() (vllm.LLMEngine method) DO_VALIDATE_OUTPUT (vllm.LLMEngine attribute) DummyInputsBuilderFactory (class in vllm.multimodal.registry) E embed() (vllm.LLM method) EmbeddingItems (class in vllm.multimodal.parse) encode() (vllm.AsyncLLMEngine method) (vllm.LLM method) engine_step() (vllm.AsyncLLMEngine method) F features (vllm.multimodal.processing.PromptReplacementDetails attribute) find_text_matches() (in module vllm.multimodal.processing) find_token_matches() (in module vllm.multimodal.processing) forward() (vllm.model_executor.models.interfaces.SupportsPP method) from_engine_args() (vllm.AsyncLLMEngine class method) (vllm.LLMEngine class method) from_items() (vllm.multimodal.inputs.MultiModalKwargs static method) full (vllm.multimodal.processing.PromptReplacementDetails attribute) full_groupby_modality() (in module vllm.multimodal.processing) G generate() (vllm.AsyncLLMEngine method) (vllm.LLM method) get() (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_all() (vllm.multimodal.parse.ModalityDataItems method) get_all_counts() (vllm.multimodal.parse.MultiModalDataItems method) get_count() (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.MultiModalDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_decoding_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_dummy_processor_inputs() (vllm.multimodal.profiling.BaseDummyInputsBuilder method) get_hf_processor() (vllm.multimodal.processing.BaseProcessingInfo method) get_input_embeddings() (vllm.model_executor.models.interfaces.SupportsMultiModal method) get_input_preprocessor() (vllm.AsyncLLMEngine method) get_item() (vllm.multimodal.inputs.MultiModalKwargs method) get_item_count() (vllm.multimodal.inputs.MultiModalKwargs method) get_items() (vllm.multimodal.inputs.MultiModalKwargs method) (vllm.multimodal.parse.MultiModalDataItems method) get_lora_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_max_multimodal_tokens() (vllm.multimodal.registry.MultiModalRegistry method) get_max_tokens_by_modality() (vllm.multimodal.registry.MultiModalRegistry method) get_max_tokens_per_item_by_modality() (vllm.multimodal.registry.MultiModalRegistry method) get_max_tokens_per_item_by_nonzero_modality() (vllm.multimodal.registry.MultiModalRegistry method) get_mm_limits_per_prompt() (vllm.multimodal.registry.MultiModalRegistry method) get_mm_max_tokens_per_item() (vllm.multimodal.processing.BaseProcessingInfo method) get_model_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_multimodal_embeddings() (vllm.model_executor.models.interfaces.SupportsMultiModal method) get_num_unfinished_requests() (vllm.LLMEngine method) get_parallel_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_passthrough_data() (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_processor_data() (vllm.multimodal.parse.EmbeddingItems method) (vllm.multimodal.parse.ModalityDataItems method) (vllm.multimodal.parse.ProcessorBatchItems method) get_replacement() (vllm.multimodal.processing.BoundPromptReplacement method) get_scheduler_config() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) get_supported_mm_limits() (vllm.multimodal.processing.BaseProcessingInfo method) get_tokenizer() (vllm.AsyncLLMEngine method) H has_inner_state (vllm.model_executor.models.interfaces.HasInnerState attribute) has_processor() (vllm.multimodal.registry.MultiModalRegistry method) has_unfinished_requests() (vllm.LLMEngine method) has_unfinished_requests_for_virtual_engine() (vllm.LLMEngine method) HasInnerState (class in vllm.model_executor.models.interfaces) height (vllm.multimodal.parse.ImageSize attribute) I ImageEmbeddingItems (class in vllm.multimodal.parse) ImageProcessorItems (class in vllm.multimodal.parse) ImageSize (class in vllm.multimodal.parse) init_mm_limits_per_prompt() (vllm.multimodal.registry.MultiModalRegistry method) is_attention_free (vllm.model_executor.models.interfaces.IsAttentionFree attribute) is_hybrid (vllm.model_executor.models.interfaces.IsHybrid attribute) IsAttentionFree (class in vllm.model_executor.models.interfaces) IsHybrid (class in vllm.model_executor.models.interfaces) iter_token_matches() (in module vllm.multimodal.processing) L length (vllm.multimodal.inputs.PlaceholderRange attribute) LLM (class in vllm) LLMEngine (class in vllm) M make_empty_intermediate_tensors() (vllm.model_executor.models.interfaces.SupportsPP method) map_input() (vllm.multimodal.registry.MultiModalRegistry method) mm_hashes (vllm.multimodal.inputs.MultiModalInputs attribute) mm_kwargs (vllm.multimodal.inputs.MultiModalInputs attribute) mm_placeholders (vllm.multimodal.inputs.MultiModalInputs attribute) mm_processor_kwargs (vllm.inputs.TextPrompt attribute) (vllm.inputs.TokensPrompt attribute) modality (vllm.multimodal.processing.PromptReplacement attribute) ModalityDataItems (class in vllm.multimodal.parse) module vllm.engine vllm.model_executor.models.adapters vllm.model_executor.models.interfaces vllm.model_executor.models.interfaces_base vllm.multimodal.parse vllm.multimodal.processing vllm.multimodal.profiling vllm.multimodal.registry multi_modal_data (vllm.inputs.TextPrompt attribute) (vllm.inputs.TokensPrompt attribute) MULTIMODAL_REGISTRY (in module vllm.multimodal) MultiModalDataDict (in module vllm.multimodal.inputs) MultiModalDataItems (class in vllm.multimodal.parse) MultiModalDataParser (class in vllm.multimodal.parse) MultiModalFieldConfig (class in vllm.multimodal.inputs) MultiModalFieldElem (class in vllm.multimodal.inputs) MultiModalInputs (class in vllm.multimodal.inputs) MultiModalKwargs (class in vllm.multimodal.inputs) MultiModalKwargsItem (class in vllm.multimodal.inputs) MultiModalProcessorFactory (class in vllm.multimodal.registry) MultiModalProfiler (class in vllm.multimodal.profiling) MultiModalRegistry (class in vllm.multimodal.registry) N NestedTensors (in module vllm.multimodal.inputs) O offset (vllm.multimodal.inputs.PlaceholderRange attribute) P PlaceholderFeaturesInfo (class in vllm.multimodal.processing) PlaceholderRange (class in vllm.multimodal.inputs) pooler() (vllm.model_executor.models.interfaces_base.VllmModelForPooling method) PoolingParams (class in vllm) ProcessingInfoFactory (class in vllm.multimodal.registry) ProcessorBatchItems (class in vllm.multimodal.parse) ProcessorInputs (class in vllm.multimodal.profiling) prompt (vllm.inputs.TextPrompt attribute) (vllm.multimodal.inputs.MultiModalInputs attribute) prompt_token_ids (vllm.inputs.TokensPrompt attribute) (vllm.multimodal.inputs.MultiModalInputs attribute) PromptRepl (in module vllm.multimodal.processing) PromptReplacement (class in vllm.multimodal.processing) PromptReplacementDetails (class in vllm.multimodal.processing) PromptSeq (in module vllm.multimodal.processing) PromptType (in module vllm.inputs) R register_image_input_mapper() (vllm.multimodal.registry.MultiModalRegistry method) register_input_mapper() (vllm.multimodal.registry.MultiModalRegistry method) register_max_image_tokens() (vllm.multimodal.registry.MultiModalRegistry method) register_max_multimodal_tokens() (vllm.multimodal.registry.MultiModalRegistry method) register_plugin() (vllm.multimodal.registry.MultiModalRegistry method) register_processor() (vllm.multimodal.registry.MultiModalRegistry method) replace_text_matches() (in module vllm.multimodal.processing) replace_token_matches() (in module vllm.multimodal.processing) replacement (vllm.multimodal.processing.PromptReplacement attribute) reset_prefix_cache() (vllm.AsyncLLMEngine method) (vllm.LLMEngine method) run_engine_loop() (vllm.AsyncLLMEngine static method) S sample() (vllm.model_executor.models.interfaces_base.VllmModelForTextGeneration method) SamplingParams (class in vllm) score() (vllm.LLM method) shutdown_background_loop() (vllm.AsyncLLMEngine method) sleep() (vllm.LLM method) start_background_loop() (vllm.AsyncLLMEngine method) start_profile() (vllm.AsyncLLMEngine method) step() (vllm.LLMEngine method) stop_profile() (vllm.AsyncLLMEngine method) supports_lora (vllm.model_executor.models.interfaces.SupportsLoRA attribute) supports_multimodal (vllm.model_executor.models.interfaces.SupportsMultiModal attribute) supports_pp (vllm.model_executor.models.interfaces.SupportsPP attribute) SupportsCrossEncoding (class in vllm.model_executor.models.interfaces) SupportsLoRA (class in vllm.model_executor.models.interfaces) SupportsMultiModal (class in vllm.model_executor.models.interfaces) SupportsPP (class in vllm.model_executor.models.interfaces) T target (vllm.multimodal.processing.BoundPromptReplacement property) (vllm.multimodal.processing.PromptReplacement attribute) TextPrompt (class in vllm.inputs) token_type_ids (vllm.inputs.TokensPrompt attribute) (vllm.multimodal.inputs.MultiModalInputs attribute) TokensPrompt (class in vllm.inputs) type (vllm.multimodal.inputs.MultiModalInputs attribute) U update_from_generation_config() (vllm.SamplingParams method) V VideoEmbeddingItems (class in vllm.multimodal.parse) VideoProcessorItems (class in vllm.multimodal.parse) vllm.engine module vllm.model_executor.models.adapters module vllm.model_executor.models.interfaces module vllm.model_executor.models.interfaces_base module vllm.multimodal.parse module vllm.multimodal.processing module vllm.multimodal.profiling module vllm.multimodal.registry module VllmModel (class in vllm.model_executor.models.interfaces_base) VllmModelForPooling (class in vllm.model_executor.models.interfaces_base) VllmModelForTextGeneration (class in vllm.model_executor.models.interfaces_base) W width (vllm.multimodal.parse.ImageSize attribute)