vllm_omni.diffusion.models.wan2_2.pipeline_wan2_2 ¶

DEBUG_PERF `module-attribute` ¶

DEBUG_PERF = False

WAN_SAMPLE_SOLVER_CHOICES `module-attribute` ¶

WAN_SAMPLE_SOLVER_CHOICES = {'unipc', 'euler'}

logger `module-attribute` ¶

logger = logging.getLogger(__name__)

Wan22Pipeline ¶

Bases: Module, PipelineParallelMixin, CFGParallelMixin, ProgressBarMixin, DiffusionPipelineProfilerMixin, SupportsComponentDiscovery

boundary_ratio `instance-attribute` ¶

boundary_ratio = od_config.boundary_ratio

current_timestep `property` ¶

current_timestep

device `instance-attribute` ¶

device = get_local_device()

do_classifier_free_guidance `property` ¶

do_classifier_free_guidance

expand_timesteps `instance-attribute` ¶

expand_timesteps = model_index.get(
    "expand_timesteps", False
)

guidance_scale `property` ¶

guidance_scale

has_transformer_2 `instance-attribute` ¶

has_transformer_2 = transformer_2_info[0] is not None

num_timesteps `property` ¶

num_timesteps

od_config `instance-attribute` ¶

od_config = od_config

scheduler `instance-attribute` ¶

scheduler = build_wan_scheduler(
    self._sample_solver, self._flow_shift
)

text_encoder `instance-attribute` ¶

text_encoder = from_pretrained_with_prefetch(
    UMT5EncoderModel.from_pretrained,
    model,
    subfolder="text_encoder",
    prefetch_list=component_subfolders,
    local_files_only=local_files_only,
    torch_dtype=dtype,
).to(self.device)

tokenizer `instance-attribute` ¶

tokenizer = from_pretrained_with_prefetch(
    AutoTokenizer.from_pretrained,
    model,
    subfolder="tokenizer",
    prefetch_list=component_subfolders,
    local_files_only=local_files_only,
)

transformer `instance-attribute` ¶

transformer = self._create_transformer(transformer_config)

transformer_2 `instance-attribute` ¶

transformer_2 = self._create_transformer(
    transformer_2_config
)

transformer_config `instance-attribute` ¶

transformer_config = self.transformer.config

vae `instance-attribute` ¶

vae = from_pretrained_with_prefetch(
    DistributedAutoencoderKLWan.from_pretrained,
    model,
    subfolder="vae",
    prefetch_list=component_subfolders,
    local_files_only=local_files_only,
    torch_dtype=dtype,
).to(self.device)

vae_scale_factor_spatial `instance-attribute` ¶

vae_scale_factor_spatial = (
    self.vae.config.scale_factor_spatial
    if getattr(self, "vae", None)
    else 8
)

vae_scale_factor_temporal `instance-attribute` ¶

vae_scale_factor_temporal = (
    self.vae.config.scale_factor_temporal
    if getattr(self, "vae", None)
    else 4
)

weights_sources `instance-attribute` ¶

weights_sources = []

check_inputs ¶

check_inputs(
    prompt,
    negative_prompt,
    height,
    width,
    prompt_embeds=None,
    negative_prompt_embeds=None,
    guidance_scale_2=None,
    boundary_ratio=None,
)

diffuse ¶

diffuse(
    latents: Tensor,
    timesteps: Tensor,
    prompt_embeds: Tensor,
    negative_prompt_embeds: Tensor | None,
    guidance_low: float,
    guidance_high: float,
    boundary_timestep: float | None,
    dtype: dtype,
    attention_kwargs: dict[str, Any],
    latent_condition: Tensor | None = None,
    first_frame_mask: Tensor | None = None,
) -> Tensor | AsyncLatents

encode_prompt ¶

encode_prompt(
    prompt: str | list[str],
    negative_prompt: str | list[str] | None = None,
    do_classifier_free_guidance: bool = True,
    num_videos_per_prompt: int = 1,
    max_sequence_length: int = 512,
    device: device | None = None,
    dtype: dtype | None = None,
)

forward ¶

forward(req: DiffusionRequestBatch) -> DiffusionOutput

load_weights ¶

load_weights(
    weights: Iterable[tuple[str, Tensor]],
) -> set[str]

Load weights using AutoWeightsLoader for vLLM integration.

predict_noise ¶

predict_noise(
    current_model: Module | None = None, **kwargs: Any
) -> Tensor | IntermediateTensors

Forward pass through transformer to predict noise.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `current_model` | `Module \| None` | The transformer model to use (`transformer` or `transformer_2`). | `None` |
| `**kwargs` | `Any` | Arguments to pass to the transformer. | `{}` |

Returns:

| Type | Description |
| --- | --- |
| `Tensor \| IntermediateTensors` | Predicted noise tensor, or `IntermediateTensors` on non-last pipeline-parallel (PP) stages. |

prepare_latents ¶

prepare_latents(
    batch_size: int,
    num_channels_latents: int,
    height: int,
    width: int,
    num_frames: int,
    dtype: dtype | None,
    device: device | None,
    generator: Generator | list[Generator] | None,
    latents: Tensor | None = None,
) -> Tensor

WanT2VDMD2Pipeline ¶

Bases: DMD2PipelineMixin, Wan22Pipeline

Wan 2.x T2V pipeline for FastGen DMD2-distilled models.

build_wan_scheduler ¶

build_wan_scheduler(
    sample_solver: str, flow_shift: float
) -> Any

create_transformer_from_config ¶

create_transformer_from_config(
    config: dict,
    quant_config: QuantizationConfig | None = None,
    prefix: str = "",
) -> WanTransformer3DModel

Create WanTransformer3DModel from config dict.

get_wan22_post_process_func ¶

get_wan22_post_process_func(od_config: OmniDiffusionConfig)

get_wan22_pre_process_func ¶

get_wan22_pre_process_func(od_config: OmniDiffusionConfig)

Pre-process function for Wan2.2: optionally loads and resizes the input image for image-to-video (I2V) mode.

load_transformer_config ¶

load_transformer_config(
    model_path: str,
    subfolder: str = "transformer",
    local_files_only: bool = True,
) -> dict

Load transformer config from model directory or HF Hub.

resolve_wan_flow_shift ¶

resolve_wan_flow_shift(
    req: OmniDiffusionRequest,
    od_config: OmniDiffusionConfig,
) -> float

resolve_wan_sample_solver ¶

resolve_wan_sample_solver(
    req: OmniDiffusionRequest, default: str = "unipc"
) -> str

retrieve_latents ¶

retrieve_latents(
    encoder_output: Tensor,
    generator: Generator | None = None,
    sample_mode: str = "sample",
)

Retrieve latents from VAE encoder output.

vllm_omni.diffusion.models.wan2_2.pipeline_wan2_2 ¶

DEBUG_PERF module-attribute ¶

WAN_SAMPLE_SOLVER_CHOICES module-attribute ¶

logger module-attribute ¶

Wan22Pipeline ¶

boundary_ratio instance-attribute ¶

current_timestep property ¶

device instance-attribute ¶

do_classifier_free_guidance property ¶

expand_timesteps instance-attribute ¶

guidance_scale property ¶

has_transformer_2 instance-attribute ¶

num_timesteps property ¶

od_config instance-attribute ¶

scheduler instance-attribute ¶

text_encoder instance-attribute ¶

tokenizer instance-attribute ¶

transformer instance-attribute ¶

transformer_2 instance-attribute ¶

transformer_config instance-attribute ¶

vae instance-attribute ¶

vae_scale_factor_spatial instance-attribute ¶

vae_scale_factor_temporal instance-attribute ¶

weights_sources instance-attribute ¶