Skip to content

vllm_gaudi.models.qwen3_vl_moe

HpuQwen3_VLMoeForConditionalGeneration

Bases: Qwen3VLMoeForConditionalGeneration

Source code in vllm_gaudi/models/qwen3_vl_moe.py
class HpuQwen3_VLMoeForConditionalGeneration(Qwen3VLMoeForConditionalGeneration):
    """Qwen3-VL MoE conditional-generation model with its MoE blocks upgraded in place.

    Construction is delegated to ``Qwen3VLMoeForConditionalGeneration``; the
    only addition is a post-init pass over ``self.language_model`` (when the
    attribute exists) via ``upgrade_qwen3_moe_blocks_inplace``.
    """

    def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
        """Build the base model, then upgrade the language model's MoE blocks.

        Args:
            vllm_config: Forwarded unchanged to the base-class constructor.
            prefix: Forwarded unchanged to the base-class constructor.
        """
        super().__init__(vllm_config=vllm_config, prefix=prefix)

        # The attribute is looked up defensively: when the base class does not
        # set `language_model` (or sets it to None) there is nothing to upgrade.
        language_model = getattr(self, "language_model", None)
        if language_model is None:
            return

        # Qwen3 MoE MLP blocks: make forward safe for 3D input
        # (b, s, h -> t, h). The helper's return value is not needed here.
        upgrade_qwen3_moe_blocks_inplace(language_model)

__init__

__init__(*, vllm_config: VllmConfig, prefix: str = '')
Source code in vllm_gaudi/models/qwen3_vl_moe.py
def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
    """Initialize the base model and upgrade its Qwen3 MoE blocks in place.

    Args:
        vllm_config: Forwarded unchanged to the base-class constructor.
        prefix: Forwarded unchanged to the base-class constructor.
    """
    super().__init__(vllm_config=vllm_config, prefix=prefix)

    # Nothing to upgrade when `language_model` is absent or None.
    language_model = getattr(self, "language_model", None)
    if language_model is None:
        return

    # Qwen3 MoE MLP blocks: make forward safe for 3D input (b, s, h -> t, h).
    # The helper's return value is intentionally discarded.
    upgrade_qwen3_moe_blocks_inplace(language_model)