Skip to content

vllm_gaudi.models

Modules:

Name Description
gemma3_mm
interfaces
qwen2_5_vl
qwen3_moe
qwen3_vl
qwen3_vl_moe
utils

register_model

register_model()
Source code in vllm_gaudi/models/__init__.py
def register_model():
    """Register the HPU model implementations with ``ModelRegistry``.

    For each supported architecture the implementing module is imported and
    then ``ModelRegistry.register_model`` is called with two strings: the
    architecture identifier and a ``"<module path>:<class name>"`` reference
    to the HPU class.

    The imported class names are not used directly in this function (hence
    the ``noqa: F401`` markers); the import statements still execute, so a
    missing or broken model module surfaces here rather than later.
    """
    # --- Gemma3 (multimodal) ---
    from vllm_gaudi.models.gemma3_mm import HpuGemma3ForConditionalGeneration  # noqa: F401
    ModelRegistry.register_model(
        "Gemma3ForConditionalGeneration",  # Original architecture identifier in vLLM
        "vllm_gaudi.models.gemma3_mm:HpuGemma3ForConditionalGeneration",
    )

    # --- Qwen2.5-VL ---
    from vllm_gaudi.models.qwen2_5_vl import HpuQwen2_5_VLForConditionalGeneration  # noqa: F401
    ModelRegistry.register_model(
        "Qwen2_5_VLForConditionalGeneration",
        "vllm_gaudi.models.qwen2_5_vl:HpuQwen2_5_VLForConditionalGeneration",
    )

    # --- Qwen3-VL ---
    from vllm_gaudi.models.qwen3_vl import HpuQwen3_VLForConditionalGeneration  # noqa: F401
    ModelRegistry.register_model(
        "Qwen3VLForConditionalGeneration",
        "vllm_gaudi.models.qwen3_vl:HpuQwen3_VLForConditionalGeneration",
    )

    # --- Qwen3-VL MoE ---
    from vllm_gaudi.models.qwen3_vl_moe import HpuQwen3_VLMoeForConditionalGeneration  # noqa: F401
    ModelRegistry.register_model(
        "Qwen3VLMoeForConditionalGeneration",
        "vllm_gaudi.models.qwen3_vl_moe:HpuQwen3_VLMoeForConditionalGeneration",
    )