Skip to content

vllm_omni.platforms.npu.omni_connectors

Modules:

| Name | Description |
| --- | --- |
| yuanrong_transfer_engine_connector | |

YuanrongTransferEngineConnector

Bases: OmniConnectorBase

Pull-based connector backed by Yuanrong transfer_engine.

allocator instance-attribute

allocator = BufferAllocator(pool_size, alignment=4096)

base_ptr instance-attribute

base_ptr = int(data_ptr())

can_put instance-attribute

can_put = role == 'sender'

config instance-attribute

config = {
    key: (expand_env_value(value))
    for key, value in (items())
}

device_name instance-attribute

device_name = _resolve_device_name(
    get("device_name", "auto"), protocol
)

engine instance-attribute

engine = TransferEngine()

host instance-attribute

host = (
    _get_local_ip()
    if lower() in AUTO_HOST_VALUES
    else host_config
)

pool instance-attribute

pool = empty(pool_size, dtype=uint8, device=pool_device)

pool_device instance-attribute

pool_device = _resolve_pool_device(
    get("memory_pool_device", "npu")
)

pool_size instance-attribute

pool_size = int(get('memory_pool_size', 1024 ** 3))

protocol instance-attribute

protocol = str(get('protocol', 'ascend'))

rpc_port instance-attribute

rpc_port = _resolve_port(get('rpc_port'), host, 'rpc_port')

sender_host instance-attribute

sender_host = get('sender_host')

sender_zmq_port instance-attribute

sender_zmq_port = _resolve_optional_port(
    sender_zmq_port, "sender_zmq_port"
)

supports_raw_data class-attribute instance-attribute

supports_raw_data: bool = True

zmq_ctx instance-attribute

zmq_ctx = Context()

zmq_port instance-attribute

zmq_port = _resolve_port(get('zmq_port'), host, 'zmq_port')

cleanup

cleanup(
    request_id: str,
    from_stage: str | None = None,
    to_stage: str | None = None,
) -> None

close

close() -> None

get

get(
    from_stage: str,
    to_stage: str,
    get_key: str,
    metadata: dict[str, Any] | None = None,
) -> tuple[Any, int] | None

get_connection_info

get_connection_info() -> dict[str, Any]

health

health() -> dict[str, Any]

put

put(
    from_stage: str, to_stage: str, put_key: str, data: Any
) -> tuple[bool, int, dict[str, Any] | None]

update_sender_info

update_sender_info(
    sender_host: str, sender_zmq_port: int
) -> None