Skip to content

vllm_omni.platforms.npu.omni_connectors

Modules:

| Name | Description |
| --- | --- |
| `yuanrong_transfer_engine_connector` | |

YuanrongTransferEngineConnector

Bases: OmniConnectorBase

Pull-based connector backed by the Yuanrong `transfer_engine`.

allocator instance-attribute

allocator = BufferAllocator(self.pool_size, alignment=4096)

base_ptr instance-attribute

base_ptr = int(self.pool.data_ptr())

can_put instance-attribute

can_put = role == 'sender'

config instance-attribute

config = {
    key: (expand_env_value(value))
    for key, value in (config.items())
}

device_name instance-attribute

device_name = _resolve_device_name(
    config.get("device_name", "auto"), self.protocol
)

engine instance-attribute

engine = TransferEngine()

host instance-attribute

host = (
    self._get_local_ip()
    if host_config.lower() in AUTO_HOST_VALUES
    else host_config
)

pool instance-attribute

pool = torch.empty(
    self.pool_size,
    dtype=torch.uint8,
    device=self.pool_device,
)

pool_device instance-attribute

pool_device = _resolve_pool_device(
    config.get("memory_pool_device", "npu")
)

pool_size instance-attribute

pool_size = int(config.get('memory_pool_size', 1024 ** 3))

protocol instance-attribute

protocol = str(config.get('protocol', 'ascend'))

rpc_port instance-attribute

rpc_port = self._resolve_port(
    config.get("rpc_port"), self.host, "rpc_port"
)

sender_host instance-attribute

sender_host = config.get('sender_host')

sender_zmq_port instance-attribute

sender_zmq_port = self._resolve_optional_port(
    sender_zmq_port, "sender_zmq_port"
)

supports_raw_data class-attribute instance-attribute

supports_raw_data: bool = True

zmq_ctx instance-attribute

zmq_ctx = zmq.Context()

zmq_port instance-attribute

zmq_port = self._resolve_port(
    config.get("zmq_port"), self.host, "zmq_port"
)

cleanup

cleanup(
    request_id: str,
    from_stage: str | None = None,
    to_stage: str | None = None,
) -> None

close

close() -> None

get

get(
    from_stage: str,
    to_stage: str,
    get_key: str,
    metadata: dict[str, Any] | None = None,
) -> tuple[Any, int] | None

get_connection_info

get_connection_info() -> dict[str, Any]

health

health() -> dict[str, Any]

put

put(
    from_stage: str, to_stage: str, put_key: str, data: Any
) -> tuple[bool, int, dict[str, Any] | None]

update_sender_info

update_sender_info(
    sender_host: str, sender_zmq_port: int
) -> None