Skip to content

vllm.pooling_params

PoolingParams

Bases: Struct

API parameters for pooling models. This is currently a placeholder.

Attributes:

Name Type Description
dimensions Optional[int]

Reduce the dimensions of embeddings if the model supports matryoshka representation.

additional_data Optional[Any]

Any additional data needed for pooling.

Source code in vllm/pooling_params.py
class PoolingParams(
        msgspec.Struct,
        omit_defaults=True,  # type: ignore[call-arg]
        array_like=True):  # type: ignore[call-arg]
    """API parameters for pooling models. This is currently a placeholder.

    Attributes:
        dimensions: Reduce the dimensions of embeddings
                    if the model supports matryoshka representation.
        additional_data: Any additional data needed for pooling.
        output_kind: Output mode of the request. Only
                     ``RequestOutputKind.FINAL_ONLY`` is accepted
                     (checked in ``__post_init__``).
    """

    dimensions: Optional[int] = None
    additional_data: Optional[Any] = None
    output_kind: RequestOutputKind = RequestOutputKind.FINAL_ONLY

    def clone(self) -> "PoolingParams":
        """Returns a deep copy of the PoolingParams instance.

        ``additional_data`` is deep-copied so that mutating the payload of
        the clone can never leak back into the original (and vice versa).
        ``output_kind`` is not forwarded, so the copy gets the default value.
        """
        # Function-scope import so this class does not depend on a new
        # module-level import being present.
        from copy import deepcopy

        return PoolingParams(dimensions=self.dimensions,
                             additional_data=deepcopy(self.additional_data))

    def verify(self, model_config: "ModelConfig") -> None:
        """Validate ``dimensions`` against the given model configuration.

        Does nothing when ``dimensions`` is ``None``.

        Args:
            model_config: Configuration providing ``is_matryoshka``,
                ``matryoshka_dimensions`` and ``served_model_name``.

        Raises:
            ValueError: If ``dimensions`` is set and
                ``model_config.is_matryoshka`` is false; if
                ``model_config.matryoshka_dimensions`` is not ``None`` and
                does not contain ``dimensions``; or if it is ``None`` and
                ``dimensions`` is smaller than 1.
        """
        if self.dimensions is not None:
            if not model_config.is_matryoshka:
                raise ValueError(
                    f'Model "{model_config.served_model_name}" does not '
                    f'support matryoshka representation, '
                    f'changing output dimensions will lead to poor results.')

            mds = model_config.matryoshka_dimensions
            if mds is not None:
                # The model lists explicit sizes: only those are allowed.
                if self.dimensions not in mds:
                    raise ValueError(
                        f'Model "{model_config.served_model_name}" '
                        f'only supports {str(mds)} matryoshka dimensions, '
                        f'use other output dimensions will '
                        f'lead to poor results.')
            elif self.dimensions < 1:
                # No explicit list: only reject non-positive sizes.
                raise ValueError("Dimensions must be greater than 0")

    def __repr__(self) -> str:
        """Return a string showing ``dimensions`` and ``additional_data``."""
        # The label matches the real field name (was "additional_metadata").
        return (f"PoolingParams("
                f"dimensions={self.dimensions}, "
                f"additional_data={self.additional_data})")

    def __post_init__(self) -> None:
        """Check that ``output_kind`` is ``RequestOutputKind.FINAL_ONLY``.

        Raises:
            AssertionError: If ``output_kind`` has any other value.
        """
        # NOTE: this is an ``assert``, so the check is skipped entirely when
        # Python runs with optimizations enabled (``-O``).
        assert self.output_kind == RequestOutputKind.FINAL_ONLY,\
            "For pooling output_kind has to be FINAL_ONLY"

additional_data class-attribute instance-attribute

additional_data: Optional[Any] = None

dimensions class-attribute instance-attribute

dimensions: Optional[int] = None

output_kind class-attribute instance-attribute

output_kind: RequestOutputKind = RequestOutputKind.FINAL_ONLY

__post_init__

__post_init__() -> None
Source code in vllm/pooling_params.py
def __post_init__(self) -> None:
    """Check that ``output_kind`` is ``RequestOutputKind.FINAL_ONLY``.

    Raises:
        AssertionError: If ``output_kind`` has any other value.
    """
    failure_message = "For pooling output_kind has to be FINAL_ONLY"
    assert self.output_kind == RequestOutputKind.FINAL_ONLY, failure_message

__repr__

__repr__() -> str
Source code in vllm/pooling_params.py
def __repr__(self) -> str:
    """Return a string showing ``dimensions`` and ``additional_data``."""
    # The label matches the real field name (was "additional_metadata").
    return (f"PoolingParams("
            f"dimensions={self.dimensions}, "
            f"additional_data={self.additional_data})")

clone

clone() -> PoolingParams

Returns a deep copy of the PoolingParams instance.

Source code in vllm/pooling_params.py
def clone(self) -> "PoolingParams":
    """Returns a deep copy of the PoolingParams instance.

    ``additional_data`` is deep-copied so that mutating the payload of the
    clone can never leak back into the original (and vice versa).
    """
    # Function-scope import so no new module-level import is required.
    from copy import deepcopy

    return PoolingParams(dimensions=self.dimensions,
                         additional_data=deepcopy(self.additional_data))

verify

verify(model_config: ModelConfig) -> None
Source code in vllm/pooling_params.py
def verify(self, model_config: "ModelConfig") -> None:
    """Validate ``dimensions`` against the given model configuration.

    Does nothing when ``dimensions`` is ``None``.

    Args:
        model_config: Configuration providing ``is_matryoshka``,
            ``matryoshka_dimensions`` and ``served_model_name``.

    Raises:
        ValueError: If ``dimensions`` is set and
            ``model_config.is_matryoshka`` is false; if
            ``model_config.matryoshka_dimensions`` is not ``None`` and does
            not contain ``dimensions``; or if it is ``None`` and
            ``dimensions`` is smaller than 1.
    """
    requested = self.dimensions
    if requested is None:
        # Nothing was requested, so there is nothing to validate.
        return

    if not model_config.is_matryoshka:
        raise ValueError(
            f'Model "{model_config.served_model_name}" does not support '
            f'matryoshka representation, changing output dimensions '
            f'will lead to poor results.')

    allowed = model_config.matryoshka_dimensions
    if allowed is None:
        # No explicit list of sizes: only reject non-positive values.
        if requested < 1:
            raise ValueError("Dimensions must be greater than 0")
        return

    if requested not in allowed:
        raise ValueError(
            f'Model "{model_config.served_model_name}" only supports '
            f'{str(allowed)} matryoshka dimensions, use other output '
            f'dimensions will lead to poor results.')