vllm.entrypoints.pooling.pooling.protocol ¶
PoolingRequest module-attribute ¶
PoolingRequest: TypeAlias = (
PoolingCompletionRequest
| PoolingChatRequest
| IOProcessorRequest
)
IOProcessorRequest ¶
Bases: OpenAIBaseModel, Generic[T]
Source code in vllm/entrypoints/pooling/pooling/protocol.py
embed_dtype class-attribute instance-attribute ¶
embed_dtype: EmbedDType = Field(
default="float32",
description="What dtype to use for encoding. Default to using float32 for base64 encoding to match the OpenAI python client behavior. This parameter will affect base64 and binary_response.",
)
endianness class-attribute instance-attribute ¶
endianness: Endianness = Field(
default="native",
description="What endianness to use for encoding. Default to using native for base64 encoding to match the OpenAI python client behavior. This parameter will affect base64 and binary_response.",
)
IOProcessorResponse ¶
Bases: OpenAIBaseModel, Generic[T]
Source code in vllm/entrypoints/pooling/pooling/protocol.py
PoolingBytesResponse ¶
Bases: OpenAIBaseModel
Source code in vllm/entrypoints/pooling/pooling/protocol.py
PoolingChatRequest ¶
Bases: EmbeddingChatRequest
Source code in vllm/entrypoints/pooling/pooling/protocol.py
activation class-attribute instance-attribute ¶
activation: bool | None = Field(
default=None,
description="activation will be deprecated, please use use_activation instead.",
)
softmax class-attribute instance-attribute ¶
softmax: bool | None = Field(
default=None,
description="softmax will be deprecated, please use use_activation instead.",
)
use_activation class-attribute instance-attribute ¶
use_activation: bool | None = Field(
default=None,
description="Whether to use activation for classification outputs. If it is a classify or token_classify task, the default is True; for other tasks, this value should be None.",
)
to_pooling_params ¶
PoolingCompletionRequest ¶
Bases: EmbeddingCompletionRequest
Source code in vllm/entrypoints/pooling/pooling/protocol.py
activation class-attribute instance-attribute ¶
activation: bool | None = Field(
default=None,
description="activation will be deprecated, please use use_activation instead.",
)
softmax class-attribute instance-attribute ¶
softmax: bool | None = Field(
default=None,
description="softmax will be deprecated, please use use_activation instead.",
)
use_activation class-attribute instance-attribute ¶
use_activation: bool | None = Field(
default=None,
description="Whether to use activation for classification outputs. If it is a classify or token_classify task, the default is True; for other tasks, this value should be None.",
)
to_pooling_params ¶
PoolingResponse ¶
Bases: OpenAIBaseModel
Source code in vllm/entrypoints/pooling/pooling/protocol.py
created class-attribute instance-attribute ¶
id class-attribute instance-attribute ¶
id: str = Field(
default_factory=lambda: f"pool-{random_uuid()}"
)
PoolingResponseData ¶
Bases: OpenAIBaseModel