vllm.plugins.io_processors.interface
IOProcessor ¶
Bases: ABC, Generic[IOProcessorInput, IOProcessorOutput]
Source code in vllm/plugins/io_processors/interface.py
__init__ ¶
__init__(vllm_config: VllmConfig)
output_to_response abstractmethod ¶
output_to_response(
plugin_output: IOProcessorOutput,
) -> IOProcessorResponse
parse_request abstractmethod ¶
parse_request(request: Any) -> IOProcessorInput
post_process abstractmethod ¶
post_process(
model_output: Sequence[PoolingRequestOutput],
request_id: Optional[str] = None,
**kwargs,
) -> IOProcessorOutput
post_process_async async ¶
post_process_async(
model_output: AsyncGenerator[
tuple[int, PoolingRequestOutput]
],
request_id: Optional[str] = None,
**kwargs,
) -> IOProcessorOutput
Source code in vllm/plugins/io_processors/interface.py
pre_process abstractmethod ¶
pre_process(
prompt: IOProcessorInput,
request_id: Optional[str] = None,
**kwargs,
) -> Union[PromptType, Sequence[PromptType]]
pre_process_async async ¶
pre_process_async(
prompt: IOProcessorInput,
request_id: Optional[str] = None,
**kwargs,
) -> Union[PromptType, Sequence[PromptType]]