aidial_sdk/deployment/truncate_prompt.py (15 lines of code) (raw):

from typing import List, Literal, Union from aidial_sdk.chat_completion.request import ChatCompletionRequest from aidial_sdk.deployment.from_request_mixin import FromRequestDeploymentMixin from aidial_sdk.pydantic_v1 import BaseModel class TruncatePromptRequest(FromRequestDeploymentMixin): inputs: List[ChatCompletionRequest] class TruncatePromptSuccess(BaseModel): status: Literal["success"] = "success" discarded_messages: List[int] class TruncatePromptError(BaseModel): status: Literal["error"] = "error" error: str TruncatePromptResult = Union[TruncatePromptSuccess, TruncatePromptError] class TruncatePromptResponse(BaseModel): outputs: List[TruncatePromptResult]