aidial_adapter_vertexai/deployments.py (45 lines of code) (raw):
from enum import Enum
from typing import Literal
class ChatCompletionDeployment(str, Enum):
CHAT_BISON_1 = "chat-bison@001"
CHAT_BISON_2 = "chat-bison@002"
CHAT_BISON_2_32K = "chat-bison-32k@002"
CODECHAT_BISON_1 = "codechat-bison@001"
CODECHAT_BISON_2 = "codechat-bison@002"
CODECHAT_BISON_2_32K = "codechat-bison-32k@002"
GEMINI_PRO_1 = "gemini-pro"
GEMINI_PRO_VISION_1 = "gemini-pro-vision"
GEMINI_PRO_1_5_PREVIEW = "gemini-1.5-pro-preview-0409"
GEMINI_PRO_1_5_V1 = "gemini-1.5-pro-001"
GEMINI_PRO_1_5_V2 = "gemini-1.5-pro-002"
GEMINI_FLASH_1_5_V1 = "gemini-1.5-flash-001"
GEMINI_FLASH_1_5_V2 = "gemini-1.5-flash-002"
GEMINI_2_0_EXPERIMENTAL_1206 = "gemini-exp-1206"
GEMINI_2_0_FLASH_EXP = "gemini-2.0-flash-exp"
GEMINI_2_0_FLASH_THINKING_EXP_1219 = "gemini-2.0-flash-thinking-exp-1219"
IMAGEN_005 = "imagegeneration@005"
def get_model_id(self) -> str:
return self.value
GeminiDeployment = Literal[
ChatCompletionDeployment.GEMINI_PRO_1,
ChatCompletionDeployment.GEMINI_PRO_VISION_1,
ChatCompletionDeployment.GEMINI_PRO_1_5_PREVIEW,
ChatCompletionDeployment.GEMINI_PRO_1_5_V1,
ChatCompletionDeployment.GEMINI_PRO_1_5_V2,
ChatCompletionDeployment.GEMINI_FLASH_1_5_V1,
ChatCompletionDeployment.GEMINI_FLASH_1_5_V2,
]
Gemini2Deployment = Literal[
ChatCompletionDeployment.GEMINI_2_0_EXPERIMENTAL_1206,
ChatCompletionDeployment.GEMINI_2_0_FLASH_EXP,
ChatCompletionDeployment.GEMINI_2_0_FLASH_THINKING_EXP_1219,
]
class EmbeddingsDeployment(str, Enum):
# English models
TEXT_EMBEDDING_GECKO_1 = "textembedding-gecko@001"
TEXT_EMBEDDING_GECKO_3 = "textembedding-gecko@003"
TEXT_EMBEDDING_4 = "text-embedding-004"
# Multilingual models
TEXT_EMBEDDING_GECKO_MULTILINGUAL_1 = "textembedding-gecko-multilingual@001"
TEXT_MULTILINGUAL_EMBEDDING_2 = "text-multilingual-embedding-002"
MULTI_MODAL_EMBEDDING_1 = "multimodalembedding@001"
def get_model_id(self) -> str:
return self.value