# ai-ml/t5-model-serving/kubernetes/application.yaml
# Copyright 2023 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Deployment for the "fastdash" client application: a single replica of one
# container that is told, via environment variables, where to reach the
# t5-inference backend.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: fastdash
  labels:
    app: fastdash
spec:
  replicas: 1
  selector:
    matchLabels:
      # Must match the pod template labels below.
      app: fastdash
  template:
    metadata:
      labels:
        app: fastdash
    spec:
      containers:
        - name: main
          # PROJECT_ID is a placeholder to substitute before applying.
          # NOTE(review): with a mutable ":latest" tag, IfNotPresent lets a
          # node keep using a previously pulled image; consider pinning a
          # version tag or digest.
          image: us-central1-docker.pkg.dev/PROJECT_ID/models/fastdash:latest
          imagePullPolicy: IfNotPresent
          env:
            # Inference endpoint: model "t5-small", version "1.0", port 8080.
            - name: MODEL_PREDICTION
              value: "http://t5-inference:8080/predictions/t5-small/1.0"
            # Management endpoint on port 8081. The management API addresses
            # a model as /models/<name>; the /predictions/ prefix belongs to
            # the inference API on 8080 and was removed from this URL.
            # NOTE(review): assumes t5-inference is a TorchServe instance with
            # default API layout - confirm against the client app's usage.
            - name: MODEL_MANAGEMENT
              value: "http://t5-inference:8081/models/t5-small"
          resources:
            # Requests are set equal to limits for every resource.
            limits:
              cpu: 250m
              memory: 512Mi
              ephemeral-storage: 1Gi
            requests:
              cpu: 250m
              memory: 512Mi
              ephemeral-storage: 1Gi
          ports:
            # Named so the probe below and the Service can refer to "http".
            - containerPort: 8050
              name: http
          # The pod is considered ready once GET / on the "http" port succeeds.
          readinessProbe:
            httpGet:
              path: /
              port: http
---
# Cluster-internal Service for the fastdash pods: exposes port 8050 and
# forwards to the container port named "http" on pods labelled app=fastdash.
kind: Service
apiVersion: v1
metadata:
  labels:
    app: fastdash
  name: fastdash
spec:
  # Pods are selected by label.
  selector:
    app: fastdash
  # ClusterIP: reachable only from inside the cluster.
  type: ClusterIP
  ports:
    - name: http
      port: 8050
      # Resolved by name against the selected pods' container ports.
      targetPort: http