# Web-viewer header captured along with this file (not part of the build config):
#   bearking58's picture
#   fix: try to have dynamic substitutions
#   be01f94
#   raw
#   history blame
#   1.58 kB
steps:
# Build the prediction-server image from the Dockerfile in
# core-model-prediction/. The previous step ran the `docker` image with
# `gcloud builds submit` arguments, which is not a valid docker command.
# $PROJECT_ID is a built-in Cloud Build substitution.
- name: "gcr.io/cloud-builders/docker"
  dir: "core-model-prediction"
  args:
  - "build"
  - "--tag"
  - "gcr.io/$PROJECT_ID/interview-ai-detector/model-prediction:latest"
  - "."
# Push right away (rather than relying on a top-level `images:` entry, which
# only pushes after every step has finished) because the model-upload step
# references this image by its :latest tag.
- name: "gcr.io/cloud-builders/docker"
  args:
  - "push"
  - "gcr.io/$PROJECT_ID/interview-ai-detector/model-prediction:latest"
# --- Vertex AI: upload model -> create endpoint -> deploy model -------------
#
# Each build step runs in its own container, so shell variables do not survive
# from one step to the next. The model and endpoint identifiers are therefore
# handed over through files in /workspace, which Cloud Build persists across
# steps.
#
# Cloud Build rewrites $NAME / ${NAME} in args before bash sees them. Only
# $PROJECT_ID, $_GCP_VERTEX_AI_REGION and $_GCP_VERTEX_AI_SA_EMAIL are meant to
# be substituted that way (the two `_GCP_*` values must be supplied as
# user-defined substitutions, e.g. by the trigger); every shell variable is
# lowercase and written with `$$` so it reaches bash untouched.

# Step: register the pushed container image as a Vertex AI model and record
# the resulting model resource name in /workspace/model_id.
- name: "gcr.io/google.com/cloudsdktool/cloud-sdk"
  entrypoint: "bash"
  args:
  - "-c"
  - |
    # Fail the step if gcloud fails instead of letting `echo` mask the error.
    set -euo pipefail
    # NOTE(review): confirm that `value(model)` yields the model resource name
    # with the gcloud version shipped in this image.
    model_id=$(gcloud ai models upload \
      --region="$_GCP_VERTEX_AI_REGION" \
      --container-ports=8080 \
      --container-image-uri="gcr.io/$PROJECT_ID/interview-ai-detector/model-prediction:latest" \
      --container-predict-route="/predict" \
      --container-health-route="/health" \
      --display-name="interview-ai-detector-model" \
      --format="value(model)")
    if [[ -z "$${model_id}" ]]; then
      echo "gcloud ai models upload returned no model name" >&2
      exit 1
    fi
    echo "_MODEL_ID=$${model_id}"
    printf '%s' "$${model_id}" > /workspace/model_id

# Step: create the serving endpoint and record its resource name in
# /workspace/endpoint_id.
- name: "gcr.io/google.com/cloudsdktool/cloud-sdk"
  entrypoint: "bash"
  args:
  - "-c"
  - |
    set -euo pipefail
    endpoint_id=$(gcloud ai endpoints create \
      --region="$_GCP_VERTEX_AI_REGION" \
      --display-name="interview-ai-detector-endpoint" \
      --format="value(name)")
    if [[ -z "$${endpoint_id}" ]]; then
      echo "gcloud ai endpoints create returned no endpoint name" >&2
      exit 1
    fi
    echo "_ENDPOINT_ID=$${endpoint_id}"
    printf '%s' "$${endpoint_id}" > /workspace/endpoint_id

# Step: deploy the uploaded model to the new endpoint on a single T4 GPU,
# using the identifiers written by the two steps above.
- name: "gcr.io/google.com/cloudsdktool/cloud-sdk"
  entrypoint: "bash"
  args:
  - "-c"
  - |
    set -euo pipefail
    endpoint_id=$(cat /workspace/endpoint_id)
    model_id=$(cat /workspace/model_id)
    # --model is documented as a model ID, so drop any
    # "projects/.../models/" prefix; a bare ID passes through unchanged.
    gcloud ai endpoints deploy-model "$${endpoint_id}" \
      --region="$_GCP_VERTEX_AI_REGION" \
      --model="$${model_id##*/}" \
      --display-name="interview-ai-detector-deployment" \
      --machine-type="n1-standard-4" \
      --accelerator="count=1,type=nvidia-tesla-t4" \
      --service-account="$_GCP_VERTEX_AI_SA_EMAIL"