File size: 1,582 Bytes
3c4533d
 
 
358e4c4
3c4533d
 
 
585662b
e9072c9
3c4533d
c3aed00
3c4533d
 
585662b
 
3c4533d
 
358e4c4
dbb7ef8
3c4533d
 
 
dbb7ef8
e9072c9
3c4533d
dbb7ef8
3c4533d
 
 
09df726
3c4533d
 
 
d87e8e8
 
 
e9072c9
d87e8e8
3c4533d
 
 
e9072c9
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
steps:
  # Step "upload-model": runs `gcloud ai models upload` in us-central1 to
  # register the model-prediction container image under the display name
  # "interview-ai-detector-model". The container is declared to listen on
  # port 8080, with /predict as the prediction route and /health as the
  # health-check route.
  # ${PROJECT_ID} in the image URI is a Cloud Build substitution; it is
  # replaced before the script is handed to bash.
  - id: upload-model
    name: 'gcr.io/google.com/cloudsdktool/cloud-sdk'
    entrypoint: 'bash'
    args:
      - '-c'
      - |
        gcloud ai models upload \
          --display-name="interview-ai-detector-model" \
          --region="us-central1" \
          --container-image-uri="us-central1-docker.pkg.dev/${PROJECT_ID}/interview-ai-detector/model-prediction:latest" \
          --container-ports=8080 \
          --container-health-route="/health" \
          --container-predict-route="/predict"

  # Step "create-endpoint": starts only after "upload-model" has finished and
  # runs `gcloud ai endpoints create` in us-central1 with the display name
  # "interview-ai-detector-endpoint". --format="value(name)" restricts the
  # command's output to the new endpoint's name field.
  # NOTE(review): the create call is unconditional, so each build run asks for
  # another endpoint with the same display name - confirm that is intended.
  - id: create-endpoint
    name: 'gcr.io/google.com/cloudsdktool/cloud-sdk'
    entrypoint: 'bash'
    waitFor:
      - 'upload-model'
    args:
      - '-c'
      - |
        gcloud ai endpoints create \
          --display-name="interview-ai-detector-endpoint" \
          --region="us-central1" \
          --format="value(name)"

  # Step "deploy-model": starts after "create-endpoint" and deploys the
  # uploaded model to the endpoint on an n1-standard-4 machine with one
  # NVIDIA Tesla T4, running as the user-managed service account below.
  #
  # Why the script looks the way it does:
  #   * Shell variables are written as $${name}. Cloud Build treats "$_NAME"
  #     as a user-defined substitution and rewrites (or rejects) it before
  #     bash ever runs; "$$" is Cloud Build's escape for a literal "$".
  #   * Each lookup is its own statement. Chaining the assignments and the
  #     gcloud call with trailing backslashes would turn them into a single
  #     simple command, and bash expands the command's arguments before such
  #     prefix assignments take effect, so both IDs would expand to "".
  #   * The model and endpoint are selected by display name, newest first,
  #     rather than taking whatever happens to be first in an unfiltered list.
  #   * The script deliberately contains no "$" inside its own comments, since
  #     Cloud Build scans the whole argument string for substitutions.
  # NOTE(review): the service account is pinned to project
  # steady-climate-416810 rather than derived from the build's project -
  # confirm this is intentional.
  - id: deploy-model
    name: 'gcr.io/google.com/cloudsdktool/cloud-sdk'
    entrypoint: 'bash'
    waitFor: ['create-endpoint']
    args:
      - '-c'
      - |
        # Stop on the first failing command, unset variable, or failed pipe stage.
        set -euo pipefail

        # Most recently created model with the display name used at upload time.
        model_id="$(gcloud ai models list \
          --region="us-central1" \
          --filter="displayName=interview-ai-detector-model" \
          --sort-by="~createTime" \
          --limit=1 \
          --format="value(name)")"

        # Most recently created endpoint with the display name used at creation time.
        endpoint_id="$(gcloud ai endpoints list \
          --region="us-central1" \
          --filter="displayName=interview-ai-detector-endpoint" \
          --sort-by="~createTime" \
          --limit=1 \
          --format="value(name)")"

        # Fail with a clear message instead of calling deploy-model with blanks.
        if [[ -z "$${model_id}" ]]; then
          echo "No model named interview-ai-detector-model found in us-central1" >&2
          exit 1
        fi
        if [[ -z "$${endpoint_id}" ]]; then
          echo "No endpoint named interview-ai-detector-endpoint found in us-central1" >&2
          exit 1
        fi

        gcloud ai endpoints deploy-model "$${endpoint_id}" \
          --region="us-central1" \
          --model="$${model_id}" \
          --display-name="interview-ai-detector-deployment" \
          --machine-type="n1-standard-4" \
          --accelerator="count=1,type=nvidia-tesla-t4" \
          --service-account="vertex-ai-user-managed-sa@steady-climate-416810.iam.gserviceaccount.com"