feat: add reservation affinity proto

Google APIs · copybara-github · commit 333c1ece4e90 · 2024-08-05T14:46:47.000-07:00
feat: add spot field to Vertex Prediction's Dedicated Resources and Custom Training's Scheduling Strategy
docs: update the description for the deprecated GPU (K80)

PiperOrigin-RevId: 659688229
diff --git a/google/cloud/aiplatform/v1beta1/BUILD.bazel b/google/cloud/aiplatform/v1beta1/BUILD.bazel
@@ -120,6 +120,7 @@ proto_library(
         "pipeline_state.proto",
         "prediction_service.proto",
         "publisher_model.proto",
+        "reservation_affinity.proto",
         "reasoning_engine.proto",
         "reasoning_engine_execution_service.proto",
         "reasoning_engine_service.proto",
diff --git a/google/cloud/aiplatform/v1beta1/accelerator_type.proto b/google/cloud/aiplatform/v1beta1/accelerator_type.proto
@@ -29,7 +29,8 @@ enum AcceleratorType {
   // Unspecified accelerator type, which means no accelerator.
   ACCELERATOR_TYPE_UNSPECIFIED = 0;
 
-  // Nvidia Tesla K80 GPU.
+  // Deprecated: Nvidia Tesla K80 GPU has reached end of support,
+  // see https://cloud.google.com/compute/docs/eol/k80-eol.
   NVIDIA_TESLA_K80 = 1 [deprecated = true];
 
   // Nvidia Tesla P100 GPU.
diff --git a/google/cloud/aiplatform/v1beta1/custom_job.proto b/google/cloud/aiplatform/v1beta1/custom_job.proto
@@ -364,7 +364,13 @@ message Scheduling {
     ON_DEMAND = 1;
 
     // Low cost by making potential use of spot resources.
-    LOW_COST = 2;
+    LOW_COST = 2 [deprecated = true];
+
+    // Standard provisioning strategy uses regular on-demand resources.
+    STANDARD = 3;
+
+    // Spot provisioning strategy uses spot resources.
+    SPOT = 4;
   }
 
   // The maximum job running time. The default is 7 days.
diff --git a/google/cloud/aiplatform/v1beta1/machine_resources.proto b/google/cloud/aiplatform/v1beta1/machine_resources.proto
@@ -18,6 +18,7 @@ package google.cloud.aiplatform.v1beta1;
 
 import "google/api/field_behavior.proto";
 import "google/cloud/aiplatform/v1beta1/accelerator_type.proto";
+import "google/cloud/aiplatform/v1beta1/reservation_affinity.proto";
 
 option csharp_namespace = "Google.Cloud.AIPlatform.V1Beta1";
 option go_package = "cloud.google.com/go/aiplatform/apiv1beta1/aiplatformpb;aiplatformpb";
@@ -56,6 +57,13 @@ message MachineSpec {
   // Immutable. The topology of the TPUs. Corresponds to the TPU topologies
   // available from GKE. (Example: tpu_topology: "2x2x1").
   string tpu_topology = 4 [(google.api.field_behavior) = IMMUTABLE];
+
+  // Optional. Immutable. Configuration controlling how this resource pool
+  // consumes reservation.
+  ReservationAffinity reservation_affinity = 5 [
+    (google.api.field_behavior) = IMMUTABLE,
+    (google.api.field_behavior) = OPTIONAL
+  ];
 }
 
 // A description of resources that are dedicated to a DeployedModel, and
@@ -121,6 +129,10 @@ message DedicatedResources {
   // to `80`.
   repeated AutoscalingMetricSpec autoscaling_metric_specs = 4
       [(google.api.field_behavior) = IMMUTABLE];
+
+  // Optional. If true, schedule the deployment workload on [spot
+  // VMs](https://cloud.google.com/kubernetes-engine/docs/concepts/spot-vms).
+  bool spot = 5 [(google.api.field_behavior) = OPTIONAL];
 }
 
 // A description of resources that to large degree are decided by Vertex AI,
diff --git a/google/cloud/aiplatform/v1beta1/reservation_affinity.proto b/google/cloud/aiplatform/v1beta1/reservation_affinity.proto
@@ -0,0 +1,71 @@
+// Copyright 2024 Google LLC
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+syntax = "proto3";
+
+package google.cloud.aiplatform.v1beta1;
+
+import "google/api/field_behavior.proto";
+import "google/api/resource.proto";
+
+option csharp_namespace = "Google.Cloud.AIPlatform.V1Beta1";
+option go_package = "cloud.google.com/go/aiplatform/apiv1beta1/aiplatformpb;aiplatformpb";
+option java_multiple_files = true;
+option java_outer_classname = "ReservationAffinityProto";
+option java_package = "com.google.cloud.aiplatform.v1beta1";
+option php_namespace = "Google\\Cloud\\AIPlatform\\V1beta1";
+option ruby_package = "Google::Cloud::AIPlatform::V1beta1";
+option (google.api.resource_definition) = {
+  type: "compute.googleapis.com/Reservation"
+  pattern: "projects/{project_id_or_number}/zones/{zone}/reservations/{reservation_name}"
+};
+
+// A ReservationAffinity configures how a Vertex AI resource (e.g., a
+// DeployedModel) draws its Compute Engine resources: from a Shared
+// Reservation, or exclusively from on-demand capacity. See `Type`.
+message ReservationAffinity {
+  // Identifies the kind of reservation affinity to apply.
+  enum Type {
+    // Default value. This should not be used.
+    TYPE_UNSPECIFIED = 0;
+
+    // Do not consume from any reserved capacity; use on-demand capacity only.
+    NO_RESERVATION = 1;
+
+    // Consume any available reservation, falling back to on-demand capacity.
+    ANY_RESERVATION = 2;
+
+    // Consume from a specific reservation. When chosen, the reservation
+    // must be identified via the `key` and `values` fields.
+    SPECIFIC_RESERVATION = 3;
+  }
+
+  // Required. Specifies the reservation affinity type.
+  Type reservation_affinity_type = 1 [(google.api.field_behavior) = REQUIRED];
+
+  // Optional. Corresponds to the label key of a reservation resource. To target
+  // a SPECIFIC_RESERVATION by name, set this to
+  // `compute.googleapis.com/reservation-name` and identify the reservation in
+  // `values`.
+  string key = 2 [(google.api.field_behavior) = OPTIONAL];
+
+  // Optional. Corresponds to the label values of a reservation resource. Each
+  // value must be the full resource name of a Compute Engine reservation.
+  repeated string values = 3 [
+    (google.api.field_behavior) = OPTIONAL,
+    (google.api.resource_reference) = {
+      type: "compute.googleapis.com/Reservation"
+    }
+  ];
+}