feat: adds DWS and spot VM feature support to custom batch predictions 2.0

Google APIs · copybara-github · commit 9abc113b07cd · 2025-07-25T11:40:18.000-07:00
PiperOrigin-RevId: 787184611
diff --git a/google/cloud/aiplatform/v1beta1/machine_resources.proto b/google/cloud/aiplatform/v1beta1/machine_resources.proto
@@ -195,6 +195,18 @@ message BatchDedicatedResources {
   // Immutable. The maximum number of machine replicas the batch operation may
   // be scaled to. The default value is 10.
   int32 max_replica_count = 3 [(google.api.field_behavior) = IMMUTABLE];
+
+  // Optional. Immutable. If set, use Dynamic Workload Scheduler (DWS)
+  // resources to schedule the deployment workload. Reference:
+  // https://cloud.google.com/blog/products/compute/introducing-dynamic-workload-scheduler
+  FlexStart flex_start = 4 [
+    (google.api.field_behavior) = IMMUTABLE,
+    (google.api.field_behavior) = OPTIONAL
+  ];
+
+  // Optional. If true, schedule the deployment workload on [spot
+  // VMs](https://cloud.google.com/kubernetes-engine/docs/concepts/spot-vms).
+  bool spot = 5 [(google.api.field_behavior) = OPTIONAL];
 }
 
 // Statistics information about resource consumption.
@@ -256,6 +268,7 @@ message AutoscalingMetricSpec {
   // * For Online Prediction:
   // * `aiplatform.googleapis.com/prediction/online/accelerator/duty_cycle`
   // * `aiplatform.googleapis.com/prediction/online/cpu/utilization`
+  // * `aiplatform.googleapis.com/prediction/online/request_count`
   string metric_name = 1 [(google.api.field_behavior) = REQUIRED];
 
   // The target resource utilization in percentage (1% - 100%) for the given