feat: add gpu_partition_size in machine_spec v1 api

Google APIs · copybara-github · commit df29a8257419 · 2025-11-18T11:35:46.000-08:00
PiperOrigin-RevId: 833901564
diff --git a/google/cloud/aiplatform/v1/machine_resources.proto b/google/cloud/aiplatform/v1/machine_resources.proto
@@ -54,6 +54,25 @@ message MachineSpec {
   // The number of accelerators to attach to the machine.
   int32 accelerator_count = 3;
 
+  // Optional. Immutable. The NVIDIA GPU partition size.
+  //
+  // When specified, the requested accelerators will be partitioned into
+  // smaller GPU partitions. For example, if the request is for 8 units of
+  // NVIDIA A100 GPUs, and gpu_partition_size="1g.10gb", the service will
+  // create 8 * 7 = 56 partitioned MIG instances.
+  //
+  // The partition size must be a value supported by the requested accelerator.
+  // Refer to
+  // [NVIDIA GPU
+  // Partitioning](https://cloud.google.com/kubernetes-engine/docs/how-to/gpus-multi#multi-instance_gpu_partitions)
+  // for the available partition sizes.
+  //
+  // If set, the accelerator_count should be set to 1.
+  string gpu_partition_size = 7 [
+    (google.api.field_behavior) = IMMUTABLE,
+    (google.api.field_behavior) = OPTIONAL
+  ];
+
   // Immutable. The topology of the TPUs. Corresponds to the TPU topologies
   // available from GKE. (Example: tpu_topology: "2x2x1").
   string tpu_topology = 4 [(google.api.field_behavior) = IMMUTABLE];