File tree Expand file tree Collapse file tree 1 file changed +19
-0
lines changed
google/cloud/aiplatform/v1 Expand file tree Collapse file tree 1 file changed +19
-0
lines changed Original file line number Diff line number Diff line change @@ -54,6 +54,25 @@ message MachineSpec {
5454 // The number of accelerators to attach to the machine.
5555 int32 accelerator_count = 3 ;
5656
57+ // Optional. Immutable. The NVIDIA GPU partition size.
58+ //
59+ // When specified, the requested accelerators will be partitioned into
60+ // smaller GPU partitions. For example, if the request is for 8 units of
61+ // NVIDIA A100 GPUs, and gpu_partition_size="1g.10gb", the service will
62+ // create 8 * 7 = 56 partitioned MIG instances.
63+ //
64+ // The partition size must be a value supported by the requested accelerator.
65+ // Refer to
66+ // [NVIDIA GPU
67+ // Partitioning](https://cloud.google.com/kubernetes-engine/docs/how-to/gpus-multi#multi-instance_gpu_partitions)
68+ // for the available partition sizes.
69+ //
70+ // If set, the accelerator_count should be set to 1.
71+ string gpu_partition_size = 7 [
72+ (google.api.field_behavior ) = IMMUTABLE ,
73+ (google.api.field_behavior ) = OPTIONAL
74+ ];
75+
5776 // Immutable. The topology of the TPUs. Corresponds to the TPU topologies
5877 // available from GKE. (Example: tpu_topology: "2x2x1").
5978 string tpu_topology = 4 [(google.api.field_behavior ) = IMMUTABLE ];
You can’t perform that action at this time.
0 commit comments