File tree Expand file tree Collapse file tree 1 file changed +19
-0
lines changed
google/cloud/aiplatform/v1beta1 Expand file tree Collapse file tree 1 file changed +19
-0
lines changed Original file line number Diff line number Diff line change @@ -55,6 +55,25 @@ message MachineSpec {
5555 // The number of accelerators to attach to the machine.
5656 int32 accelerator_count = 3 ;
5757
58+ // Optional. Immutable. The NVIDIA GPU partition size.
59+ //
60+ // When specified, the requested accelerators will be partitioned into
61+ // smaller GPU partitions. For example, if the request is for 8 units of
62+ // NVIDIA A100 GPUs, and gpu_partition_size="1g.10gb", the service will
63+ // create 8 * 7 = 56 partitioned Multi-Instance GPU (MIG) instances.
64+ //
65+ // The partition size must be a value supported by the requested accelerator.
66+ // Refer to
67+ // [NVIDIA GPU
68+ // Partitioning](https://cloud.google.com/kubernetes-engine/docs/how-to/gpus-multi#multi-instance_gpu_partitions)
69+ // for the available partition sizes.
70+ //
71+ // If set, the accelerator_count should be set to 1.
72+ string gpu_partition_size = 7 [
73+ (google.api.field_behavior ) = IMMUTABLE ,
74+ (google.api.field_behavior ) = OPTIONAL
75+ ];
76+
5877 // Immutable. The topology of the TPUs. Corresponds to the TPU topologies
5978 // available from GKE. (Example: tpu_topology: "2x2x1").
6079 string tpu_topology = 4 [(google.api.field_behavior ) = IMMUTABLE ];
You can’t perform that action at this time.
0 commit comments