feat: Expose FullFineTunedResources for full fine tuned deployments

Google APIs · copybara-github · commit c751a014049e · 2025-12-02T12:03:39.000-08:00
PiperOrigin-RevId: 839371231
diff --git a/google/cloud/aiplatform/v1beta1/endpoint.proto b/google/cloud/aiplatform/v1beta1/endpoint.proto
@@ -225,6 +225,10 @@ message DeployedModel {
     string shared_resources = 17 [(google.api.resource_reference) = {
       type: "aiplatform.googleapis.com/DeploymentResourcePool"
     }];
+
+    // Optional. Resources for a full fine tuned model.
+    FullFineTunedResources full_fine_tuned_resources = 36
+        [(google.api.field_behavior) = OPTIONAL];
   }
 
   // Immutable. The ID of the DeployedModel. If not provided upon deployment,
diff --git a/google/cloud/aiplatform/v1beta1/machine_resources.proto b/google/cloud/aiplatform/v1beta1/machine_resources.proto
@@ -270,6 +270,42 @@ message BatchDedicatedResources {
   bool spot = 5 [(google.api.field_behavior) = OPTIONAL];
 }
 
+// Resources for a full fine tuned (FFT) model deployment.
+message FullFineTunedResources {
+  // The type of deployment.
+  enum DeploymentType {
+    // Unspecified deployment type.
+    DEPLOYMENT_TYPE_UNSPECIFIED = 0;
+
+    // Eval deployment type.
+    DEPLOYMENT_TYPE_EVAL = 1;
+
+    // Prod deployment type.
+    DEPLOYMENT_TYPE_PROD = 2;
+  }
+
+  // Required. The kind of deployment.
+  DeploymentType deployment_type = 1 [(google.api.field_behavior) = REQUIRED];
+
+  // Optional. The number of model inference units to use for this deployment.
+  // This can only be specified for DEPLOYMENT_TYPE_PROD.
+  // The following list gives the number of model inference units for different
+  // model types:
+  // * Gemini 2.5 Flash
+  //   * Foundation FMIU: 25
+  //   * Expansion FMIU: 4
+  // * Gemini 2.5 Pro
+  //   * Foundation FMIU: 32
+  //   * Expansion FMIU: 16
+  // * Veo 3.0 (undistilled)
+  //   * Foundation FMIU: 63
+  //   * Expansion FMIU: 7
+  // * Veo 3.0 (distilled)
+  //   * Foundation FMIU: 30
+  //   * Expansion FMIU: 10
+  int32 model_inference_unit_count = 2 [(google.api.field_behavior) = OPTIONAL];
+}
+
 // Statistics information about resource consumption.
 message ResourcesConsumed {
   // Output only. The number of replica hours used. Note that many replicas may