feat: add DeploymentStage for CreateEndpointOperationMetadata and DeployModelOperationMetadata

Google APIs · copybara-github · commit 0e31cfedb652 · 2025-07-30T20:14:27.000-07:00
docs: update MutateDeployedModel documentation

PiperOrigin-RevId: 789150946
diff --git a/google/cloud/aiplatform/v1/BUILD.bazel b/google/cloud/aiplatform/v1/BUILD.bazel
@@ -49,6 +49,7 @@ proto_library(
         "deployed_model_ref.proto",
         "deployment_resource_pool.proto",
         "deployment_resource_pool_service.proto",
+        "deployment_stage.proto",
         "encryption_spec.proto",
         "endpoint.proto",
         "endpoint_service.proto",
diff --git a/google/cloud/aiplatform/v1/deployment_stage.proto b/google/cloud/aiplatform/v1/deployment_stage.proto
@@ -0,0 +1,55 @@
+// Copyright 2025 Google LLC
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+syntax = "proto3";
+
+package google.cloud.aiplatform.v1;
+
+option csharp_namespace = "Google.Cloud.AIPlatform.V1";
+option go_package = "cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb";
+option java_multiple_files = true;
+option java_outer_classname = "DeploymentStageProto";
+option java_package = "com.google.cloud.aiplatform.v1";
+option php_namespace = "Google\\Cloud\\AIPlatform\\V1";
+option ruby_package = "Google::Cloud::AIPlatform::V1";
+
+// Progress stage of a deployment. Numeric values are not in declaration order.
+enum DeploymentStage {
+  // Default value. This value is unused.
+  DEPLOYMENT_STAGE_UNSPECIFIED = 0;
+
+  // The deployment is initializing and setting up the environment.
+  STARTING_DEPLOYMENT = 5;
+
+  // The deployment is preparing the model assets.
+  PREPARING_MODEL = 6;
+
+  // The deployment is creating the underlying serving cluster.
+  CREATING_SERVING_CLUSTER = 7;
+
+  // The deployment is adding nodes to the serving cluster.
+  ADDING_NODES_TO_CLUSTER = 8;
+
+  // The deployment is getting the container image for the model server.
+  GETTING_CONTAINER_IMAGE = 9;
+
+  // The deployment is starting the model server.
+  STARTING_MODEL_SERVER = 3;
+
+  // The deployment is performing finalization steps.
+  FINISHING_UP = 4;
+
+  // The deployment has terminated.
+  DEPLOYMENT_TERMINATED = 10;
+}
diff --git a/google/cloud/aiplatform/v1/endpoint_service.proto b/google/cloud/aiplatform/v1/endpoint_service.proto
@@ -20,6 +20,7 @@ import "google/api/annotations.proto";
 import "google/api/client.proto";
 import "google/api/field_behavior.proto";
 import "google/api/resource.proto";
+import "google/cloud/aiplatform/v1/deployment_stage.proto";
 import "google/cloud/aiplatform/v1/endpoint.proto";
 import "google/cloud/aiplatform/v1/operation.proto";
 import "google/longrunning/operations.proto";
@@ -138,9 +139,9 @@ service EndpointService {
   }
 
   // Updates an existing deployed model. Updatable fields include
-  // `min_replica_count`, `max_replica_count`, `autoscaling_metric_specs`,
-  // `disable_container_logging` (v1 only), and `enable_container_logging`
-  // (v1beta1 only).
+  // `min_replica_count`, `max_replica_count`, `required_replica_count`,
+  // `autoscaling_metric_specs`, `disable_container_logging` (v1 only), and
+  // `enable_container_logging` (v1beta1 only).
   rpc MutateDeployedModel(MutateDeployedModelRequest)
       returns (google.longrunning.Operation) {
     option (google.api.http) = {
@@ -193,6 +194,11 @@ message CreateEndpointRequest {
 message CreateEndpointOperationMetadata {
   // The operation generic information.
   GenericOperationMetadata generic_metadata = 1;
+
+  // Output only. The current deployment stage of the model. Populated only if
+  // this CreateEndpoint request also deploys a model.
+  DeploymentStage deployment_stage = 2
+      [(google.api.field_behavior) = OUTPUT_ONLY];
 }
 
 // Request message for
@@ -372,6 +378,10 @@ message DeployModelResponse {
 message DeployModelOperationMetadata {
   // The operation generic information.
   GenericOperationMetadata generic_metadata = 1;
+
+  // Output only. The current deployment stage of the model being deployed.
+  DeploymentStage deployment_stage = 2
+      [(google.api.field_behavior) = OUTPUT_ONLY];
 }
 
 // Request message for
@@ -433,6 +443,8 @@ message MutateDeployedModelRequest {
   // * `max_replica_count` in either
   // [DedicatedResources][google.cloud.aiplatform.v1.DedicatedResources] or
   // [AutomaticResources][google.cloud.aiplatform.v1.AutomaticResources]
+  // * `required_replica_count` in
+  // [DedicatedResources][google.cloud.aiplatform.v1.DedicatedResources]
   // * [autoscaling_metric_specs][google.cloud.aiplatform.v1.DedicatedResources.autoscaling_metric_specs]
   // * `disable_container_logging` (v1 only)
   // * `enable_container_logging` (v1beta1 only)