
Commit 04bd623

Google APIs authored and copybara-github committed
feat: Support picosecond timestamp precision in BigQuery Storage API
docs: A comment for method `ReadRows` in service `BigQueryRead` is changed
docs: A comment for message `AppendRowsRequest` is changed
docs: A comment for field `writer_schema` in message `.google.cloud.bigquery.storage.v1.AppendRowsRequest` is changed
docs: A comment for field `rows` in message `.google.cloud.bigquery.storage.v1.AppendRowsRequest` is changed
docs: A comment for field `arrow_rows` in message `.google.cloud.bigquery.storage.v1.AppendRowsRequest` is changed
docs: A comment for field `default_missing_value_interpretation` in message `.google.cloud.bigquery.storage.v1.AppendRowsRequest` is changed
docs: A comment for field `location` in message `.google.cloud.bigquery.storage.v1.WriteStream` is changed

PiperOrigin-RevId: 829486853
1 parent 2223580 commit 04bd623

File tree: 7 files changed, +102 −27 lines


google/cloud/bigquery/storage/v1/arrow.proto

Lines changed: 25 additions & 0 deletions
@@ -58,7 +58,32 @@ message ArrowSerializationOptions {
     ZSTD = 2;
   }

+  // The precision of the timestamp value in the Avro message. This precision
+  // will **only** be applied to the column(s) with the `TIMESTAMP_PICOS` type.
+  enum PicosTimestampPrecision {
+    // Unspecified timestamp precision. The default precision is microseconds.
+    PICOS_TIMESTAMP_PRECISION_UNSPECIFIED = 0;
+
+    // Timestamp values returned by Read API will be truncated to microsecond
+    // level precision. The value will be encoded as Arrow TIMESTAMP type in a
+    // 64 bit integer.
+    TIMESTAMP_PRECISION_MICROS = 1;
+
+    // Timestamp values returned by Read API will be truncated to nanosecond
+    // level precision. The value will be encoded as Arrow TIMESTAMP type in a
+    // 64 bit integer.
+    TIMESTAMP_PRECISION_NANOS = 2;
+
+    // Read API will return full precision picosecond value. The value will be
+    // encoded as a string which conforms to ISO 8601 format.
+    TIMESTAMP_PRECISION_PICOS = 3;
+  }
+
   // The compression codec to use for Arrow buffers in serialized record
   // batches.
   CompressionCodec buffer_compression = 2;
+
+  // Optional. Set timestamp precision option. If not set, the default precision
+  // is microseconds.
+  PicosTimestampPrecision picos_timestamp_precision = 3;
 }
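For context, a rough sketch of how a reader might opt into the new precision setting when creating an Arrow read session. This assumes a Python client regenerated from this proto: the `picos_timestamp_precision` field and `PicosTimestampPrecision` enum are introduced by this commit, and the project/table names are placeholders.

```python
from google.cloud import bigquery_storage_v1
from google.cloud.bigquery_storage_v1 import types

client = bigquery_storage_v1.BigQueryReadClient()

arrow_options = types.ArrowSerializationOptions(
    buffer_compression=types.ArrowSerializationOptions.CompressionCodec.ZSTD,
    # New in this commit: return TIMESTAMP_PICOS columns at full picosecond
    # precision, encoded as ISO 8601 strings instead of 64-bit integers.
    picos_timestamp_precision=(
        types.ArrowSerializationOptions.PicosTimestampPrecision.TIMESTAMP_PRECISION_PICOS
    ),
)

session = client.create_read_session(
    parent="projects/my-project",  # placeholder project
    read_session=types.ReadSession(
        table="projects/my-project/datasets/my_dataset/tables/my_table",  # placeholder table
        data_format=types.DataFormat.ARROW,
        read_options=types.ReadSession.TableReadOptions(
            arrow_serialization_options=arrow_options,
        ),
    ),
    max_stream_count=1,
)
```

Leaving the field unset (or `PICOS_TIMESTAMP_PRECISION_UNSPECIFIED`) keeps the existing microsecond behaviour, so current readers are unaffected.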

google/cloud/bigquery/storage/v1/avro.proto

Lines changed: 25 additions & 0 deletions
@@ -42,6 +42,27 @@ message AvroRows {

 // Contains options specific to Avro Serialization.
 message AvroSerializationOptions {
+  // The precision of the timestamp value in the Avro message. This precision
+  // will **only** be applied to the column(s) with the `TIMESTAMP_PICOS` type.
+  enum PicosTimestampPrecision {
+    // Unspecified timestamp precision. The default precision is microseconds.
+    PICOS_TIMESTAMP_PRECISION_UNSPECIFIED = 0;
+
+    // Timestamp values returned by Read API will be truncated to microsecond
+    // level precision. The value will be encoded as Avro TIMESTAMP type in a
+    // 64 bit integer.
+    TIMESTAMP_PRECISION_MICROS = 1;
+
+    // Timestamp values returned by Read API will be truncated to nanosecond
+    // level precision. The value will be encoded as Avro TIMESTAMP type in a
+    // 64 bit integer.
+    TIMESTAMP_PRECISION_NANOS = 2;
+
+    // Read API will return full precision picosecond value. The value will be
+    // encoded as a string which conforms to ISO 8601 format.
+    TIMESTAMP_PRECISION_PICOS = 3;
+  }
+
   // Enable displayName attribute in Avro schema.
   //
   // The Avro specification requires field names to be alphanumeric. By
@@ -53,4 +74,8 @@ message AvroSerializationOptions {
   // value and populates a "displayName" attribute for every avro field with the
   // original column name.
   bool enable_display_name_attribute = 1;
+
+  // Optional. Set timestamp precision option. If not set, the default precision
+  // is microseconds.
+  PicosTimestampPrecision picos_timestamp_precision = 2;
 }
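The Avro options mirror the Arrow ones. A minimal sketch under the same assumption of a client regenerated from this proto, this time requesting nanosecond truncation (which keeps the 64-bit integer encoding):

```python
from google.cloud.bigquery_storage_v1 import types

read_options = types.ReadSession.TableReadOptions(
    avro_serialization_options=types.AvroSerializationOptions(
        enable_display_name_attribute=True,
        # Truncate TIMESTAMP_PICOS columns to nanoseconds; values stay 64-bit
        # integers in the Avro records rather than ISO 8601 strings.
        picos_timestamp_precision=(
            types.AvroSerializationOptions.PicosTimestampPrecision.TIMESTAMP_PRECISION_NANOS
        ),
    ),
)
```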

google/cloud/bigquery/storage/v1/bigquerystorage_grpc_service_config.json

Lines changed: 19 additions & 0 deletions
@@ -118,6 +118,25 @@
           "RESOURCE_EXHAUSTED"
         ]
       }
+    },
+    {
+      "name": [
+        {
+          "service": "google.cloud.bigquery.storage.v1.StreamMetastorePartitions",
+          "method": "StreamMetastorePartitions"
+        }
+      ],
+      "timeout": "1200s",
+      "retryPolicy": {
+        "initialBackoff": "0.100s",
+        "maxBackoff": "60s",
+        "backoffMultiplier": 1.3,
+        "retryableStatusCodes": [
+          "DEADLINE_EXCEEDED",
+          "UNAVAILABLE",
+          "RESOURCE_EXHAUSTED"
+        ]
+      }
     }
   ]
 }
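This is the standard gRPC service-config retry shape: the nominal delay starts at `initialBackoff`, grows by `backoffMultiplier` after each retryable failure, and is capped at `maxBackoff`, all within the 1200s call timeout. A small illustration of the schedule the config encodes (clients additionally apply jitter, which is omitted here):

```python
# Illustration only: nominal backoff schedule implied by the config above.
initial, multiplier, cap = 0.100, 1.3, 60.0

delay = initial
for attempt in range(1, 6):
    print(f"retry {attempt}: wait up to ~{delay:.3f}s")
    delay = min(delay * multiplier, cap)
# retry 1: ~0.100s, retry 2: ~0.130s, retry 3: ~0.169s, retry 4: ~0.220s, retry 5: ~0.286s
```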

google/cloud/bigquery/storage/v1/bigquerystorage_v1.yaml

Lines changed: 11 additions & 13 deletions
@@ -7,19 +7,6 @@ apis:
 - name: google.cloud.bigquery.storage.v1.BigQueryRead
 - name: google.cloud.bigquery.storage.v1.BigQueryWrite

-backend:
-  rules:
-  - selector: google.cloud.bigquery.storage.v1.BigQueryRead.CreateReadSession
-    deadline: 120.0
-  - selector: google.cloud.bigquery.storage.v1.BigQueryRead.ReadRows
-    deadline: 21600.0
-  - selector: google.cloud.bigquery.storage.v1.BigQueryRead.SplitReadStream
-    deadline: 120.0
-  - selector: 'google.cloud.bigquery.storage.v1.BigQueryWrite.*'
-    deadline: 120.0
-  - selector: google.cloud.bigquery.storage.v1.BigQueryWrite.CreateWriteStream
-    deadline: 600.0
-
 authentication:
   rules:
   - selector: 'google.cloud.bigquery.storage.v1.BigQueryRead.*'
@@ -37,10 +24,21 @@ authentication:
 publishing:
   new_issue_uri: https://issuetracker.google.com/issues/new?component=187149&template=1162659
   documentation_uri: https://cloud.google.com/bigquery/docs/reference/storage/
+  api_short_name: bigquerystorage
+  github_label: 'api: bigquerystorage'
+  doc_tag_prefix: bigquerystorage
+  organization: CLOUD
   library_settings:
   - version: google.cloud.bigquery.storage.v1
     launch_stage: GA
     java_settings:
       library_package: com.google.cloud.bigquery.storage.v1
       service_class_names:
         google.cloud.bigquery.storage.v1.BigQueryRead: BaseBigQueryRead
+      common:
+        destinations:
+        - PACKAGE_MANAGER
+    python_settings:
+      common:
+        destinations:
+        - PACKAGE_MANAGER

google/cloud/bigquery/storage/v1/storage.proto

Lines changed: 8 additions & 11 deletions
@@ -78,9 +78,9 @@ service BigQueryRead {
   }

   // Reads rows from the stream in the format prescribed by the ReadSession.
-  // Each response contains one or more table rows, up to a maximum of 100 MiB
+  // Each response contains one or more table rows, up to a maximum of 128 MB
   // per response; read requests which attempt to read individual rows larger
-  // than 100 MiB will fail.
+  // than 128 MB will fail.
   //
   // Each request also returns a set of stream statistics reflecting the current
   // state of the stream.
@@ -423,8 +423,6 @@ message CreateWriteStreamRequest {
 // Requests larger than this return an error, typically `INVALID_ARGUMENT`.
 message AppendRowsRequest {
   // Arrow schema and data.
-  // Arrow format is an experimental feature only selected for allowlisted
-  // customers.
   message ArrowData {
     // Optional. Arrow Schema used to serialize the data.
     ArrowSchema writer_schema = 1;
@@ -436,8 +434,8 @@ message AppendRowsRequest {
   // ProtoData contains the data rows and schema when constructing append
   // requests.
   message ProtoData {
-    // The protocol buffer schema used to serialize the data. Provide this value
-    // whenever:
+    // Optional. The protocol buffer schema used to serialize the data. Provide
+    // this value whenever:
     //
     // * You send the first request of an RPC connection.
     //
@@ -446,7 +444,7 @@ message AppendRowsRequest {
     // * You specify a new destination table.
     ProtoSchema writer_schema = 1;

-    // Serialized row data in protobuf message format.
+    // Required. Serialized row data in protobuf message format.
     // Currently, the backend expects the serialized rows to adhere to
     // proto2 semantics when appending rows, particularly with respect to
    // how default values are encoded.
@@ -522,8 +520,7 @@ message AppendRowsRequest {
     // Rows in proto format.
     ProtoData proto_rows = 4;

-    // Rows in arrow format. This is an experimental feature only selected for
-    // allowlisted customers.
+    // Rows in arrow format.
     ArrowData arrow_rows = 5;
   }

@@ -553,8 +550,8 @@ message AppendRowsRequest {

   // Optional. Default missing value interpretation for all columns in the
   // table. When a value is specified on an `AppendRowsRequest`, it is applied
-  // to all requests on the connection from that point forward, until a
-  // subsequent `AppendRowsRequest` sets it to a different value.
+  // to all requests from that point forward, until a subsequent
+  // `AppendRowsRequest` sets it to a different value.
   // `missing_value_interpretation` can override
   // `default_missing_value_interpretation`. For example, if you want to write
   // `NULL` instead of using default values for some columns, you can set
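The Optional/Required annotations above match how `AppendRows` connections are used in practice: the writer schema rides on the first request of the connection, and later requests carry only serialized rows. A rough sketch of the two request shapes with the Python client (the stream name and descriptor are placeholders, not taken from this commit):

```python
from google.protobuf import descriptor_pb2
from google.cloud.bigquery_storage_v1 import types

# Placeholder descriptor; a real writer copies this from its generated row
# message (e.g. MyRow.DESCRIPTOR.CopyToProto(...)) so the backend can decode
# the serialized_rows payload.
row_descriptor = descriptor_pb2.DescriptorProto(name="MyRow")

# First request on the connection: writer schema plus rows.
first_request = types.AppendRowsRequest(
    write_stream="projects/my-project/datasets/my_dataset/tables/my_table/streams/_default",
    proto_rows=types.AppendRowsRequest.ProtoData(
        writer_schema=types.ProtoSchema(proto_descriptor=row_descriptor),
        rows=types.ProtoRows(serialized_rows=[b"<serialized MyRow bytes>"]),
    ),
)

# Subsequent requests on the same connection: rows only, no schema.
next_request = types.AppendRowsRequest(
    proto_rows=types.AppendRowsRequest.ProtoData(
        rows=types.ProtoRows(serialized_rows=[b"<serialized MyRow bytes>"]),
    ),
)
```

Both requests would then be fed, in order, to `BigQueryWriteClient.append_rows()`, which streams back one `AppendRowsResponse` per request.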

google/cloud/bigquery/storage/v1/stream.proto

Lines changed: 3 additions & 3 deletions
@@ -328,8 +328,8 @@ message WriteStream {
   // Immutable. Mode of the stream.
   WriteMode write_mode = 7 [(google.api.field_behavior) = IMMUTABLE];

-  // Immutable. The geographic location where the stream's dataset resides. See
-  // https://cloud.google.com/bigquery/docs/locations for supported
+  // Output only. The geographic location where the stream's dataset resides.
+  // See https://cloud.google.com/bigquery/docs/locations for supported
   // locations.
-  string location = 8 [(google.api.field_behavior) = IMMUTABLE];
+  string location = 8 [(google.api.field_behavior) = OUTPUT_ONLY];
 }

google/cloud/bigquery/storage/v1/table.proto

Lines changed: 11 additions & 0 deletions
@@ -17,6 +17,7 @@ syntax = "proto3";
 package google.cloud.bigquery.storage.v1;

 import "google/api/field_behavior.proto";
+import "google/protobuf/wrappers.proto";

 option csharp_namespace = "Google.Cloud.BigQuery.Storage.V1";
 option go_package = "cloud.google.com/go/bigquery/storage/apiv1/storagepb;storagepb";
@@ -178,6 +179,16 @@ message TableFieldSchema {
   // (https://cloud.google.com/bigquery/docs/default-values) for this field.
   string default_value_expression = 10 [(google.api.field_behavior) = OPTIONAL];

+  // Optional. Precision (maximum number of total digits in base 10) for seconds
+  // of TIMESTAMP type.
+  //
+  // Possible values include:
+  //
+  // * 6 (Default, for TIMESTAMP type with microsecond precision)
+  // * 12 (For TIMESTAMP type with picosecond precision)
+  google.protobuf.Int64Value timestamp_precision = 27
+      [(google.api.field_behavior) = OPTIONAL];
+
   // Optional. The subtype of the RANGE, if the type of this field is RANGE. If
   // the type is RANGE, this field is required. Possible values for the field
   // element type of a RANGE include:
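To illustrate the new field, a hypothetical schema entry for a picosecond-precision column, again assuming a Python client regenerated from this proto (in proto-plus clients the `Int64Value` wrapper field can usually be assigned a plain integer):

```python
from google.cloud.bigquery_storage_v1 import types

# Hypothetical column definition: a TIMESTAMP field carried at picosecond
# precision (12 fractional digits of the second). Omit timestamp_precision,
# or set it to 6, for the default microsecond behaviour.
event_ts = types.TableFieldSchema(
    name="event_ts",
    type_=types.TableFieldSchema.Type.TIMESTAMP,
    mode=types.TableFieldSchema.Mode.NULLABLE,
    timestamp_precision=12,
)
```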
