UNPKG

@google-cloud/bigquery

Version:

Google BigQuery Client Library for Node.js

1,065 lines (1,023 loc) 264 kB
// Copyright 2024 Google LLC // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // https://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. /** * BigQuery API. Ambient namespace holding the type aliases that describe the API's data structures. */ declare namespace bigquery { /** * Aggregate metrics for classification/classifier models. For multi-class models, the metrics are either macro-averaged or micro-averaged. When macro-averaged, the metrics are calculated for each label and then an unweighted average is taken of those values. When micro-averaged, the metric is calculated globally by counting the total number of correctly predicted rows. */ type IAggregateClassificationMetrics = { /** * Accuracy is the fraction of predictions given the correct label. For multiclass this is a micro-averaged metric. */ accuracy?: number; /** * The F1 score is an average of recall and precision. For multiclass this is a macro-averaged metric. */ f1Score?: number; /** * Logarithmic Loss. For multiclass this is a macro-averaged metric. */ logLoss?: number; /** * Precision is the fraction of actual positive predictions that had positive actual labels. For multiclass this is a macro-averaged metric treating each class as a binary classifier. */ precision?: number; /** * Recall is the fraction of actual positive labels that were given a positive prediction. For multiclass this is a macro-averaged metric. */ recall?: number; /** * Area Under a ROC Curve. For multiclass this is a macro-averaged metric. */ rocAuc?: number; /** * Threshold at which the metrics are computed.
For binary classification models this is the positive class threshold. For multi-class classification models this is the confidence threshold. */ threshold?: number; }; /** * Represents privacy policy associated with "aggregation threshold" method. */ type IAggregationThresholdPolicy = { /** * Optional. The privacy unit column(s) associated with this policy. For now, only one column per data source object (table, view) is allowed as a privacy unit column. Representing as a repeated field in metadata for extensibility to multiple columns in future. Duplicates and Repeated struct fields are not allowed. For nested fields, use dot notation ("outer.inner") */ privacyUnitColumns?: Array<string>; /** * Optional. The threshold for the "aggregation threshold" policy. */ threshold?: string; }; /** * Input/output argument of a function or a stored procedure. */ type IArgument = { /** * Optional. Defaults to FIXED_TYPE. */ argumentKind?: 'ARGUMENT_KIND_UNSPECIFIED' | 'FIXED_TYPE' | 'ANY_TYPE'; /** * Required unless argument_kind = ANY_TYPE. */ dataType?: IStandardSqlDataType; /** * Optional. Whether the argument is an aggregate function parameter. Must be unset for routine types other than AGGREGATE_FUNCTION. For AGGREGATE_FUNCTION, if set to false, it is equivalent to adding "NOT AGGREGATE" clause in DDL; Otherwise, it is equivalent to omitting "NOT AGGREGATE" clause in DDL. */ isAggregate?: boolean; /** * Optional. Specifies whether the argument is input or output. Can be set for procedures only. */ mode?: 'MODE_UNSPECIFIED' | 'IN' | 'OUT' | 'INOUT'; /** * Optional. The name of this argument. Can be absent for function return argument. */ name?: string; }; /** * Arima coefficients. */ type IArimaCoefficients = { /** * Auto-regressive coefficients, an array of double. */ autoRegressiveCoefficients?: Array<number>; /** * Intercept coefficient, just a double not an array. */ interceptCoefficient?: number; /** * Moving-average coefficients, an array of double.
*/ movingAverageCoefficients?: Array<number>; }; /** * ARIMA model fitting metrics. */ type IArimaFittingMetrics = { /** * AIC. */ aic?: number; /** * Log-likelihood. */ logLikelihood?: number; /** * Variance. */ variance?: number; }; /** * Model evaluation metrics for ARIMA forecasting models. */ type IArimaForecastingMetrics = { /** * ARIMA model fitting metrics. */ arimaFittingMetrics?: Array<IArimaFittingMetrics>; /** * Repeated as there can be many metric sets (one for each model) in auto-arima and the large-scale case. */ arimaSingleModelForecastingMetrics?: Array<IArimaSingleModelForecastingMetrics>; /** * Whether the ARIMA model was fitted with drift. It is always false when d is not 1. */ hasDrift?: Array<boolean>; /** * Non-seasonal order. */ nonSeasonalOrder?: Array<IArimaOrder>; /** * Seasonal periods. Repeated because multiple periods are supported for one time series. */ seasonalPeriods?: Array< | 'SEASONAL_PERIOD_TYPE_UNSPECIFIED' | 'NO_SEASONALITY' | 'DAILY' | 'WEEKLY' | 'MONTHLY' | 'QUARTERLY' | 'YEARLY' >; /** * Id to differentiate different time series for the large-scale case. */ timeSeriesId?: Array<string>; }; /** * ARIMA model information. */ type IArimaModelInfo = { /** * ARIMA coefficients. */ arimaCoefficients?: IArimaCoefficients; /** * ARIMA fitting metrics. */ arimaFittingMetrics?: IArimaFittingMetrics; /** * Whether the ARIMA model was fitted with drift. It is always false when d is not 1. */ hasDrift?: boolean; /** * If true, holiday_effect is a part of time series decomposition result. */ hasHolidayEffect?: boolean; /** * If true, spikes_and_dips is a part of time series decomposition result. */ hasSpikesAndDips?: boolean; /** * If true, step_changes is a part of time series decomposition result. */ hasStepChanges?: boolean; /** * Non-seasonal order. */ nonSeasonalOrder?: IArimaOrder; /** * Seasonal periods. Repeated because multiple periods are supported for one time series.
*/ seasonalPeriods?: Array< | 'SEASONAL_PERIOD_TYPE_UNSPECIFIED' | 'NO_SEASONALITY' | 'DAILY' | 'WEEKLY' | 'MONTHLY' | 'QUARTERLY' | 'YEARLY' >; /** * The time_series_id value for this time series. It will be one of the unique values from the time_series_id_column specified during ARIMA model training. Only present when time_series_id_column training option was used. */ timeSeriesId?: string; /** * The tuple of time_series_ids identifying this time series. It will be one of the unique tuples of values present in the time_series_id_columns specified during ARIMA model training. Only present when time_series_id_columns training option was used and the order of values here is the same as the order of time_series_id_columns. */ timeSeriesIds?: Array<string>; }; /** * ARIMA order; can be used for both non-seasonal and seasonal parts. */ type IArimaOrder = { /** * Order of the differencing part. */ d?: string; /** * Order of the autoregressive part. */ p?: string; /** * Order of the moving-average part. */ q?: string; }; /** * (Auto-)ARIMA fitting result. Wrap everything in ArimaResult for easier refactoring if we want to use model-specific iteration results. */ type IArimaResult = { /** * This message is repeated because there are multiple ARIMA models fitted in auto-arima. For non-auto-arima model, its size is one. */ arimaModelInfo?: Array<IArimaModelInfo>; /** * Seasonal periods. Repeated because multiple periods are supported for one time series. */ seasonalPeriods?: Array< | 'SEASONAL_PERIOD_TYPE_UNSPECIFIED' | 'NO_SEASONALITY' | 'DAILY' | 'WEEKLY' | 'MONTHLY' | 'QUARTERLY' | 'YEARLY' >; }; /** * Model evaluation metrics for a single ARIMA forecasting model. */ type IArimaSingleModelForecastingMetrics = { /** * ARIMA fitting metrics. */ arimaFittingMetrics?: IArimaFittingMetrics; /** * Whether the ARIMA model was fitted with drift. It is always false when d is not 1. */ hasDrift?: boolean; /** * If true, holiday_effect is a part of time series decomposition result.
*/ hasHolidayEffect?: boolean; /** * If true, spikes_and_dips is a part of time series decomposition result. */ hasSpikesAndDips?: boolean; /** * If true, step_changes is a part of time series decomposition result. */ hasStepChanges?: boolean; /** * Non-seasonal order. */ nonSeasonalOrder?: IArimaOrder; /** * Seasonal periods. Repeated because multiple periods are supported for one time series. */ seasonalPeriods?: Array< | 'SEASONAL_PERIOD_TYPE_UNSPECIFIED' | 'NO_SEASONALITY' | 'DAILY' | 'WEEKLY' | 'MONTHLY' | 'QUARTERLY' | 'YEARLY' >; /** * The time_series_id value for this time series. It will be one of the unique values from the time_series_id_column specified during ARIMA model training. Only present when time_series_id_column training option was used. */ timeSeriesId?: string; /** * The tuple of time_series_ids identifying this time series. It will be one of the unique tuples of values present in the time_series_id_columns specified during ARIMA model training. Only present when time_series_id_columns training option was used and the order of values here is the same as the order of time_series_id_columns. */ timeSeriesIds?: Array<string>; }; /** * Specifies the audit configuration for a service. The configuration determines which permission types are logged, and what identities, if any, are exempted from logging. An AuditConfig must have one or more AuditLogConfigs. If there are AuditConfigs for both `allServices` and a specific service, the union of the two AuditConfigs is used for that service: the log_types specified in each AuditConfig are enabled, and the exempted_members in each AuditLogConfig are exempted.
Example Policy with multiple AuditConfigs: { "audit_configs": [ { "service": "allServices", "audit_log_configs": [ { "log_type": "DATA_READ", "exempted_members": [ "user:jose@example.com" ] }, { "log_type": "DATA_WRITE" }, { "log_type": "ADMIN_READ" } ] }, { "service": "sampleservice.googleapis.com", "audit_log_configs": [ { "log_type": "DATA_READ" }, { "log_type": "DATA_WRITE", "exempted_members": [ "user:aliya@example.com" ] } ] } ] } For sampleservice, this policy enables DATA_READ, DATA_WRITE and ADMIN_READ logging. It also exempts `jose@example.com` from DATA_READ logging, and `aliya@example.com` from DATA_WRITE logging. */ type IAuditConfig = { /** * The configuration for logging of each type of permission. */ auditLogConfigs?: Array<IAuditLogConfig>; /** * Specifies a service that will be enabled for audit logging. For example, `storage.googleapis.com`, `cloudsql.googleapis.com`. `allServices` is a special value that covers all services. */ service?: string; }; /** * Provides the configuration for logging a type of permissions. Example: { "audit_log_configs": [ { "log_type": "DATA_READ", "exempted_members": [ "user:jose@example.com" ] }, { "log_type": "DATA_WRITE" } ] } This enables 'DATA_READ' and 'DATA_WRITE' logging, while exempting jose@example.com from DATA_READ logging. */ type IAuditLogConfig = { /** * Specifies the identities that do not cause logging for this type of permission. Follows the same format of Binding.members. */ exemptedMembers?: Array<string>; /** * The log type that this config enables. */ logType?: | 'LOG_TYPE_UNSPECIFIED' | 'ADMIN_READ' | 'DATA_WRITE' | 'DATA_READ'; }; /** * Avro-specific options for external data sources. */ type IAvroOptions = { /** * Optional. If sourceFormat is set to "AVRO", indicates whether to interpret logical types as the corresponding BigQuery data type (for example, TIMESTAMP), instead of using the raw type (for example, INTEGER).
*/ useAvroLogicalTypes?: boolean; }; /** * Reason why BI Engine didn't accelerate the query (or sub-query). */ type IBiEngineReason = { /** * Output only. High-level BI Engine reason for partial or disabled acceleration. */ code?: | 'CODE_UNSPECIFIED' | 'NO_RESERVATION' | 'INSUFFICIENT_RESERVATION' | 'UNSUPPORTED_SQL_TEXT' | 'INPUT_TOO_LARGE' | 'OTHER_REASON' | 'TABLE_EXCLUDED'; /** * Output only. Free-form human-readable reason for partial or disabled acceleration. */ message?: string; }; /** * Statistics for a BI Engine specific query. Populated as part of JobStatistics2. */ type IBiEngineStatistics = { /** * Output only. Specifies which mode of BI Engine acceleration was performed (if any). */ accelerationMode?: | 'BI_ENGINE_ACCELERATION_MODE_UNSPECIFIED' | 'BI_ENGINE_DISABLED' | 'PARTIAL_INPUT' | 'FULL_INPUT' | 'FULL_QUERY'; /** * Output only. Specifies which mode of BI Engine acceleration was performed (if any). */ biEngineMode?: | 'ACCELERATION_MODE_UNSPECIFIED' | 'DISABLED' | 'PARTIAL' | 'FULL'; /** * In case of DISABLED or PARTIAL bi_engine_mode, these contain the explanatory reasons as to why BI Engine could not accelerate. In case the full query was accelerated, this field is not populated. */ biEngineReasons?: Array<IBiEngineReason>; }; /** * Configuration for BigLake managed tables. */ type IBigLakeConfiguration = { /** * Required. The connection specifying the credentials to be used to read and write to external storage, such as Cloud Storage. The connection_id can have the form "<project\_id>.<location\_id>.<connection\_id>" or "projects/<project\_id>/locations/<location\_id>/connections/<connection\_id>". */ connectionId?: string; /** * Required. The file format the table data is stored in. */ fileFormat?: 'FILE_FORMAT_UNSPECIFIED' | 'PARQUET'; /** * Required. The fully qualified location prefix of the external folder where table data is stored. The '*' wildcard character is not allowed.
The URI should be in the format "gs://bucket/path_to_table/" */ storageUri?: string; /** * Required. The table format the metadata-only snapshots are stored in. */ tableFormat?: 'TABLE_FORMAT_UNSPECIFIED' | 'ICEBERG'; }; /** * Deprecated. Every field of this type is documented as deprecated. */ type IBigQueryModelTraining = { /** * Deprecated. */ currentIteration?: number; /** * Deprecated. */ expectedTotalIterations?: string; }; /** * Information related to a Bigtable column. */ type IBigtableColumn = { /** * Optional. The encoding of the values when the type is not STRING. Acceptable encoding values are: TEXT - indicates values are alphanumeric text strings. BINARY - indicates values are encoded using HBase Bytes.toBytes family of functions. 'encoding' can also be set at the column family level. However, the setting at this level takes precedence if 'encoding' is set at both levels. */ encoding?: string; /** * Optional. If the qualifier is not a valid BigQuery field identifier i.e. does not match [a-zA-Z][a-zA-Z0-9_]*, a valid identifier must be provided as the column field name and is used as field name in queries. NOTE(review): the pattern is reconstructed; the generated text read "a-zA-Z*" - confirm against the BigQuery REST reference. */ fieldName?: string; /** * Optional. If this is set, only the latest version of the value in this column is exposed. 'onlyReadLatest' can also be set at the column family level. However, the setting at this level takes precedence if 'onlyReadLatest' is set at both levels. */ onlyReadLatest?: boolean; /** * [Required] Qualifier of the column. Columns in the parent column family that has this exact qualifier are exposed as `<family field name>.<column field name>` field. If the qualifier is valid UTF-8 string, it can be specified in the qualifier_string field. Otherwise, a base-64 encoded value must be set to qualifier_encoded. The column field name is the same as the column qualifier. However, if the qualifier is not a valid BigQuery field identifier i.e. does not match [a-zA-Z][a-zA-Z0-9_]*, a valid identifier must be provided as field_name. NOTE(review): the placeholder names and the pattern are reconstructed; the generated text read ". field" and "a-zA-Z*" - confirm against the BigQuery REST reference. */ qualifierEncoded?: string; /** * Qualifier string. */ qualifierString?: string; /** * Optional. The type to convert the value in cells of this column.
The values are expected to be encoded using HBase Bytes.toBytes function when using the BINARY encoding value. Following BigQuery types are allowed (case-sensitive): * BYTES * STRING * INTEGER * FLOAT * BOOLEAN * JSON Default type is BYTES. 'type' can also be set at the column family level. However, the setting at this level takes precedence if 'type' is set at both levels. */ type?: string; }; /** * Information related to a Bigtable column family. */ type IBigtableColumnFamily = { /** * Optional. Lists of columns that should be exposed as individual fields as opposed to a list of (column name, value) pairs. All columns whose qualifier matches a qualifier in this list can be accessed as `<family field name>.<column field name>`. Other columns can be accessed as a list through the `<family field name>.Column` field. NOTE(review): the placeholder names are reconstructed; the generated text had lost them ("accessed as .." and "through .Column field") - confirm against the BigQuery REST reference. */ columns?: Array<IBigtableColumn>; /** * Optional. The encoding of the values when the type is not STRING. Acceptable encoding values are: TEXT - indicates values are alphanumeric text strings. BINARY - indicates values are encoded using HBase Bytes.toBytes family of functions. This can be overridden for a specific column by listing that column in 'columns' and specifying an encoding for it. */ encoding?: string; /** * Identifier of the column family. */ familyId?: string; /** * Optional. If this is set only the latest version of value are exposed for all columns in this column family. This can be overridden for a specific column by listing that column in 'columns' and specifying a different setting for that column. */ onlyReadLatest?: boolean; /** * Optional. The type to convert the value in cells of this column family. The values are expected to be encoded using HBase Bytes.toBytes function when using the BINARY encoding value. Following BigQuery types are allowed (case-sensitive): * BYTES * STRING * INTEGER * FLOAT * BOOLEAN * JSON Default type is BYTES. This can be overridden for a specific column by listing that column in 'columns' and specifying a type for it.
*/ type?: string; }; /** * Options specific to Google Cloud Bigtable data sources. */ type IBigtableOptions = { /** * Optional. List of column families to expose in the table schema along with their types. This list restricts the column families that can be referenced in queries and specifies their value types. You can use this list to do type conversions - see the 'type' field for more details. If you leave this list empty, all column families are present in the table schema and their values are read as BYTES. During a query only the column families referenced in that query are read from Bigtable. */ columnFamilies?: Array<IBigtableColumnFamily>; /** * Optional. If this field is true, then the column families that are not specified in columnFamilies list are not exposed in the table schema. Otherwise, they are read with BYTES type values. The default value is false. */ ignoreUnspecifiedColumnFamilies?: boolean; /** * Optional. If this field is true, then each column family will be read as a single JSON column. Otherwise they are read as a repeated cell structure containing timestamp/value tuples. The default value is false. */ outputColumnFamiliesAsJson?: boolean; /** * Optional. If this field is true, then the rowkey column families will be read and converted to string. Otherwise they are read with BYTES type values and users need to manually cast them with CAST if necessary. The default value is false. */ readRowkeyAsString?: boolean; }; /** * Evaluation metrics for binary classification/classifier models. */ type IBinaryClassificationMetrics = { /** * Aggregate classification metrics. */ aggregateClassificationMetrics?: IAggregateClassificationMetrics; /** * Binary confusion matrix at multiple thresholds. */ binaryConfusionMatrixList?: Array<IBinaryConfusionMatrix>; /** * Label representing the negative class. */ negativeLabel?: string; /** * Label representing the positive class. */ positiveLabel?: string; }; /** * Confusion matrix for binary classification models.
*/ type IBinaryConfusionMatrix = { /** * The fraction of predictions given the correct label. */ accuracy?: number; /** * The equally weighted average of recall and precision. */ f1Score?: number; /** * Number of false samples predicted as false. NOTE(review): by the usual confusion-matrix terminology this wording describes true negatives, while the wording on trueNegatives describes false negatives; the two descriptions look swapped - confirm against the API before relying on either. */ falseNegatives?: string; /** * Number of false samples predicted as true. */ falsePositives?: string; /** * Threshold value used when computing each of the following metrics. */ positiveClassThreshold?: number; /** * The fraction of actual positive predictions that had positive actual labels. */ precision?: number; /** * The fraction of actual positive labels that were given a positive prediction. */ recall?: number; /** * Number of true samples predicted as false. NOTE(review): by the usual confusion-matrix terminology this wording describes false negatives, while the wording on falseNegatives describes true negatives; the two descriptions look swapped - confirm against the API before relying on either. */ trueNegatives?: string; /** * Number of true samples predicted as true. */ truePositives?: string; }; /** * Associates `members`, or principals, with a `role`. */ type IBinding = { /** * The condition that is associated with this binding. If the condition evaluates to `true`, then this binding applies to the current request. If the condition evaluates to `false`, then this binding does not apply to the current request. However, a different role binding might grant the same role to one or more of the principals in this binding. To learn which resources support conditions in their IAM policies, see the [IAM documentation](https://cloud.google.com/iam/help/conditions/resource-policies). */ condition?: IExpr; /** * Specifies the principals requesting access for a Google Cloud resource. `members` can have the following values: * `allUsers`: A special identifier that represents anyone who is on the internet; with or without a Google account. * `allAuthenticatedUsers`: A special identifier that represents anyone who is authenticated with a Google account or a service account. Does not include identities that come from external identity providers (IdPs) through identity federation. * `user:{emailid}`: An email address that represents a specific Google account.
For example, `alice@example.com`. * `serviceAccount:{emailid}`: An email address that represents a Google service account. For example, `my-other-app@appspot.gserviceaccount.com`. * `serviceAccount:{projectid}.svc.id.goog[{namespace}/{kubernetes-sa}]`: An identifier for a [Kubernetes service account](https://cloud.google.com/kubernetes-engine/docs/how-to/kubernetes-service-accounts). For example, `my-project.svc.id.goog[my-namespace/my-kubernetes-sa]`. * `group:{emailid}`: An email address that represents a Google group. For example, `admins@example.com`. * `domain:{domain}`: The G Suite domain (primary) that represents all the users of that domain. For example, `google.com` or `example.com`. * `principal://iam.googleapis.com/locations/global/workforcePools/{pool_id}/subject/{subject_attribute_value}`: A single identity in a workforce identity pool. * `principalSet://iam.googleapis.com/locations/global/workforcePools/{pool_id}/group/{group_id}`: All workforce identities in a group. * `principalSet://iam.googleapis.com/locations/global/workforcePools/{pool_id}/attribute.{attribute_name}/{attribute_value}`: All workforce identities with a specific attribute value. * `principalSet://iam.googleapis.com/locations/global/workforcePools/{pool_id}/*`: All identities in a workforce identity pool. * `principal://iam.googleapis.com/projects/{project_number}/locations/global/workloadIdentityPools/{pool_id}/subject/{subject_attribute_value}`: A single identity in a workload identity pool. * `principalSet://iam.googleapis.com/projects/{project_number}/locations/global/workloadIdentityPools/{pool_id}/group/{group_id}`: A workload identity pool group. * `principalSet://iam.googleapis.com/projects/{project_number}/locations/global/workloadIdentityPools/{pool_id}/attribute.{attribute_name}/{attribute_value}`: All identities in a workload identity pool with a certain attribute.
* `principalSet://iam.googleapis.com/projects/{project_number}/locations/global/workloadIdentityPools/{pool_id}/*`: All identities in a workload identity pool. * `deleted:user:{emailid}?uid={uniqueid}`: An email address (plus unique identifier) representing a user that has been recently deleted. For example, `alice@example.com?uid=123456789012345678901`. If the user is recovered, this value reverts to `user:{emailid}` and the recovered user retains the role in the binding. * `deleted:serviceAccount:{emailid}?uid={uniqueid}`: An email address (plus unique identifier) representing a service account that has been recently deleted. For example, `my-other-app@appspot.gserviceaccount.com?uid=123456789012345678901`. If the service account is undeleted, this value reverts to `serviceAccount:{emailid}` and the undeleted service account retains the role in the binding. * `deleted:group:{emailid}?uid={uniqueid}`: An email address (plus unique identifier) representing a Google group that has been recently deleted. For example, `admins@example.com?uid=123456789012345678901`. If the group is recovered, this value reverts to `group:{emailid}` and the recovered group retains the role in the binding. * `deleted:principal://iam.googleapis.com/locations/global/workforcePools/{pool_id}/subject/{subject_attribute_value}`: Deleted single identity in a workforce identity pool. For example, `deleted:principal://iam.googleapis.com/locations/global/workforcePools/my-pool-id/subject/my-subject-attribute-value`. */ members?: Array<string>; /** * Role that is assigned to the list of `members`, or principals. For example, `roles/viewer`, `roles/editor`, or `roles/owner`. For an overview of the IAM roles and permissions, see the [IAM documentation](https://cloud.google.com/iam/docs/roles-overview). For a list of the available pre-defined roles, see [here](https://cloud.google.com/iam/docs/understanding-roles). */ role?: string; }; /** * Deprecated. Every field of this type is documented as deprecated. */ type IBqmlIterationResult = { /** * Deprecated.
*/ durationMs?: string; /** * Deprecated. */ evalLoss?: number; /** * Deprecated. */ index?: number; /** * Deprecated. */ learnRate?: number; /** * Deprecated. */ trainingLoss?: number; }; /** * Deprecated. Every field of this type is documented as deprecated. */ type IBqmlTrainingRun = { /** * Deprecated. */ iterationResults?: Array<IBqmlIterationResult>; /** * Deprecated. */ startTime?: string; /** * Deprecated. */ state?: string; /** * Deprecated. */ trainingOptions?: { earlyStop?: boolean; l1Reg?: number; l2Reg?: number; learnRate?: number; learnRateStrategy?: string; lineSearchInitLearnRate?: number; maxIteration?: string; minRelProgress?: number; warmStart?: boolean; }; }; /** * Representative value of a categorical feature. */ type ICategoricalValue = { /** * Counts of all categories for the categorical feature. If there are more than ten categories, we return top ten (by count) and return one more CategoryCount with category "_OTHER_" and count as aggregate counts of remaining categories. */ categoryCounts?: Array<ICategoryCount>; }; /** * Represents the count of a single category within the cluster. */ type ICategoryCount = { /** * The name of the category. */ category?: string; /** * The count of training samples matching the category within the cluster. */ count?: string; }; /** * Information about base table and clone time of a table clone. */ type ICloneDefinition = { /** * Required. Reference describing the ID of the table that was cloned. */ baseTableReference?: ITableReference; /** * Required. The time at which the base table was cloned. This value is reported in the JSON response using RFC3339 format. */ cloneTime?: string; }; /** * Message containing the information about one cluster. */ type ICluster = { /** * Centroid id. */ centroidId?: string; /** * Count of training data rows that were assigned to this cluster. */ count?: string; /** * Values of highly variant features for this cluster. */ featureValues?: Array<IFeatureValue>; }; /** * Information about a single cluster for clustering model.
*/ type IClusterInfo = { /** * Centroid id. */ centroidId?: string; /** * Cluster radius, the average distance from centroid to each point assigned to the cluster. */ clusterRadius?: number; /** * Cluster size, the total number of points assigned to the cluster. */ clusterSize?: string; }; /** * Configures table clustering. */ type IClustering = { /** * One or more fields on which data should be clustered. Only top-level, non-repeated, simple-type fields are supported. The ordering of the clustering fields should be prioritized from most to least important for filtering purposes. Additional information on limitations can be found here: https://cloud.google.com/bigquery/docs/creating-clustered-tables#limitations */ fields?: Array<string>; }; /** * Evaluation metrics for clustering models. */ type IClusteringMetrics = { /** * Information for all clusters. */ clusters?: Array<ICluster>; /** * Davies-Bouldin index. */ daviesBouldinIndex?: number; /** * Mean of squared distances from each sample to its cluster centroid. */ meanSquaredDistance?: number; }; /** * Confusion matrix for multi-class classification models. */ type IConfusionMatrix = { /** * Confidence threshold used when computing the entries of the confusion matrix. */ confidenceThreshold?: number; /** * One row per actual label. */ rows?: Array<IRow>; }; /** * A connection-level property to customize query behavior. Under JDBC, these correspond directly to connection properties passed to the DriverManager. Under ODBC, these correspond to properties in the connection string. Currently supported connection properties: * **dataset_project_id**: represents the default project for datasets that are used in the query. Setting the system variable `@@dataset_project_id` achieves the same behavior. For more information about system variables, see: https://cloud.google.com/bigquery/docs/reference/system-variables * **time_zone**: represents the default timezone used to run the query.
* **session_id**: associates the query with a given session. * **query_label**: associates the query with a given job label. If set, all subsequent queries in a script or session will have this label. For the format in which you can specify a query label, see labels in the JobConfiguration resource type: https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#jobconfiguration Additional properties are allowed, but ignored. Specifying multiple connection properties with the same key returns an error. */ type IConnectionProperty = { /** * The key of the property to set. */ key?: string; /** * The value of the property to set. */ value?: string; }; /** * Information related to a CSV data source. */ type ICsvOptions = { /** * Optional. Indicates if BigQuery should accept rows that are missing trailing optional columns. If true, BigQuery treats missing trailing columns as null values. If false, records with missing trailing columns are treated as bad records, and if there are too many bad records, an invalid error is returned in the job result. The default value is false. */ allowJaggedRows?: boolean; /** * Optional. Indicates if BigQuery should allow quoted data sections that contain newline characters in a CSV file. The default value is false. */ allowQuotedNewlines?: boolean; /** * Optional. The character encoding of the data. The supported values are UTF-8, ISO-8859-1, UTF-16BE, UTF-16LE, UTF-32BE, and UTF-32LE. The default value is UTF-8. BigQuery decodes the data after the raw, binary data has been split using the values of the quote and fieldDelimiter properties. */ encoding?: string; /** * Optional. The separator character for fields in a CSV file. The separator is interpreted as a single byte. For files encoded in ISO-8859-1, any single character can be used as a separator. For files encoded in UTF-8, characters represented in decimal range 1-127 (U+0001-U+007F) can be used without any modification. UTF-8 characters encoded with multiple bytes (i.e.
U+0080 and above) will have only the first byte used for separating fields. The remaining bytes will be treated as a part of the field. BigQuery also supports the escape sequence "\t" (U+0009) to specify a tab separator. The default value is comma (",", U+002C). */ fieldDelimiter?: string; /** * Optional. A custom string that will represent a NULL value in CSV import data. */ nullMarker?: string; /** * Optional. Indicates if the embedded ASCII control characters (the first 32 characters in the ASCII-table, from '\x00' to '\x1F') are preserved. */ preserveAsciiControlCharacters?: boolean; /** * Optional. The value that is used to quote data sections in a CSV file. BigQuery converts the string to ISO-8859-1 encoding, and then uses the first byte of the encoded string to split the data in its raw, binary state. The default value is a double-quote ("). If your data does not contain quoted sections, set the property value to an empty string. If your data contains quoted newline characters, you must also set the allowQuotedNewlines property to true. To include the specific quote character within a quoted value, precede it with an additional matching quote character. For example, if you want to escape the default character ' " ', use ' "" '. */ quote?: string; /** * Optional. The number of rows at the top of a CSV file that BigQuery will skip when reading the data. The default value is 0. This property is useful if you have header rows in the file that should be skipped. When autodetect is on, the behavior is the following: * skipLeadingRows unspecified - Autodetect tries to detect headers in the first row. If they are not detected, the row is read as data. Otherwise data is read starting from the second row. * skipLeadingRows is 0 - Instructs autodetect that there are no headers and data should be read starting from the first row. * skipLeadingRows = N > 0 - Autodetect skips N-1 rows and tries to detect headers in row N.
If headers are not detected, row N is just skipped. Otherwise row N is used to extract column names for the detected schema. */ skipLeadingRows?: string; }; /** * Options for data format adjustments. */ type IDataFormatOptions = { /** * Optional. Output timestamp as usec int64. Default is false. */ useInt64Timestamp?: boolean; }; /** * Statistics for data-masking. */ type IDataMaskingStatistics = { /** * Whether any accessed data was protected by the data masking. */ dataMaskingApplied?: boolean; }; /** * Data split result. This contains references to the training and evaluation data tables that were used to train the model. */ type IDataSplitResult = { /** * Table reference of the evaluation data after split. */ evaluationTable?: ITableReference; /** * Table reference of the test data after split. */ testTable?: ITableReference; /** * Table reference of the training data after split. */ trainingTable?: ITableReference; }; type IDataset = { /** * Optional. An array of objects that define dataset access for one or more entities. You can set this property when inserting or updating a dataset in order to control who is allowed to access the data. If unspecified at dataset creation time, BigQuery adds default dataset access for the following entities: access.specialGroup: projectReaders; access.role: READER; access.specialGroup: projectWriters; access.role: WRITER; access.specialGroup: projectOwners; access.role: OWNER; access.userByEmail: [dataset creator email]; access.role: OWNER; */ access?: Array<{ /** * [Pick one] A grant authorizing all resources of a particular type in a particular dataset access to this dataset. Only views are supported for now. The role field is not required when this field is set. If that dataset is deleted and re-created, its access needs to be granted again via an update operation. */ dataset?: IDatasetAccessEntry; /** * [Pick one] A domain to grant access to. 
Any users signed in with the domain specified will be granted the specified access. Example: "example.com". Maps to IAM policy member "domain:DOMAIN". */ domain?: string; /** * [Pick one] An email address of a Google Group to grant access to. Maps to IAM policy member "group:GROUP". */ groupByEmail?: string; /** * [Pick one] Some other type of member that appears in the IAM Policy but isn't a user, group, domain, or special group. */ iamMember?: string; /** * An IAM role ID that should be granted to the user, group, or domain specified in this access entry. The following legacy mappings will be applied: OWNER <=> roles/bigquery.dataOwner WRITER <=> roles/bigquery.dataEditor READER <=> roles/bigquery.dataViewer This field will accept any of the above formats, but will return only the legacy format. For example, if you set this field to "roles/bigquery.dataOwner", it will be returned back as "OWNER". */ role?: string; /** * [Pick one] A routine from a different dataset to grant access to. Queries executed against that routine will have read access to views/tables/routines in this dataset. Only UDF is supported for now. The role field is not required when this field is set. If that routine is updated by any user, access to the routine needs to be granted again via an update operation. */ routine?: IRoutineReference; /** * [Pick one] A special group to grant access to. Possible values include: projectOwners: Owners of the enclosing project. projectReaders: Readers of the enclosing project. projectWriters: Writers of the enclosing project. allAuthenticatedUsers: All authenticated BigQuery users. Maps to similarly-named IAM members. */ specialGroup?: string; /** * [Pick one] An email address of a user to grant access to. For example: fred@example.com. Maps to IAM policy member "user:EMAIL" or "serviceAccount:EMAIL". */ userByEmail?: string; /** * [Pick one] A view from a different dataset to grant access to. 
Queries executed against that view will have read access to views/tables/routines in this dataset. The role field is not required when this field is set. If that view is updated by any user, access to the view needs to be granted again via an update operation. */ view?: ITableReference; }>; /** * Output only. The time when this dataset was created, in milliseconds since the epoch. */ creationTime?: string; /** * Required. A reference that identifies the dataset. */ datasetReference?: IDatasetReference; /** * Optional. Defines the default collation specification of future tables created in the dataset. If a table is created in this dataset without table-level default collation, then the table inherits the dataset default collation, which is applied to the string fields that do not have explicit collation specified. A change to this field affects only tables created afterwards, and does not alter the existing tables. The following values are supported: * 'und:ci': undetermined locale, case insensitive. * '': empty string. Default to case-sensitive behavior. */ defaultCollation?: string; /** * The default encryption key for all tables in the dataset. Once this property is set, all newly-created partitioned tables in the dataset will have encryption key set to this value, unless table creation request (or query) overrides the key. */ defaultEncryptionConfiguration?: IEncryptionConfiguration; /** * This default partition expiration, expressed in milliseconds. When new time-partitioned tables are created in a dataset where this property is set, the table will inherit this value, propagated as the `TimePartitioning.expirationMs` property on the new table. If you set `TimePartitioning.expirationMs` explicitly when creating a table, the `defaultPartitionExpirationMs` of the containing dataset is ignored. 
When creating a partitioned table, if `defaultPartitionExpirationMs` is set, the `defaultTableExpirationMs` value is ignored and the table will not be inherit a table expiration deadline. */ defaultPartitionExpirationMs?: string; /** * Optional. Defines the default rounding mode specification of new tables created within this dataset. During table creation, if this field is specified, the table within this dataset will inherit the default rounding mode of the dataset. Setting the default rounding mode on a table overrides this option. Existing tables in the dataset are unaffected. If columns are defined during that table creation, they will immediately inherit the table's default rounding mode, unless otherwise specified. */ defaultRoundingMode?: | 'ROUNDING_MODE_UNSPECIFIED' | 'ROUND_HALF_AWAY_FROM_ZERO' | 'ROUND_HALF_EVEN'; /** * Optional. The default lifetime of all tables in the dataset, in milliseconds. The minimum lifetime value is 3600000 milliseconds (one hour). To clear an existing default expiration with a PATCH request, set to 0. Once this property is set, all newly-created tables in the dataset will have an expirationTime property set to the creation time plus the value in this property, and changing the value will only affect new tables, not existing ones. When the expirationTime for a given table is reached, that table will be deleted automatically. If a table's expirationTime is modified or removed before the table expires, or if you provide an explicit expirationTime when creating a table, that value takes precedence over the default expiration time indicated by this property. */ defaultTableExpirationMs?: string; /** * Optional. A user-friendly description of the dataset. */ description?: string; /** * Output only. A hash of the resource. */ etag?: string; /** * Optional. Reference to a read-only external dataset defined in data catalogs outside of BigQuery. Filled out when the dataset type is EXTERNAL. 
*/ externalDatasetReference?: IExternalDatasetReference; /** * Optional. A descriptive name for the dataset. */ friendlyName?: string; /** * Output only. The fully-qualified unique name of the dataset in the format projectId:datasetId. The dataset name without the project name is given in the datasetId field. When creating a new dataset, leave this field blank, and instead specify the datasetId field. */ id?: string; /** * Optional. TRUE if the dataset and its table names are case-insensitive, otherwise FALSE. By default, this is FALSE, which means the dataset and its table names are case-sensitive. This field does not affect routine references. */ isCaseInsensitive?: boolean; /** * Output only. The resource type. */ kind?: string; /** * The labels associated with this dataset. You can use these to organize and group your datasets. You can set this property when inserting or updating a dataset. See Creating and Updating Dataset Labels for more information. */ labels?: {[key: string]: string}; /** * Output only. The date when this dataset was last modified, in milliseconds since the epoch. */ lastModifiedTime?: string; /** * Optional. The source dataset reference when the dataset is of type LINKED. For all other dataset types it is not set. This field cannot be updated once it is set. Any attempt to update this field using Update and Patch API Operations will be ignored. */ linkedDatasetSource?: ILinkedDatasetSource; /** * The geographic location where the dataset should reside. See https://cloud.google.com/bigquery/docs/locations for supported locations. */ location?: string; /** * Optional. Defines the time travel window in hours. The value can be from 48 to 168 hours (2 to 7 days). The default value is 168 hours if this is not set. */ maxTimeTravelHours?: string; /** * Output only. Reserved for future use. */ satisfiesPzi?: boolean; /** * Output only. Reserved for future use. */ satisfiesPzs?: boolean; /** * Output only. 
A URL that can be used to access the resource again. You can use this URL in Get or Update requests to the resource. */ selfLink?: string; /** * Optional. Updates storage_billing_model for the dataset. */ storageBillingModel?: | 'STORAGE_BILLING_MODEL_UNSPECIFIED' | 'LOGICAL' | 'PHYSICAL'; /** * Output only. Tags for the Dataset. */ tags?: Array<{ /** * Required. The namespaced friendly name of the tag key, e.g. "12345/environment" where 12345 is org id. */ tagKey?: string; /** * Required. The friendly short name of the tag value, e.g. "production". */ tagValue?: string; }>; /** * Output only. Same as `type` in `ListFormatDataset`. The type of the dataset, one of: * DEFAULT - only accessible by owner and authorized accounts, * PUBLIC - accessible by everyone, * LINKED - linked dataset, * EXTERNAL - dataset with definition in external metadata catalog. -- *BIGLAKE_METASTORE - dataset that references a database created in BigLakeMetastore service. -- */ type?: string; }; /** * Grants all resources of particular types in a particular dataset read access to the current dataset. Similar to how individually authorized views work, updates to any resource granted through its dataset (including creation of new resources) requires read permission to referenced resources, plus write permission to the authorizing dataset. */ type IDatasetAccessEntry = { /** * The dataset this entry applies to */ dataset?: IDatasetReference; /** * Which resources in the dataset this entry applies to. Currently, only views are supported, but additional target types may be added in the future. */ targetTypes?: Array<'TARGET_TYPE_UNSPECIFIED' | 'VIEWS' | 'ROUTINES'>; }; /** * Response format for a page of results when listing datasets. */ type IDatasetList = { /** * An array of the dataset resources in the project. Each resource contains basic information. For full information about a particular dataset resource, use the Datasets: get method. 
This property is omitted when there are no datasets in the project. */ datasets?: Array<{ /** * The dataset reference. Use this property to access specific parts of the dataset's ID, such as project ID or dataset ID. */ datasetReference?: IDatasetReference; /** * An alternate name for the dataset. The friendly name is purely decorative in nature. */ friendlyName?: string; /** * The fully-qualified, unique, opaque ID of the dataset. */ id?: string; /** * The resource type. This property always returns the value "bigquery#dataset" */ kind?: string; /** * The labels associated with this dataset. You can use these to organize and group your datasets. */ labels?: {[key: string]: string}; /** * The geographic location where the dataset resides. */ location?: string; }>; /** * Output only. A hash value of the results page. You can use this property to determine if the page has changed since the last request. */ etag?: string; /** * Output only. The resource type. This property always returns the value "bigquery#datasetList" */