// Copyright 2021 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package google.cloud.aiplatform.v1beta1.schema;

option csharp_namespace = "Google.Cloud.AIPlatform.V1Beta1.Schema";
option go_package = "cloud.google.com/go/aiplatform/apiv1beta1/schema/schemapb;schemapb";
option java_multiple_files = true;
option java_outer_classname = "DatasetMetadataProto";
option java_package = "com.google.cloud.aiplatform.v1beta1.schema";
option php_namespace = "Google\\Cloud\\AIPlatform\\V1beta1\\Schema";
option ruby_package = "Google::Cloud::AIPlatform::V1beta1::Schema";

// The metadata of Datasets that contain Image DataItems.
message ImageDatasetMetadata {
  // Points to a YAML file stored on Google Cloud Storage describing payload of
  // the Image DataItems that belong to this Dataset.
  string data_item_schema_uri = 1;

  // Google Cloud Storage Bucket name that contains the blob data of this
  // Dataset.
  string gcs_bucket = 2;
}

// The metadata of Datasets that contain Text DataItems.
message TextDatasetMetadata {
  // Points to a YAML file stored on Google Cloud Storage describing payload of
  // the Text DataItems that belong to this Dataset.
  string data_item_schema_uri = 1;

  // Google Cloud Storage Bucket name that contains the blob data of this
  // Dataset.
  string gcs_bucket = 2;
}

// The metadata of Datasets that contain Video DataItems.
message VideoDatasetMetadata {
  // Points to a YAML file stored on Google Cloud Storage describing payload of
  // the Video DataItems that belong to this Dataset.
  string data_item_schema_uri = 1;

  // Google Cloud Storage Bucket name that contains the blob data of this
  // Dataset.
  string gcs_bucket = 2;
}

// The metadata of Datasets that contain tables data.
message TablesDatasetMetadata {
  // The tables Dataset's data source. The Dataset doesn't store the data
  // directly, but only pointer(s) to its data.
  message InputConfig {
    // Location of the data; at most one member of this oneof is set.
    oneof source {
      // The data is read from CSV file(s) on Cloud Storage.
      GcsSource gcs_source = 1;

      // The data is read from a BigQuery table.
      BigQuerySource bigquery_source = 2;
    }
  }

  // A set of CSV files on Cloud Storage.
  message GcsSource {
    // Cloud Storage URI of one or more files. Only CSV files are supported.
    // The first line of the CSV file is used as the header.
    // If there are multiple files, the header is the first line of
    // the lexicographically first file, the other files must either
    // contain the exact same header or omit the header.
    repeated string uri = 1;
  }

  // A single BigQuery table.
  message BigQuerySource {
    // The URI of a BigQuery table.
    // e.g. bq://projectId.bqDatasetId.bqTableId
    string uri = 1;
  }

  // Pointer(s) to the data backing this tables Dataset.
  InputConfig input_config = 1;
}

// The metadata of Datasets that contain time series data.
message TimeSeriesDatasetMetadata {
  // The time series Dataset's data source. The Dataset doesn't store the data
  // directly, but only pointer(s) to its data.
  message InputConfig {
    // Location of the data; at most one member of this oneof is set.
    oneof source {
      // The data is read from CSV file(s) on Cloud Storage.
      GcsSource gcs_source = 1;

      // The data is read from a BigQuery table.
      BigQuerySource bigquery_source = 2;
    }
  }

  // A set of CSV files on Cloud Storage.
  message GcsSource {
    // Cloud Storage URI of one or more files. Only CSV files are supported.
    // The first line of the CSV file is used as the header.
    // If there are multiple files, the header is the first line of
    // the lexicographically first file, the other files must either
    // contain the exact same header or omit the header.
    repeated string uri = 1;
  }

  // A single BigQuery table.
  message BigQuerySource {
    // The URI of a BigQuery table.
    // e.g. bq://projectId.bqDatasetId.bqTableId
    string uri = 1;
  }

  // Pointer(s) to the data backing this time series Dataset.
  InputConfig input_config = 1;

  // The column name of the time series identifier column that identifies the
  // time series.
  string time_series_identifier_column = 2;

  // The column name of the time column that identifies time order in the time
  // series.
  string time_column = 3;
}