// Copyright 2021 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

  14. syntax = "proto3";
  15. package google.cloud.aiplatform.v1beta1.schema;
  16. option csharp_namespace = "Google.Cloud.AIPlatform.V1Beta1.Schema";
  17. option go_package = "google.golang.org/genproto/googleapis/cloud/aiplatform/v1beta1/schema;schema";
  18. option java_multiple_files = true;
  19. option java_outer_classname = "DatasetMetadataProto";
  20. option java_package = "com.google.cloud.aiplatform.v1beta1.schema";
  21. option php_namespace = "Google\\Cloud\\AIPlatform\\V1beta1\\Schema";
  22. option ruby_package = "Google::Cloud::AIPlatform::V1beta1::Schema";
  23. // The metadata of Datasets that contain Image DataItems.
  24. message ImageDatasetMetadata {
  25. // Points to a YAML file stored on Google Cloud Storage describing payload of
  26. // the Image DataItems that belong to this Dataset.
  27. string data_item_schema_uri = 1;
  28. // Google Cloud Storage Bucket name that contains the blob data of this
  29. // Dataset.
  30. string gcs_bucket = 2;
  31. }
  32. // The metadata of Datasets that contain Text DataItems.
  33. message TextDatasetMetadata {
  34. // Points to a YAML file stored on Google Cloud Storage describing payload of
  35. // the Text DataItems that belong to this Dataset.
  36. string data_item_schema_uri = 1;
  37. // Google Cloud Storage Bucket name that contains the blob data of this
  38. // Dataset.
  39. string gcs_bucket = 2;
  40. }
  41. // The metadata of Datasets that contain Video DataItems.
  42. message VideoDatasetMetadata {
  43. // Points to a YAML file stored on Google Cloud Storage describing payload of
  44. // the Video DataItems that belong to this Dataset.
  45. string data_item_schema_uri = 1;
  46. // Google Cloud Storage Bucket name that contains the blob data of this
  47. // Dataset.
  48. string gcs_bucket = 2;
  49. }
  50. // The metadata of Datasets that contain tables data.
  51. message TablesDatasetMetadata {
  52. // The tables Dataset's data source. The Dataset doesn't store the data
  53. // directly, but only pointer(s) to its data.
  54. message InputConfig {
  55. oneof source {
  56. GcsSource gcs_source = 1;
  57. BigQuerySource bigquery_source = 2;
  58. }
  59. }
  60. message GcsSource {
  61. // Cloud Storage URI of one or more files. Only CSV files are supported.
  62. // The first line of the CSV file is used as the header.
  63. // If there are multiple files, the header is the first line of
  64. // the lexicographically first file, the other files must either
  65. // contain the exact same header or omit the header.
  66. repeated string uri = 1;
  67. }
  68. message BigQuerySource {
  69. // The URI of a BigQuery table.
  70. // e.g. bq://projectId.bqDatasetId.bqTableId
  71. string uri = 1;
  72. }
  73. InputConfig input_config = 1;
  74. }
  75. // The metadata of Datasets that contain time series data.
  76. message TimeSeriesDatasetMetadata {
  77. // The time series Dataset's data source. The Dataset doesn't store the data
  78. // directly, but only pointer(s) to its data.
  79. message InputConfig {
  80. oneof source {
  81. GcsSource gcs_source = 1;
  82. BigQuerySource bigquery_source = 2;
  83. }
  84. }
  85. message GcsSource {
  86. // Cloud Storage URI of one or more files. Only CSV files are supported.
  87. // The first line of the CSV file is used as the header.
  88. // If there are multiple files, the header is the first line of
  89. // the lexicographically first file, the other files must either
  90. // contain the exact same header or omit the header.
  91. repeated string uri = 1;
  92. }
  93. message BigQuerySource {
  94. // The URI of a BigQuery table.
  95. string uri = 1;
  96. }
  97. InputConfig input_config = 1;
  98. // The column name of the time series identifier column that identifies the
  99. // time series.
  100. string time_series_identifier_column = 2;
  101. // The column name of the time column that identifies time order in the time
  102. // series.
  103. string time_column = 3;
  104. }