// Copyright 2023 Google LLC // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. syntax = "proto3"; package google.cloud.aiplatform.v1beta1; import "google/api/field_behavior.proto"; import "google/api/resource.proto"; import "google/cloud/aiplatform/v1beta1/io.proto"; import "google/protobuf/timestamp.proto"; option csharp_namespace = "Google.Cloud.AIPlatform.V1Beta1"; option go_package = "cloud.google.com/go/aiplatform/apiv1beta1/aiplatformpb;aiplatformpb"; option java_multiple_files = true; option java_outer_classname = "VertexRagDataProto"; option java_package = "com.google.cloud.aiplatform.v1beta1"; option php_namespace = "Google\\Cloud\\AIPlatform\\V1beta1"; option ruby_package = "Google::Cloud::AIPlatform::V1beta1"; // A RagCorpus is a RagFile container and a project can have multiple // RagCorpora. message RagCorpus { option (google.api.resource) = { type: "aiplatform.googleapis.com/RagCorpus" pattern: "projects/{project}/locations/{location}/ragCorpora/{rag_corpus}" plural: "ragCorpora" singular: "ragCorpus" }; // Output only. The resource name of the RagCorpus. string name = 1 [(google.api.field_behavior) = OUTPUT_ONLY]; // Required. The display name of the RagCorpus. // The name can be up to 128 characters long and can consist of any UTF-8 // characters. string display_name = 2 [(google.api.field_behavior) = REQUIRED]; // Optional. The description of the RagCorpus. string description = 3 [(google.api.field_behavior) = OPTIONAL]; // Output only. Timestamp when this RagCorpus was created. google.protobuf.Timestamp create_time = 4 [(google.api.field_behavior) = OUTPUT_ONLY]; // Output only. Timestamp when this RagCorpus was last updated. google.protobuf.Timestamp update_time = 5 [(google.api.field_behavior) = OUTPUT_ONLY]; } // A RagFile contains user data for chunking, embedding and indexing. message RagFile { option (google.api.resource) = { type: "aiplatform.googleapis.com/RagFile" pattern: "projects/{project}/locations/{location}/ragCorpora/{rag_corpus}/ragFiles/{rag_file}" plural: "ragFiles" singular: "ragFile" }; // The type of the RagFile. enum RagFileType { // RagFile type is unspecified. RAG_FILE_TYPE_UNSPECIFIED = 0; // RagFile type is TXT. RAG_FILE_TYPE_TXT = 1; // RagFile type is PDF. RAG_FILE_TYPE_PDF = 2; } // The origin location of the RagFile if it is imported from Google Cloud // Storage or Google Drive. oneof rag_file_source { // Output only. Google Cloud Storage location of the RagFile. // It does not support wildcards in the GCS uri for now. GcsSource gcs_source = 8 [(google.api.field_behavior) = OUTPUT_ONLY]; // Output only. Google Drive location. Supports importing individual files // as well as Google Drive folders. GoogleDriveSource google_drive_source = 9 [(google.api.field_behavior) = OUTPUT_ONLY]; // Output only. The RagFile is encapsulated and uploaded in the // UploadRagFile request. DirectUploadSource direct_upload_source = 10 [(google.api.field_behavior) = OUTPUT_ONLY]; } // Output only. The resource name of the RagFile. string name = 1 [(google.api.field_behavior) = OUTPUT_ONLY]; // Required. The display name of the RagFile. // The name can be up to 128 characters long and can consist of any UTF-8 // characters. string display_name = 2 [(google.api.field_behavior) = REQUIRED]; // Optional. The description of the RagFile. string description = 3 [(google.api.field_behavior) = OPTIONAL]; // Output only. The size of the RagFile in bytes. int64 size_bytes = 4 [(google.api.field_behavior) = OUTPUT_ONLY]; // Output only. The type of the RagFile. RagFileType rag_file_type = 5 [(google.api.field_behavior) = OUTPUT_ONLY]; // Output only. Timestamp when this RagFile was created. google.protobuf.Timestamp create_time = 6 [(google.api.field_behavior) = OUTPUT_ONLY]; // Output only. Timestamp when this RagFile was last updated. google.protobuf.Timestamp update_time = 7 [(google.api.field_behavior) = OUTPUT_ONLY]; } // Specifies the size and overlap of chunks for RagFiles. message RagFileChunkingConfig { // The size of the chunks. int32 chunk_size = 1; // The overlap between chunks. int32 chunk_overlap = 2; } // Config for uploading RagFile. message UploadRagFileConfig { // Specifies the size and overlap of chunks after uploading RagFile. RagFileChunkingConfig rag_file_chunking_config = 1; } // Config for importing RagFiles. message ImportRagFilesConfig { oneof import_source { // Google Cloud Storage location. Supports importing individual files as // well as entire Google Cloud Storage directories. Sample formats: // - `gs://bucket_name/my_directory/object_name/my_file.txt` // - `gs://bucket_name/my_directory` GcsSource gcs_source = 2; // Google Drive location. Supports importing individual files as // well as Google Drive folders. GoogleDriveSource google_drive_source = 3; } // Specifies the size and overlap of chunks after importing RagFiles. RagFileChunkingConfig rag_file_chunking_config = 4; }