@@ -254,6 +254,22 @@ message RagCorpus {
254254 singular : "ragCorpus"
255255 };
256256
257+ // The backend configuration of the RagCorpus; at most one member is set.
258+ // It can be a data store and/or a retrieval engine.
259+ oneof backend_config {
260+ // Optional. Immutable. The configuration of the Vector DB backend.
261+ RagVectorDbConfig vector_db_config = 9 [
262+ (google.api.field_behavior ) = OPTIONAL ,
263+ (google.api.field_behavior ) = IMMUTABLE
264+ ];
265+
266+ // Optional. Immutable. The configuration of the Vertex AI Search backend.
267+ VertexAiSearchConfig vertex_ai_search_config = 10 [
268+ (google.api.field_behavior ) = OPTIONAL ,
269+ (google.api.field_behavior ) = IMMUTABLE
270+ ];
271+ }
272+
257273 // Output only. The resource name of the RagCorpus.
258274 string name = 1 [(google.api.field_behavior ) = OUTPUT_ONLY ];
259275
@@ -290,23 +306,8 @@ message RagCorpus {
290306 // Output only. RagCorpus state.
291307 CorpusStatus corpus_status = 8 [(google.api.field_behavior ) = OUTPUT_ONLY ];
292308
293- // The backend config of the RagCorpus.
294- // It can be data store and/or retrieval engine.
295- oneof backend_config {
296- // Optional. Immutable. The config for the Vector DBs.
297- RagVectorDbConfig vector_db_config = 9 [
298- (google.api.field_behavior ) = OPTIONAL ,
299- (google.api.field_behavior ) = IMMUTABLE
300- ];
301-
302- // Optional. Immutable. The config for the Vertex AI Search.
303- VertexAiSearchConfig vertex_ai_search_config = 10 [
304- (google.api.field_behavior ) = OPTIONAL ,
305- (google.api.field_behavior ) = IMMUTABLE
306- ];
307- }
308- // Output only. The number of RagFiles in the RagCorpus.
309- int32 rag_files_count = 11 ;
309+ // Output only. Number of RagFiles in the RagCorpus.
310+ int32 rag_files_count = 11 [(google.api.field_behavior ) = OUTPUT_ONLY ];
310311}
311312
312313// A RagFile contains user data for chunking, embedding and indexing.
@@ -386,6 +387,25 @@ message RagFile {
386387 FileStatus file_status = 13 [(google.api.field_behavior ) = OUTPUT_ONLY ];
387388}
388389
390+ // A RagChunk holds the text of one chunk of a RagFile, together with its
391+ // associated metadata (the page span of the chunk, when available).
392+ message RagChunk {
393+ // The range of document pages covered by the chunk; both ends inclusive.
394+ message PageSpan {
395+ // Page where the chunk starts in the document. Inclusive. 1-indexed.
396+ int32 first_page = 1 ;
397+
398+ // Page where the chunk ends in the document. Inclusive. 1-indexed.
399+ int32 last_page = 2 ;
400+ }
401+
402+ // The text content of the chunk.
403+ string text = 1 ;
404+
405+ // Optional. If populated, the pages where the chunk starts and ends in the document.
406+ optional PageSpan page_span = 2 ;
407+ }
408+
389409// Specifies the size and overlap of chunks for RagFiles.
390410message RagFileChunkingConfig {
391411 // Specifies the fixed length chunking config.
@@ -445,7 +465,8 @@ message RagFileParsingConfig {
445465 // Specifies the advanced parsing for RagFiles.
446466 message LlmParser {
447467 // The name of an LLM model used for parsing.
448- // Format: `gemini-1.5-pro-002`
468+ // Format:
469+ // * `projects/{project_id}/locations/{location}/publishers/{publisher}/models/{model}`
449470 string model_name = 1 ;
450471
451472 // The maximum number of requests the job is allowed to make to the
0 commit comments