Skip to content

Commit 07ab54b

Browse files
Google APIs and copybara-github
authored and committed
feat: Introduce RAG as context/memory store for Gemini Live API
docs: A comment for message `RagFileParsingConfig` is updated.
docs: A comment for field `global_max_embedding_requests_per_min` in message `.google.cloud.aiplatform.v1beta1.ImportRagFilesConfig` is updated.
PiperOrigin-RevId: 763909021
1 parent d8bb284 commit 07ab54b

2 files changed

Lines changed: 38 additions & 2 deletions

File tree

google/cloud/aiplatform/v1beta1/tool.proto

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -315,6 +315,15 @@ message VertexRagStore {
315315
// Optional. The retrieval config for the Rag query.
316316
RagRetrievalConfig rag_retrieval_config = 6
317317
[(google.api.field_behavior) = OPTIONAL];
318+
319+
// Optional. Currently only supported for Gemini Multimodal Live API.
320+
//
321+
// In Gemini Multimodal Live API, if `store_context` bool is
322+
// true, Gemini will leverage it to automatically memorize the
323+
// interactions between the client and Gemini, and retrieve context when
324+
// needed to augment the response generation for users' ongoing and future
325+
// interactions.
326+
bool store_context = 7 [(google.api.field_behavior) = OPTIONAL];
318327
}
319328

320329
// Retrieve from Vertex AI Search datastore or engine for grounding.

google/cloud/aiplatform/v1beta1/vertex_rag_data.proto

Lines changed: 29 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -295,6 +295,29 @@ message RagCorpus {
295295
singular: "ragCorpus"
296296
};
297297

298+
// The config for the corpus type of the RagCorpus.
299+
message CorpusTypeConfig {
300+
// Config for the document corpus.
301+
message DocumentCorpus {}
302+
303+
// Config for the memory corpus.
304+
message MemoryCorpus {
305+
// The LLM parser to use for the memory corpus.
306+
RagFileParsingConfig.LlmParser llm_parser = 1;
307+
}
308+
309+
// Optional.
310+
// Whether the RagCorpus is used as document store or memory store.
311+
oneof corpus_type_config {
312+
// Optional. Config for the document corpus.
313+
DocumentCorpus document_corpus = 1
314+
[(google.api.field_behavior) = OPTIONAL];
315+
316+
// Optional. Config for the memory corpus.
317+
MemoryCorpus memory_corpus = 2 [(google.api.field_behavior) = OPTIONAL];
318+
}
319+
}
320+
298321
// The backend config of the RagCorpus.
299322
// It can be data store and/or retrieval engine.
300323
oneof backend_config {
@@ -358,6 +381,10 @@ message RagCorpus {
358381
(google.api.field_behavior) = IMMUTABLE,
359382
(google.api.field_behavior) = OPTIONAL
360383
];
384+
385+
// Optional. The corpus type config of the RagCorpus.
386+
CorpusTypeConfig corpus_type_config = 13
387+
[(google.api.field_behavior) = OPTIONAL];
361388
}
362389

363390
// A RagFile contains user data for chunking, embedding and indexing.
@@ -521,7 +548,7 @@ message RagFileParsingConfig {
521548
int32 global_max_parsing_requests_per_min = 3;
522549
}
523550

524-
// Specifies the advanced parsing for RagFiles.
551+
// Specifies the LLM parsing for RagFiles.
525552
message LlmParser {
526553
// The name of a LLM model used for parsing.
527554
// Format:
@@ -652,7 +679,7 @@ message ImportRagFilesConfig {
652679
// Optional. The max number of queries per minute that the indexing pipeline
653680
// job is allowed to make to the embedding model specified in the project.
654681
// Please follow the quota usage guideline of the embedding model you use to
655-
// set the value properly. If this value is not specified,
682+
// set the value properly. If this value is not specified,
656683
// max_embedding_requests_per_min will be used by indexing pipeline job as the
657684
// global limit.
658685
int32 global_max_embedding_requests_per_min = 18

0 commit comments

Comments
 (0)