feat: Copy v1beta1 preview SDK to GA directory

feat: Refactor rag_store and rag_retrieval to use v1 protos PiperOrigin-RevId: 699287935
googleapis · Nov 22, 2024 · bdc077d · bdc077d
1 parent 1487846
commit bdc077d
Show file tree

Hide file tree

Showing 10 changed files with 1,262 additions and 2 deletions.
diff --git a/tests/unit/vertex_rag/conftest.py → tests/unit/vertex_rag/v1beta1/conftest.py b/tests/unit/vertex_rag/conftest.py → tests/unit/vertex_rag/v1beta1/conftest.py
diff --git a/tests/unit/vertex_rag/test_rag_constants.py → .../vertex_rag/v1beta1/test_rag_constants.py b/tests/unit/vertex_rag/test_rag_constants.py → .../vertex_rag/v1beta1/test_rag_constants.py
diff --git a/tests/unit/vertex_rag/test_rag_data.py → .../unit/vertex_rag/v1beta1/test_rag_data.py b/tests/unit/vertex_rag/test_rag_data.py → .../unit/vertex_rag/v1beta1/test_rag_data.py
diff --git a/tests/unit/vertex_rag/test_rag_retrieval.py → .../vertex_rag/v1beta1/test_rag_retrieval.py b/tests/unit/vertex_rag/test_rag_retrieval.py → .../vertex_rag/v1beta1/test_rag_retrieval.py
@@ -16,13 +16,13 @@
 #
 import importlib
 from google.cloud import aiplatform
+import test_rag_constants as tc
 from vertexai.preview import rag
 from google.cloud.aiplatform_v1beta1 import (
     VertexRagServiceClient,
 )
 import mock
 import pytest
-import test_rag_constants as tc
 
 
 @pytest.fixture

diff --git a/tests/unit/vertex_rag/test_rag_store.py → ...unit/vertex_rag/v1beta1/test_rag_store.py b/tests/unit/vertex_rag/test_rag_store.py → ...unit/vertex_rag/v1beta1/test_rag_store.py
@@ -14,10 +14,10 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
+import test_rag_constants as tc
 from vertexai.preview import rag
 from vertexai.preview.generative_models import Tool
 import pytest
-import test_rag_constants as tc
 
 
 @pytest.mark.usefixtures("google_auth_mock")

diff --git a/vertexai/rag/__init__.py b/vertexai/rag/__init__.py
@@ -0,0 +1,89 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2024 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+# from vertexai.rag.rag_data import (
+#     create_corpus,
+#     update_corpus,
+#     list_corpora,
+#     get_corpus,
+#     delete_corpus,
+#     upload_file,
+#     import_files,
+#     import_files_async,
+#     get_file,
+#     list_files,
+#     delete_file,
+# )
+
+from vertexai.rag.rag_retrieval import (
+    retrieval_query,
+)
+
+from vertexai.rag.rag_store import (
+    Retrieval,
+    VertexRagStore,
+)
+from vertexai.rag.utils.resources import (
+    EmbeddingModelConfig,
+    JiraQuery,
+    JiraSource,
+    Pinecone,
+    RagCorpus,
+    RagFile,
+    RagManagedDb,
+    RagResource,
+    SharePointSource,
+    SharePointSources,
+    SlackChannel,
+    SlackChannelsSource,
+    VertexFeatureStore,
+    VertexVectorSearch,
+    Weaviate,
+)
+
+
+__all__ = (
+    "EmbeddingModelConfig",
+    "JiraQuery",
+    "JiraSource",
+    "Pinecone",
+    "RagCorpus",
+    "RagFile",
+    "RagManagedDb",
+    "RagResource",
+    "Retrieval",
+    "SharePointSource",
+    "SharePointSources",
+    "SlackChannel",
+    "SlackChannelsSource",
+    "VertexFeatureStore",
+    "VertexRagStore",
+    "VertexVectorSearch",
+    "Weaviate",
+    # "create_corpus",
+    # "delete_corpus",
+    # "delete_file",
+    # "get_corpus",
+    # "get_file",
+    # "import_files",
+    # "import_files_async",
+    # "list_corpora",
+    # "list_files",
+    "retrieval_query",
+    # "upload_file",
+    # "update_corpus",
+)
diff --git a/vertexai/rag/rag_retrieval.py b/vertexai/rag/rag_retrieval.py
@@ -0,0 +1,179 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2024 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+"""Retrieval query to get relevant contexts."""
+
+import re
+from typing import List, Optional
+import warnings
+
+from google.cloud.aiplatform import initializer
+from google.cloud.aiplatform_v1 import RagQuery
+from google.cloud.aiplatform_v1 import RagRetrievalConfig
+from google.cloud.aiplatform_v1 import RetrieveContextsRequest
+from google.cloud.aiplatform_v1 import RetrieveContextsResponse
+from vertexai.rag.utils import _gapic_utils
+from vertexai.rag.utils.resources import RagResource
+
+
+def retrieval_query(
+    text: str,
+    rag_resources: Optional[List[RagResource]] = None,
+    rag_corpora: Optional[List[str]] = None,
+    similarity_top_k: Optional[int] = None,
+    vector_distance_threshold: Optional[float] = None,
+    rag_retrieval_config: Optional[RagRetrievalConfig] = None,
+) -> RetrieveContextsResponse:
+    """Retrieve top k relevant docs/chunks.
+
+    Example usage:
+    ```
+    import vertexai
+
+    vertexai.init(project="my-project")
+
+    results = vertexai.preview.rag.retrieval_query(
+        text="Why is the sky blue?",
+        rag_resources=[vertexai.preview.rag.RagResource(
+            rag_corpus="projects/my-project/locations/us-central1/ragCorpora/rag-corpus-1",
+            rag_file_ids=["rag-file-1", "rag-file-2", ...],
+        )],
+        similarity_top_k=2,
+        vector_distance_threshold=0.5,
+        vector_search_alpha=0.5,
+    )
+    ```
+
+    Args:
+        text: The query in text format to get relevant contexts.
+        rag_resources: A list of RagResource. It can be used to specify corpus
+            only or ragfiles. Currently only support one corpus or multiple files
+            from one corpus. In the future we may open up multiple corpora support.
+        rag_corpora: If rag_resources is not specified, use rag_corpora as a list
+            of rag corpora names.
+        similarity_top_k: The number of contexts to retrieve.
+        vector_distance_threshold: Optional. Only return contexts with vector
+            distance smaller than the threshold.
+        vector_search_alpha: Optional. Controls the weight between dense and
+            sparse vector search results. The range is [0, 1], where 0 means
+            sparse vector search only and 1 means dense vector search only.
+            The default value is 0.5.
+        rag_retrieval_config: Optional. The config containing the retrieval
+            parameters, including similarity_top_k, vector_distance_threshold,
+            vector_search_alpha, and hybrid_search.
+
+    Returns:
+        RetrieveContextsResonse.
+    """
+    parent = initializer.global_config.common_location_path()
+
+    client = _gapic_utils.create_rag_service_client()
+
+    if rag_resources:
+        if len(rag_resources) > 1:
+            raise ValueError("Currently only support 1 RagResource.")
+        name = rag_resources[0].rag_corpus
+    elif rag_corpora:
+        if len(rag_corpora) > 1:
+            raise ValueError("Currently only support 1 RagCorpus.")
+        name = rag_corpora[0]
+        warnings.warn(
+            "rag_corpora is deprecated. Please use rag_resources instead.",
+            DeprecationWarning,
+        )
+    else:
+        raise ValueError("rag_resources or rag_corpora must be specified.")
+
+    data_client = _gapic_utils.create_rag_data_service_client()
+    if data_client.parse_rag_corpus_path(name):
+        rag_corpus_name = name
+    elif re.match("^{}$".format(_gapic_utils._VALID_RESOURCE_NAME_REGEX), name):
+        rag_corpus_name = parent + "/ragCorpora/" + name
+    else:
+        raise ValueError(
+            f"Invalid RagCorpus name: {rag_corpora}. Proper format should be:"
+            " projects/{project}/locations/{location}/ragCorpora/{rag_corpus_id}"
+        )
+
+    if rag_resources:
+        gapic_rag_resource = RetrieveContextsRequest.VertexRagStore.RagResource(
+            rag_corpus=rag_corpus_name,
+            rag_file_ids=rag_resources[0].rag_file_ids,
+        )
+        vertex_rag_store = RetrieveContextsRequest.VertexRagStore(
+            rag_resources=[gapic_rag_resource],
+        )
+    else:
+        vertex_rag_store = RetrieveContextsRequest.VertexRagStore(
+            rag_corpora=[rag_corpus_name],
+        )
+
+    # Check for deprecated parameters and raise warnings.
+    if similarity_top_k:
+        # If similarity_top_k is specified, throw deprecation warning.
+        warnings.warn(
+            "similarity_top_k is deprecated. Please use"
+            " rag_retrieval_config.top_k instead.",
+            DeprecationWarning,
+        )
+    else:
+        # If similarity_top_k is not specified, set it to default 10.
+        similarity_top_k = 10
+    if vector_distance_threshold:
+        # If vector_distance_threshold is specified, throw deprecation warning.
+        warnings.warn(
+            "vector_distance_threshold is deprecated. Please use"
+            " rag_retrieval_config.filter.vector_distance_threshold instead.",
+            DeprecationWarning,
+        )
+    else:
+        # If vector_distance_threshold is not specified, set it to default 0.3.
+        vector_distance_threshold = 0.3
+
+    # If rag_retrieval_config is not specified, set it to default values.
+    if not rag_retrieval_config:
+        rag_retrieval_config = RagRetrievalConfig(
+            top_k=similarity_top_k,
+            filter=RagRetrievalConfig.Filter(
+                vector_distance_threshold=vector_distance_threshold
+            ),
+        )
+    else:
+        # If rag_retrieval_config is specified, check for missing parameters.
+        if not rag_retrieval_config.top_k:
+            rag_retrieval_config.top_k = similarity_top_k
+        if (
+            not rag_retrieval_config.filter
+            or not rag_retrieval_config.filter.vector_distance_threshold
+        ):
+            rag_retrieval_config.filter = RagRetrievalConfig.Filter(
+                vector_distance_threshold=vector_distance_threshold
+            ),
+    query = RagQuery(
+        text=text,
+        rag_retrieval_config=rag_retrieval_config,
+    )
+    request = RetrieveContextsRequest(
+        vertex_rag_store=vertex_rag_store,
+        parent=parent,
+        query=query,
+    )
+    try:
+        response = client.retrieve_contexts(request=request)
+    except Exception as e:
+        raise RuntimeError("Failed in retrieving contexts due to: ", e) from e
+
+    return response