Refactor imports to allow using the package without Annoy/SentenceTransformers when a custom embedding search provider is configured.

drazvan · drazvan · commit ec07145f0cde · 2023-09-04T23:08:34.000+03:00
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -19,6 +19,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 - Moved to using `nest_asyncio` for [implementing the blocking API](./docs/user_guide/advanced/nested-async-loop.md). Fixes [#3](https://github.com/NVIDIA/NeMo-Guardrails/issues/3) and [#32](https://github.com/NVIDIA/NeMo-Guardrails/issues/32).
 - Improved event property validation in `new_event_dict`.
+- Refactored imports to allow installing from source without Annoy/SentenceTransformers (a custom embedding search provider is required in that case).
 
 ### Fixed
 
diff --git a/nemoguardrails/embeddings/basic.py b/nemoguardrails/embeddings/basic.py
@@ -16,7 +16,6 @@
 from typing import List
 
 from annoy import AnnoyIndex
-from sentence_transformers import SentenceTransformer
 from torch import cuda
 
 from nemoguardrails.embeddings.index import EmbeddingModel, EmbeddingsIndex, IndexItem
@@ -115,6 +114,8 @@ class SentenceTransformerEmbeddingModel(EmbeddingModel):
     """Embedding model using sentence-transformers."""
 
     def __init__(self, embedding_model: str):
+        from sentence_transformers import SentenceTransformer
+
         device = "cuda" if cuda.is_available() else "cpu"
         self.model = SentenceTransformer(embedding_model, device=device)
         # Get the embedding dimension of the model
diff --git a/nemoguardrails/kb/kb.py b/nemoguardrails/kb/kb.py
@@ -21,7 +21,6 @@
 
 from annoy import AnnoyIndex
 
-from nemoguardrails.embeddings.basic import BasicEmbeddingsIndex
 from nemoguardrails.embeddings.index import EmbeddingsIndex, IndexItem
 from nemoguardrails.kb.utils import split_markdown_in_topic_chunks
 from nemoguardrails.rails.llm.config import EmbeddingSearchProvider, KnowledgeBaseConfig
@@ -89,6 +88,8 @@ async def build(self):
             and os.path.exists(cache_file)
             and os.path.exists(embedding_size_file)
         ):
+            from nemoguardrails.embeddings.basic import BasicEmbeddingsIndex
+
             log.info(cache_file)
             self.index = cast(
                 BasicEmbeddingsIndex,
@@ -116,6 +117,8 @@ async def build(self):
             # For the default Embedding Search provider, which uses annoy, we also
             # persist the index after it's computed.
             if self.config.embedding_search_provider.name == "default":
+                from nemoguardrails.embeddings.basic import BasicEmbeddingsIndex
+
                 # We also save the file for future use
                 os.makedirs(CACHE_FOLDER, exist_ok=True)
                 basic_index = cast(BasicEmbeddingsIndex, self.index)
diff --git a/nemoguardrails/rails/llm/llmrails.py b/nemoguardrails/rails/llm/llmrails.py
@@ -31,7 +31,6 @@
 from nemoguardrails.actions.math import wolfram_alpha_request
 from nemoguardrails.actions.output_moderation import output_moderation
 from nemoguardrails.actions.retrieve_relevant_chunks import retrieve_relevant_chunks
-from nemoguardrails.embeddings.basic import BasicEmbeddingsIndex
 from nemoguardrails.embeddings.index import EmbeddingsIndex
 from nemoguardrails.flows.runtime import Runtime
 from nemoguardrails.kb.kb import KnowledgeBase
@@ -227,6 +226,8 @@ def _get_embeddings_search_provider_instance(
             esp_config = EmbeddingSearchProvider()
 
         if esp_config.name == "default":
+            from nemoguardrails.embeddings.basic import BasicEmbeddingsIndex
+
             return BasicEmbeddingsIndex(
                 embedding_model=esp_config.parameters.get(
                     "embedding_model", self.default_embedding_model