langchain-ai · hemidactylus · Aug 28, 2024 · Aug 24, 2024 · Aug 26, 2024 · Aug 28, 2024
diff --git a/libs/astradb/langchain_astradb/__init__.py b/libs/astradb/langchain_astradb/__init__.py
@@ -6,6 +6,7 @@
 from langchain_astradb.chat_message_histories import AstraDBChatMessageHistory
 from langchain_astradb.document_loaders import AstraDBLoader
 from langchain_astradb.storage import AstraDBByteStore, AstraDBStore
+from langchain_astradb.utils.encoders import AstraDBVectorStoreDocumentEncoder
 from langchain_astradb.vectorstores import AstraDBVectorStore
 
 __all__ = [
@@ -16,5 +17,6 @@
     "AstraDBChatMessageHistory",
     "AstraDBLoader",
     "AstraDBVectorStore",
+    "AstraDBVectorStoreDocumentEncoder",
     "CollectionVectorServiceOptions",
 ]
diff --git a/libs/astradb/langchain_astradb/utils/encoders.py b/libs/astradb/langchain_astradb/utils/encoders.py
@@ -28,16 +28,16 @@ def _default_encode_filter(filter_dict: dict[str, Any]) -> dict[str, Any]:
     return metadata_filter
 
 
-class VSDocumentEncoder(ABC):
+class AstraDBVectorStoreDocumentEncoder(ABC):
     """A document encoder for the Astra DB vector store.
 
     The document encoder contains the information for consistent interaction
     with documents as stored on the Astra DB collection.
 
     Implementations of this class must:
     - define how to encode/decode documents consistently to and from
-      Astra DB collections. The two operations must combine to the identity
-      on both sides.
+      Astra DB collections. Encoding followed by decoding (and vice versa)
+      must return the original value, up to differences in their signatures.
     - provide the adequate projection dictionaries for running find
       operations on Astra DB, with and without the field containing the vector.
     - encode IDs to the `_id` field on Astra DB.
@@ -98,7 +98,7 @@ def encode_filter(self, filter_dict: dict[str, Any]) -> dict[str, Any]:
         """
 
 
-class DefaultVSDocumentEncoder(VSDocumentEncoder):
+class _DefaultVSDocumentEncoder(AstraDBVectorStoreDocumentEncoder):
     """Encoder for the default vector store usage with client-side embeddings.
 
     This encoder expresses how document are stored for collections created
@@ -148,7 +148,7 @@ def encode_filter(self, filter_dict: dict[str, Any]) -> dict[str, Any]:
         return _default_encode_filter(filter_dict)
 
 
-class DefaultVectorizeVSDocumentEncoder(VSDocumentEncoder):
+class _DefaultVectorizeVSDocumentEncoder(AstraDBVectorStoreDocumentEncoder):
     """Encoder for the default vector store usage with server-side embeddings.
 
     This encoder expresses how document are stored for collections created