albert-labs · prasad-albert · Apr 9, 2026 · Apr 9, 2026 · Apr 9, 2026 · Apr 9, 2026
diff --git a/docs/collections/substances_v4.md b/docs/collections/substances_v4.md
@@ -0,0 +1 @@
+::: albert.collections.substance_v4.SubstanceCollectionV4
diff --git a/docs/resources/substances_v4.md b/docs/resources/substances_v4.md
@@ -0,0 +1 @@
+::: albert.resources.substance_v4
diff --git a/mkdocs.yml b/mkdocs.yml
@@ -173,6 +173,7 @@ nav:
           - Storage Classes: collections/storage_classes.md
           - Storage Locations: collections/storage_locations.md
           - Substances: collections/substances.md
+          - Substances V4 (🧪Beta): collections/substances_v4.md
           - Synthesis: collections/synthesis.md
           - Tags: collections/tags.md
           - Targets (🧪Beta): collections/targets.md
@@ -222,6 +223,7 @@ nav:
           - Storage Classes: resources/storage_classes.md
           - Storage Locations: resources/storage_locations.md
           - Substances: resources/substances.md
+          - Substances V4 (🧪Beta): resources/substances_v4.md
           - Synthesis: resources/synthesis.md
           - Tags: resources/tags.md
           - Targets (🧪Beta): resources/targets.md

diff --git a/src/albert/client.py b/src/albert/client.py
@@ -43,6 +43,7 @@
 from albert.collections.storage_classes import StorageClassesCollection
 from albert.collections.storage_locations import StorageLocationsCollection
 from albert.collections.substance import SubstanceCollection
+from albert.collections.substance_v4 import SubstanceCollectionV4
 from albert.collections.synthesis import SynthesisCollection
 from albert.collections.tags import TagCollection
 from albert.collections.targets import TargetCollection
@@ -337,6 +338,10 @@ def smart_datasets(self) -> SmartDatasetCollection:
     def substances(self) -> SubstanceCollection:
         return SubstanceCollection(session=self.session)
 
+    @property
+    def substances_v4(self) -> SubstanceCollectionV4:
+        """Return a ``SubstanceCollectionV4`` bound to this client's session."""
+        return SubstanceCollectionV4(session=self.session)
+
     @property
     def links(self) -> LinksCollection:
         return LinksCollection(session=self.session)

diff --git a/src/albert/collections/inventory.py b/src/albert/collections/inventory.py
@@ -929,6 +929,7 @@ def update(self, *, inventory_item: InventoryItem) -> InventoryItem:
         Notes
         -----
         The following fields can be updated: ``alias``, ``description``, ``is_formula_override``, ``metadata``, ``name``, ``security_class``, ``unit_category``.
+        The following fields can also be updated on individual CAS entries (via ``cas``): ``min``, ``max``, ``target``, ``cas_category``, ``substance_id``, ``inventory_function``.
         """
         # Fetch the current object state from the server or database
         current_object = self.get_by_id(id=inventory_item.id)

diff --git a/src/albert/collections/substance_v4.py b/src/albert/collections/substance_v4.py
@@ -0,0 +1,338 @@
+import json
+from collections.abc import Iterator
+from typing import Any
+
+from pydantic import validate_call
+
+from albert.collections.base import BaseCollection
+from albert.core.pagination import AlbertPaginator
+from albert.core.session import AlbertSession
+from albert.core.shared.enums import PaginationMode
+from albert.resources.substance_v4 import (
+    SubstanceV4Create,
+    SubstanceV4CreateResult,
+    SubstanceV4Info,
+    SubstanceV4Metadata,
+    SubstanceV4Response,
+    SubstanceV4SearchItem,
+)
+
+
+class SubstanceV4SearchPaginator(AlbertPaginator):
+    """Offset-based paginator for the substance v4 search endpoint.
+
+    The running offset is kept as an integer and sent as the ``startKey`` query
+    parameter; it advances by the number of raw records in each page.
+    """
+
+    def __init__(
+        self,
+        *,
+        path: str,
+        session: AlbertSession,
+        params: dict[str, Any] | None = None,
+        max_items: int | None = None,
+    ):
+        """Prepare the query parameters and delegate to ``AlbertPaginator``.
+
+        Parameters
+        ----------
+        path : str
+            Endpoint path, forwarded to ``AlbertPaginator``.
+        session : AlbertSession
+            Session, forwarded to ``AlbertPaginator``.
+        params : dict[str, Any] | None, optional
+            Query parameters. They are copied, so the caller's dict is not
+            modified. A ``startKey`` entry, if present, is used as the initial
+            offset; ``limit`` is always overwritten with 20.
+        max_items : int | None, optional
+            Upper bound on the number of yielded items, by default None (no bound).
+        """
+        query: dict[str, Any] = dict(params) if params else {}
+        self._offset = int(query.get("startKey", 0))
+        query.update(startKey=self._offset, limit=20)  # 20 is the API maximum
+
+        def _parse_page(raw_items):
+            return [SubstanceV4SearchItem.model_validate(raw) for raw in raw_items]
+
+        super().__init__(
+            path=path,
+            mode=PaginationMode.OFFSET,
+            session=session,
+            deserialize=_parse_page,
+            params=query,
+            max_items=max_items,
+        )
+
+    def _create_iterator(self) -> Iterator[SubstanceV4SearchItem]:
+        """Yield search items page by page.
+
+        Stops when a page has no ``substances`` entries or once ``max_items``
+        items have been yielded.
+        """
+        emitted = 0
+        while True:
+            page = self._request().json().get("substances", [])
+            if not page:
+                break
+
+            for record in self.deserialize(page):
+                yield record
+                emitted += 1
+                if self.max_items is not None and emitted >= self.max_items:
+                    return
+
+            # Advance by the raw page length so the next request resumes after it.
+            self._offset += len(page)
+            self.params["startKey"] = self._offset
+
+
+class SubstanceCollectionV4(BaseCollection):
+    """SubstanceCollectionV4 manages substance entities in the Albert platform (🧪Beta).
+
+    !!! warning "Beta Feature!"
+        Please do not use in production or without explicit guidance from Albert. You might otherwise have a bad experience.
+        This feature currently falls outside of the Albert support contract, but we'd love your feedback!
+
+    Parameters
+    ----------
+    session : AlbertSession
+        The Albert session instance.
+
+    Attributes
+    ----------
+    base_path : str
+        The base URL for substance API requests.
+
+    Methods
+    -------
+    get_by_ids(...) -> list[SubstanceV4Info]
+        Retrieves substances by CAS IDs, substance IDs, or external IDs.
+    get_by_id(...) -> SubstanceV4Info
+        Retrieves a single substance by CAS ID, substance ID, or external ID.
+    search(...) -> Iterator[SubstanceV4SearchItem]
+        Searches substances by keyword or advanced filters.
+    create(substance) -> SubstanceV4CreateResult
+        Creates a new substance record.
+    update_metadata(id, metadata) -> None
+        Updates metadata fields on a substance.
+    """
+
+    _api_version = "v4"
+
+    def __init__(self, *, session: AlbertSession):
+        """Bind the collection to ``session`` and set the v4 substances base path."""
+        super().__init__(session=session)
+        version = SubstanceCollectionV4._api_version
+        self.base_path = f"/api/{version}/substances"
+
+    @validate_call
+    def get_by_ids(
+        self,
+        *,
+        cas_ids: list[str] | None = None,
+        sub_ids: list[str] | None = None,
+        external_ids: list[str] | None = None,
+        region: str = "global",
+        catch_errors: bool | None = None,
+        language: str | None = None,
+        classification_type: str | None = None,
+    ) -> list[SubstanceV4Info]:
+        """Fetch substances matching any of the given identifiers.
+
+        At least one of ``cas_ids``, ``sub_ids``, or ``external_ids`` must be
+        non-empty. Each identifier list is sent as a single comma-separated
+        query parameter.
+
+        Parameters
+        ----------
+        cas_ids : list[str] | None
+            CAS numbers to look up.
+        sub_ids : list[str] | None
+            Substance IDs to look up.
+        external_ids : list[str] | None
+            External IDs to look up.
+        region : str, optional
+            Region for hazard information, by default ``"global"``.
+        catch_errors : bool | None, optional
+            Whether to suppress errors for unknown substances, by default None.
+            When set, it is sent as the JSON literal ``true`` or ``false``.
+        language : str | None, optional
+            Language code for name translation, by default None.
+        classification_type : str | None, optional
+            Filter by classification type, by default None.
+
+        Returns
+        -------
+        list[SubstanceV4Info]
+            The matching substances.
+
+        Raises
+        ------
+        ValueError
+            If no identifier list is provided (or all are empty).
+        """
+        id_groups = {"casIDs": cas_ids, "subIDs": sub_ids, "externalIDs": external_ids}
+        if not any(id_groups.values()):
+            raise ValueError("At least one of cas_ids, sub_ids, or external_ids must be provided.")
+
+        query: dict = {"region": region}
+        query.update({key: ",".join(ids) for key, ids in id_groups.items() if ids})
+        if catch_errors is not None:
+            query["catchErrors"] = json.dumps(catch_errors)
+        text_filters = {"language": language, "classificationType": classification_type}
+        query.update({key: text for key, text in text_filters.items() if text})
+
+        payload = self.session.get(self.base_path, params=query).json()
+        return SubstanceV4Response.model_validate(payload).substances
+
+    @validate_call
+    def get_by_id(
+        self,
+        *,
+        cas_id: str | None = None,
+        sub_id: str | None = None,
+        external_id: str | None = None,
+        region: str = "global",
+        catch_errors: bool | None = None,
+        language: str | None = None,
+        classification_type: str | None = None,
+    ) -> SubstanceV4Info:
+        """Retrieve a single substance by its identifier.
+
+        Provide exactly one non-empty value among ``cas_id``, ``sub_id``, and
+        ``external_id``. An empty string is treated the same as ``None``.
+
+        Parameters
+        ----------
+        cas_id : str | None
+            The CAS number.
+        sub_id : str | None
+            The substance ID.
+        external_id : str | None
+            The external ID.
+        region : str, optional
+            Region for hazard information, by default ``"global"``.
+        catch_errors : bool | None, optional
+            Whether to suppress errors for unknown substances, by default None.
+        language : str | None, optional
+            Language code for name translation, by default None.
+        classification_type : str | None, optional
+            Filter by classification type, by default None.
+
+        Returns
+        -------
+        SubstanceV4Info
+            The first substance returned for the identifier.
+
+        Raises
+        ------
+        ValueError
+            If zero or more than one identifier is provided, or if the lookup
+            returns no substances.
+        """
+        # Count by truthiness so the check agrees with how the lists below are
+        # built: an empty string would otherwise pass the "exactly one" check,
+        # be dropped, and surface a misleading error from ``get_by_ids``.
+        provided = sum(bool(value) for value in (cas_id, sub_id, external_id))
+        if provided != 1:
+            raise ValueError("Exactly one of cas_id, sub_id, or external_id must be provided.")
+
+        results = self.get_by_ids(
+            cas_ids=[cas_id] if cas_id else None,
+            sub_ids=[sub_id] if sub_id else None,
+            external_ids=[external_id] if external_id else None,
+            region=region,
+            catch_errors=catch_errors,
+            language=language,
+            classification_type=classification_type,
+        )
+        if not results:
+            raise ValueError("No substance found for the provided identifier.")
+        return results[0]
+
+    @validate_call
+    def search(
+        self,
+        *,
+        search_key: str | None = None,
+        cas: str | None = None,
+        ec: str | None = None,
+        name: str | None = None,
+        region: str = "global",
+        classification_type: str | None = None,
+        start_key: int = 0,
+        max_items: int = 100,
+    ) -> Iterator[SubstanceV4SearchItem]:
+        """Search for substances by keyword or advanced filters.
+
+        At least one of ``search_key``, ``cas``, ``ec``, or ``name`` must be provided.
+        If both ``search_key`` and advanced filters are provided, the advanced filters
+        take precedence.
+
+        The filter check runs when this method is called, not when the result is
+        first iterated; pages are still fetched lazily during iteration.
+
+        Parameters
+        ----------
+        search_key : str | None
+            Free-text search term.
+        cas : str | None
+            Filter by CAS identifier.
+        ec : str | None
+            Filter by EC identifier.
+        name : str | None
+            Filter by substance name.
+        region : str, optional
+            Region for hazard information, by default ``"global"``.
+        classification_type : str | None, optional
+            Filter by classification type, by default None.
+        start_key : int, optional
+            Offset to resume pagination from, by default 0.
+        max_items : int, optional
+            Maximum number of items to yield, by default 100.
+
+        Returns
+        -------
+        Iterator[SubstanceV4SearchItem]
+            Iterator over matching substance search records.
+
+        Raises
+        ------
+        ValueError
+            If none of ``search_key``, ``cas``, ``ec``, or ``name`` is provided.
+        """
+        # This must stay a plain function (no ``yield``): in a generator function
+        # the check below would only run on the first ``next()`` call.
+        if not any([search_key, cas, ec, name]):
+            raise ValueError("At least one of search_key, cas, ec, or name must be provided.")
+
+        params: dict = {"region": region, "startKey": start_key}
+        if search_key:
+            params["searchKey"] = search_key
+        if cas:
+            params["cas"] = cas
+        if ec:
+            params["ec"] = ec
+        if name:
+            params["name"] = name
+        if classification_type:
+            params["classificationType"] = classification_type
+
+        return iter(
+            SubstanceV4SearchPaginator(
+                path=f"{self.base_path}/search",
+                session=self.session,
+                params=params,
+                max_items=max_items,
+            )
+        )
+
+    @validate_call
+    def create(self, *, substance: SubstanceV4Create) -> SubstanceV4CreateResult:
+        """Create a new substance record.
+
+        The substance is serialized by alias with ``None`` fields omitted and
+        posted as a one-element list.
+
+        Parameters
+        ----------
+        substance : SubstanceV4Create
+            The substance data to create.
+
+        Returns
+        -------
+        SubstanceV4CreateResult
+            The result containing created, failed, and existing items.
+        """
+        serialized = substance.model_dump(by_alias=True, mode="json", exclude_none=True)
+        response = self.session.post(self.base_path, json=[serialized])
+        return SubstanceV4CreateResult.model_validate(response.json())
+
+    @validate_call
+    def update_metadata(self, *, id: str, metadata: SubstanceV4Metadata) -> None:
+        """Update metadata fields on a substance.
+
+        ``notes``, ``description`` and ``cas_smiles`` are sent only when they are
+        not ``None``. Every entry of ``metadata.metadata`` is sent as given, under
+        the attribute name ``Metadata.<key>``. If there is nothing to send, no
+        request is made.
+
+        Parameters
+        ----------
+        id : str
+            The substance ID to update. A ``SUB`` prefix is added if missing.
+        metadata : SubstanceV4Metadata
+            The metadata fields to update.
+
+        Notes
+        -----
+        The following fields can be updated: ``notes``, ``description``, ``cas_smiles``,
+        and any custom metadata fields configured for the tenant.
+        """
+        # Model attribute name -> attribute name used in the patch payload.
+        wire_names = {"notes": "notes", "description": "description", "cas_smiles": "casSmiles"}
+        operations = [
+            {"operation": "add", "attribute": wire_name, "newValue": current}
+            for attr, wire_name in wire_names.items()
+            if (current := getattr(metadata, attr)) is not None
+        ]
+        operations.extend(
+            {"operation": "add", "attribute": f"Metadata.{key}", "newValue": custom_value}
+            for key, custom_value in (metadata.metadata or {}).items()
+        )
+
+        if operations:
+            sub_id = id if id.startswith("SUB") else f"SUB{id}"
+            self.session.patch(f"{self.base_path}/metadata/{sub_id}", json={"data": operations})
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1 @@
		::: albert.collections.substance_v4.SubstanceCollectionV4