From 1447f49b72e6481ffe1c65d9b041c67ccf53df65 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=C5=A0ar=C5=ABnas=20Nejus?= <snejus@protonmail.com>
Date: Wed, 24 Dec 2025 21:42:48 +0000
Subject: [PATCH] Add some documentation to musicbrainz api mixins

---
 beetsplug/_utils/musicbrainz.py | 31 ++++++++++++++++++++++-
 beetsplug/mbcollection.py       | 44 +++++++++++++++++++++++++++++++++
 2 files changed, 74 insertions(+), 1 deletion(-)

diff --git a/beetsplug/_utils/musicbrainz.py b/beetsplug/_utils/musicbrainz.py
index 17a83dd9b..47a2550f0 100644
--- a/beetsplug/_utils/musicbrainz.py
+++ b/beetsplug/_utils/musicbrainz.py
@@ -1,3 +1,13 @@
+"""Helpers for communicating with the MusicBrainz webservice.
+
+Provides a rate-limited HTTP session and convenience methods to fetch and
+normalize API responses.
+
+This module centralizes request handling and response shaping so callers can
+work with consistently structured data without embedding HTTP or rate-limit
+logic throughout the codebase.
+"""
+
 from __future__ import annotations
 
 import operator
@@ -21,11 +31,22 @@ log = logging.getLogger(__name__)
 
 
 class LimiterTimeoutSession(LimiterMixin, TimeoutAndRetrySession):
-    pass
+    """HTTP session that enforces rate limits."""
 
 
 @dataclass
 class MusicBrainzAPI(RequestHandler):
+    """High-level interface to the MusicBrainz WS/2 API.
+
+    Responsibilities:
+    - Configure the API host and request rate from application configuration.
+    - Offer helpers to fetch common entity types and to run searches.
+    - Normalize MusicBrainz responses so relation lists are grouped by target
+      type for easier downstream consumption.
+
+    Documentation: https://musicbrainz.org/doc/MusicBrainz_API
+    """
+
     api_host: str = field(init=False)
     rate_limit: float = field(init=False)
 
@@ -67,6 +88,12 @@ class MusicBrainzAPI(RequestHandler):
     def get_entity(
         self, entity: str, includes: list[str] | None = None, **kwargs
     ) -> JSONDict:
+        """Retrieve and normalize data from the API entity endpoint.
+
+        If requested, includes are appended to the request. The response is
+        passed through a normalizer that groups relation entries by their
+        target type so that callers receive a consistently structured mapping.
+        """
         if includes:
             kwargs["inc"] = "+".join(includes)
 
@@ -154,6 +181,8 @@ class MusicBrainzAPI(RequestHandler):
 
 
 class MusicBrainzAPIMixin:
+    """Mixin that provides a cached MusicBrainzAPI helper instance."""
+
     @cached_property
     def mb_api(self) -> MusicBrainzAPI:
         return MusicBrainzAPI()
diff --git a/beetsplug/mbcollection.py b/beetsplug/mbcollection.py
index 95ceb3fcf..25f16228a 100644
--- a/beetsplug/mbcollection.py
+++ b/beetsplug/mbcollection.py
@@ -43,6 +43,19 @@ UUID_PAT = re.compile(r"^[a-f0-9]{8}(-[a-f0-9]{4}){3}-[a-f0-9]{12}$")
 
 @dataclass
 class MusicBrainzUserAPI(MusicBrainzAPI):
+    """MusicBrainz API client with user authentication.
+
+    In order to retrieve private user collections and modify them, we need to
+    authenticate the requests with the user's MusicBrainz credentials.
+
+    See documentation for authentication details:
+        https://musicbrainz.org/doc/MusicBrainz_API#Authentication
+
+    Note that the documentation misleadingly states HTTP 'basic' authentication,
+    and I had to reverse-engineer musicbrainzngs to discover that it actually
+    uses HTTP 'digest' authentication.
+    """
+
     auth: HTTPDigestAuth = field(init=False)
 
     @cached_property
@@ -57,12 +70,18 @@ class MusicBrainzUserAPI(MusicBrainzAPI):
         )
 
     def request(self, *args, **kwargs) -> Response:
+        """Authenticate and include required client param in all requests."""
         kwargs.setdefault("params", {})
         kwargs["params"]["client"] = f"beets-{__version__}"
         kwargs["auth"] = self.auth
         return super().request(*args, **kwargs)
 
     def get_collections(self) -> list[JSONDict]:
+        """Get all collections for the authenticated user.
+
+        Note that both the ``editor`` and ``inc=user-collections`` URL
+        parameters must be included to retrieve private collections.
+        """
         return self.get_entity(
             "collection", editor=self.user, includes=["user-collections"]
         ).get("collections", [])
@@ -70,6 +89,13 @@ class MusicBrainzUserAPI(MusicBrainzAPI):
 
 @dataclass
 class MBCollection:
+    """Representation of a user's MusicBrainz collection.
+
+    Provides convenient, chunked operations for retrieving releases and updating
+    the collection via the MusicBrainz web API. Fetch and submission limits are
+    controlled by class-level constants to avoid oversized requests.
+    """
+
     SUBMISSION_CHUNK_SIZE: ClassVar[int] = 200
     FETCH_CHUNK_SIZE: ClassVar[int] = 100
 
@@ -78,22 +104,31 @@ class MBCollection:
 
     @property
     def id(self) -> str:
+        """Unique identifier assigned to the collection by MusicBrainz."""
         return self.data["id"]
 
     @property
     def release_count(self) -> int:
+        """Total number of releases recorded in the collection."""
         return self.data["release-count"]
 
     @property
     def releases_url(self) -> str:
+        """Complete API endpoint URL for listing releases in this collection."""
         return f"{self.mb_api.api_root}/collection/{self.id}/releases"
 
     @property
     def releases(self) -> list[JSONDict]:
+        """Retrieve all releases in the collection, fetched in successive pages.
+
+        The fetch is performed in chunks and returns a flattened sequence of
+        release records.
+        """
         offsets = list(range(0, self.release_count, self.FETCH_CHUNK_SIZE))
         return [r for offset in offsets for r in self.get_releases(offset)]
 
     def get_releases(self, offset: int) -> list[JSONDict]:
+        """Fetch a single page of releases beginning at a given position."""
         return self.mb_api.get_json(
             self.releases_url,
             params={"limit": self.FETCH_CHUNK_SIZE, "offset": offset},
@@ -101,15 +136,24 @@ class MBCollection:
 
     @classmethod
     def get_id_chunks(cls, id_list: list[str]) -> Iterator[list[str]]:
+        """Yield successive sublists of identifiers sized for safe submission.
+
+        Splits a long sequence of identifiers into batches that respect the
+        service's submission limits to avoid oversized requests.
+        """
         for i in range(0, len(id_list), cls.SUBMISSION_CHUNK_SIZE):
             yield id_list[i : i + cls.SUBMISSION_CHUNK_SIZE]
 
     def add_releases(self, releases: list[str]) -> None:
+        """Add releases to the collection in chunks."""
         for chunk in self.get_id_chunks(releases):
+            # Need to escape semicolons: https://github.com/psf/requests/issues/6990
             self.mb_api.put(f"{self.releases_url}/{'%3B'.join(chunk)}")
 
     def remove_releases(self, releases: list[str]) -> None:
+        """Remove releases from the collection in chunks."""
         for chunk in self.get_id_chunks(releases):
+            # Need to escape semicolons: https://github.com/psf/requests/issues/6990
             self.mb_api.delete(f"{self.releases_url}/{'%3B'.join(chunk)}")