move MBCS check to bytestring_path

This should be used in *every* filename conversion, not just the destination generation. Also required a change to sorted_walk (erroneously didn't use syspath).
2026-02-13 10:51:59 +01:00 · 2012-07-17 11:45:44 -07:00 · 2012-07-17 11:45:44 -07:00 · 70000ec4e4
commit 70000ec4e4
parent 44459f88d0
2 changed files with 14 additions and 13 deletions
--- a/beets/library.py
+++ b/beets/library.py
@ -1123,17 +1123,9 @@ class Library(BaseLibrary):
            subpath = unicodedata.normalize('NFC', subpath)
        # Truncate components and remove forbidden characters.
        subpath = util.sanitize_path(subpath, pathmod, self.replacements)
-        # Encode for the filesystem, dropping unencodable characters.
-        if isinstance(subpath, unicode) and not fragment:
-            encoding = sys.getfilesystemencoding() or sys.getdefaultencoding()
-            if encoding == 'mbcs':
-                # On Windows, a broken encoding known to Python as
-                # "MBCS" is used for the filesystem. However, we only
-                # use the Unicode API for Windows paths, so the encoding
-                # is actually immaterial so we can avoid dealing with
-                # this nastiness. We arbitrarily choose UTF-8.
-                encoding = 'utf8'
-            subpath = subpath.encode(encoding, 'replace')
+        # Encode for the filesystem.
+        if not fragment:
+            subpath = bytestring_path(subpath)

        # Preserve extension.
        _, extension = pathmod.splitext(item.path)
--- a/beets/util/init.py
+++ b/beets/util/init.py
@ -141,7 +141,9 @@ def sorted_walk(path, ignore=()):
    # Get all the directories and files at this level.
    dirs = []
    files = []
-    for base in os.listdir(path):
+    for base in os.listdir(syspath(path)):
+        base = bytestring_path(base)
+
        # Skip ignored filenames.
        skip = False
        for pat in ignore:
@ -166,7 +168,7 @@ def sorted_walk(path, ignore=()):
    # Recurse into directories.
    for base in dirs:
        cur = os.path.join(path, base)
-        # yield from _sorted_walk(cur)
+        # yield from sorted_walk(...)
        for res in sorted_walk(cur, ignore):
            yield res

@ -250,6 +252,13 @@ def bytestring_path(path):

    # Try to encode with default encodings, but fall back to UTF8.
    encoding = sys.getfilesystemencoding() or sys.getdefaultencoding()
+    if encoding == 'mbcs':
+        # On Windows, a broken encoding known to Python as "MBCS" is
+        # used for the filesystem. However, we only use the Unicode API
+        # for Windows paths, so the encoding is actually immaterial so
+        # we can avoid dealing with this nastiness. We arbitrarily
+        # choose UTF-8.
+        encoding = 'utf8'
    try:
        return path.encode(encoding)
    except (UnicodeError, LookupError):