From 670405d9391e10b0b3318963a24f8e892de8d84b Mon Sep 17 00:00:00 2001 From: infojunkie Date: Sun, 23 Jun 2024 14:46:30 -0700 Subject: [PATCH] Rename command --- README.md | 64 +++++++++++++- poetry.lock | 17 +++- pyproject.toml | 3 +- src/discogs_tag/cli.py | 178 +++++++++++++++++++++++++++++++++++--- tests/test_discogs_tag.py | 106 +++++++++++++++++++++-- 5 files changed, 344 insertions(+), 24 deletions(-) diff --git a/README.md b/README.md index 115fb4b..301142a 100644 --- a/README.md +++ b/README.md @@ -9,6 +9,26 @@ A rudimentary audio tagger based on Discogs metadata. # Usage ```shell +NAME + discogs-tag + +SYNOPSIS + discogs-tag COMMAND + +COMMANDS + COMMAND is one of the following: + + tag + Tag the audio files with the given Discogs release. + + copy + Copy the audio tags from source to destination folders. + + rename + Rename the audio files based on the given format string. +``` +## tag +```shell NAME discogs-tag tag - Tag the audio files with the given Discogs release. @@ -16,7 +36,10 @@ SYNOPSIS discogs-tag tag RELEASE DESCRIPTION - The skip flag can take one or more of the following values, comma-separated: + The RELEASE is the numeric portion of a Discogs release URL, e.g. 16215626 in + https://www.discogs.com/release/16215626-Pink-Floyd-Wish-You-Were-Here + + The SKIP flag can take one or more of the following values, comma-separated: artist, composer, title, position, date, subtrack, album, genre, albumartist POSITIONAL ARGUMENTS @@ -36,6 +59,7 @@ FLAGS NOTES You can also use flags syntax for POSITIONAL ARGUMENTS ``` +## copy ```shell NAME discogs-tag copy - Copy the audio tags from source to destination folders. @@ -44,7 +68,7 @@ SYNOPSIS discogs-tag copy SRC DESCRIPTION - The skip flag can take one or more of the following values, comma-separated: + The SKIP flag can take one or more of the following values, comma-separated: artist, composer, title, position, date, subtrack, album, genre, albumartist POSITIONAL ARGUMENTS @@ -64,3 +88,39 @@ FLAGS NOTES You can also use flags syntax for POSITIONAL ARGUMENTS ``` +## rename +```shell +NAME + discogs-tag rename - Rename the audio files based on the given format string. + +SYNOPSIS + discogs-tag rename FORMAT + +DESCRIPTION + The FORMAT string specifies how to rename the audio files and/or directories according to the following tags: + %a Artist + %z Album artist + %b Album title + %p Composer + %d Disc nummber + %g Genre + %n Track number + %t Track title + %y Year + / Directory separator: Specifies subdirectories to be created starting from the given directory. + Non-audio files will be moved to their existing subdirectories within the destination root which is assumed to be unique. + +POSITIONAL ARGUMENTS + FORMAT + +FLAGS + --dir=DIR + Default: './' + --dry=DRY + Default: False + -i, --ignore=IGNORE + Default: False + +NOTES + You can also use flags syntax for POSITIONAL ARGUMENTS +``` diff --git a/poetry.lock b/poetry.lock index a383eab..53e0b79 100644 --- a/poetry.lock +++ b/poetry.lock @@ -91,6 +91,21 @@ files = [ {file = "packaging-24.0.tar.gz", hash = "sha256:eb82c5e3e56209074766e6885bb04b8c38a0c015d0a30036ebe7ece34c9989e9"}, ] +[[package]] +name = "pathvalidate" +version = "3.2.0" +description = "pathvalidate is a Python library to sanitize/validate a string such as filenames/file-paths/etc." +optional = false +python-versions = ">=3.7" +files = [ + {file = "pathvalidate-3.2.0-py3-none-any.whl", hash = "sha256:cc593caa6299b22b37f228148257997e2fa850eea2daf7e4cc9205cef6908dee"}, + {file = "pathvalidate-3.2.0.tar.gz", hash = "sha256:5e8378cf6712bff67fbe7a8307d99fa8c1a0cb28aa477056f8fc374f0dff24ad"}, +] + +[package.extras] +docs = ["Sphinx (>=2.4)", "sphinx-rtd-theme (>=1.2.2)", "urllib3 (<2)"] +test = ["Faker (>=1.0.8)", "allpairspy (>=2)", "click (>=6.2)", "pytest (>=6.0.1)", "pytest-discord (>=0.1.4)", "pytest-md-report (>=0.4.1)"] + [[package]] name = "pluggy" version = "1.5.0" @@ -199,4 +214,4 @@ testing = ["big-O", "jaraco.functools", "jaraco.itertools", "jaraco.test", "more [metadata] lock-version = "2.0" python-versions = "^3.10" -content-hash = "5f88cb4f98a6b5052bb3b7f625f5b1e4d209e008b464829882303bd90223080c" +content-hash = "a47a75040450020af9a98940fe5e36e01df90cfb17e913c34ad7ea9efd68ba36" diff --git a/pyproject.toml b/pyproject.toml index 059c8a3..a845935 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "discogs-tag" -version = "0.3.2" +version = "0.4.0" description = "A rudimentary audio tagger based on Discogs metadata." authors = ["infojunkie "] readme = "README.md" @@ -11,6 +11,7 @@ python = "^3.10" fire = "^0.5.0" mutagen = "^1.46.0" importlib-metadata = "^6.8.0" +pathvalidate = "^3.2.0" [tool.poetry.group.dev.dependencies] pytest = "^7.0.0" diff --git a/src/discogs_tag/cli.py b/src/discogs_tag/cli.py index 80f1de0..4c3cb55 100644 --- a/src/discogs_tag/cli.py +++ b/src/discogs_tag/cli.py @@ -3,11 +3,13 @@ import urllib.request import json import os -from pprint import pprint import glob import sys import re +from pprint import pprint from functools import reduce +from contextlib import suppress +from pathvalidate import sanitize_filename from discogs_tag import __NAME__, __VERSION__ SKIP_KEYS = [ @@ -33,7 +35,10 @@ def tag( ): """Tag the audio files with the given Discogs release. - The skip flag can take one or more of the following values, comma-separated: + The RELEASE is the numeric portion of a Discogs release URL, e.g. 16215626 in + https://www.discogs.com/release/16215626-Pink-Floyd-Wish-You-Were-Here + + The SKIP flag can take one or more of the following values, comma-separated: artist, composer, title, position, date, subtrack, album, genre, albumartist """ @@ -43,7 +48,7 @@ def tag( }) with urllib.request.urlopen(request) as response: data = json.load(response) - files = get_files(dir) + files = list_files(dir) apply_metadata(data, files, options) def copy( @@ -55,29 +60,98 @@ def copy( ): """Copy the audio tags from source to destination folders. - The skip flag can take one or more of the following values, comma-separated: + The SKIP flag can take one or more of the following values, comma-separated: artist, composer, title, position, date, subtrack, album, genre, albumartist """ options = parse_options(locals()) - src_files = get_files(src) + src_files = list_files(src) if not src_files: raise Exception(f'No source files found at {src}. Aborting.') data = read_metadata(src_files, options) - dst_files = get_files(dir) + dst_files = list_files(dir) if options['dry']: pprint(data) else: apply_metadata(data, dst_files, options) +def rename( + format, + dir='./', + dry=False, + ignore=False +): + """Rename the audio files based on the given format string. + + The FORMAT string specifies how to rename the audio files and/or directories according to the following tags: + %a Artist + %z Album artist + %b Album title + %p Composer + %d Disc nummber + %g Genre + %n Track number + %t Track title + %y Year + / Directory separator: Specifies subdirectories to be created starting from the given directory. + Non-audio files will be moved to their existing subdirectories within the destination root which is assumed to be unique. + + """ + options = parse_options(locals()) + src_root = os.path.realpath(dir) + if not os.path.exists(src_root): + raise Exception(f'Directory "{dir}" not found. Aborting.') + files = list_files(src_root) + if not files: + raise Exception(f'Directory "{dir}" has no audio files. Aborting.') + + # Extract and create destination root from first audio file. + audio = mutagen.File(files[0], easy=True) + _, dst_root = rename_path(src_root, audio, format, options) + + # Iterate on all files and directories to move them to the destination. + # - Audio files are renamed according to their format, including subfolder structure + # - Other files are moved to the same subfolder in the destination tree + # - Folders are recreated on the destination and removed from the source if empty + for dirpath, dirnames, filenames in os.walk(src_root, topdown=False): + for filename in filenames: + src_filepath = os.path.join(dirpath, filename) + _, ext = os.path.splitext(src_filepath) + if ext[1:] in AUDIO_EXTENSIONS: + audio = mutagen.File(src_filepath, easy=True) + dst_path, _ = rename_path(src_root, audio, format, options) + rename_file(src_filepath, dst_path, audio, format, options) + else: + dst_filepath = os.path.join(dst_root, os.path.relpath(src_filepath, src_root)) + if options['dry']: + print("%s => %s" % (src_filepath, dst_filepath)) + else: + os.makedirs(os.path.dirname(dst_filepath), exist_ok=True) + os.rename(src_filepath, dst_filepath) + for dirname in dirnames: + src_path = os.path.join(dirpath, dirname) + if options['dry']: + print("✗ %s" % (src_path)) + else: + with suppress(OSError): + os.rmdir(src_path) + + # Also delete source root. + if options['dry']: + print("✗ %s" % (src_root)) + else: + with suppress(OSError): + os.rmdir(src_root) + def read_metadata(files, options): - """Read metadata from OS audio files and return data structure that mimics Discogs release.""" + """Read metadata from audio files and return data structure that mimics Discogs release.""" def safe_position(audio, n): try: return audio['tracknumber'][0].split('/')[0].lstrip('0') except: return str(n) + def safe_year(audio): try: return int(audio['date'][0].split('-')[0]) @@ -106,7 +180,7 @@ def safe_year(audio): } def apply_metadata(release, files, options): - """Apply Discogs release metadada to OS audio files.""" + """Apply Discogs release metadada to audio files.""" def get_tracks(tracklist): def reduce_track(tracks, track): if track['type_'] == 'track': @@ -126,7 +200,7 @@ def reduce_track(tracks, track): for n, track in enumerate(tracks): try: audio = mutagen.File(files[n], easy=True) - merge_metadata(release, track, audio, options) + audio = merge_metadata(release, track, audio, options) if options['dry']: pprint(audio) else: @@ -140,17 +214,90 @@ def reduce_track(tracks, track): if not options['dry']: print(f'Processed {len(files)} audio files.') -def get_files(dir): +def rename_component(audio, format, options): + """ Rename a path component based on format string with tags from the audio metadata. """ + component = format + for tag, fn in { + '%a': (lambda audio: audio.get('artist', [''])[0]), + '%z': (lambda audio: audio.get('albumartist', [''])[0]), + '%b': (lambda audio: audio.get('album', [''])[0]), + '%p': (lambda audio: audio.get('composer', [''])[0]), + '%d': (lambda audio: audio.get('discnumber', [''])[0]), + '%g': (lambda audio: audio.get('genre', [''])[0]), + '%n': (lambda audio: '%02d' % int(audio.get('tracknumber', [0])[0])), + '%t': (lambda audio: audio.get('title', [''])[0]), + '%y': (lambda audio: audio.get('date', [''])[0]) + }.items(): + if tag in component: + try: + replace = fn(audio).strip() + # If replacement is empty, also remove format chars until next tag. + if not replace: + component = re.sub(re.escape(tag) + r"[^%]*", '', component) + else: + component = component.replace(tag, replace) + except Exception as e: + if options['ignore']: + print(e, file=sys.stderr) + else: + raise e + return component + +def rename_path(src_root, audio, format, options): + """ Create directory path based on format string with tags from the audio metadata. """ + # Expand tags in each path component. + paths = [] + for dir in format.split('/')[:-1]: + paths.append(sanitize_filename(rename_component(audio, dir, options))) + if not paths: + return src_root, src_root + + # Create the new path. + dst_path = os.path.join(os.path.dirname(os.path.realpath(src_root)), *paths) + if not options['dry']: + os.makedirs(dst_path, exist_ok=True) + + return dst_path, os.path.join(os.path.dirname(os.path.realpath(src_root)), paths[0]) + +def rename_file(src_file, dst_path, audio, format, options): + """ Rename audio file based on format string with tags from the audio metadata. """ + # Get the last component of the format path. + filename = format.split('/')[-1].strip() + + if len(filename) == 0: + # No format specified: Keep the original filename + filename = os.path.basename(src_file) + else: + # Replace tags in the filename with audio metadata. + filename = rename_component(audio, filename, options) + + # Add back the original file extension. + _, ext = os.path.splitext(src_file) + filename += ext + + # Sanitize the filename. + filename = sanitize_filename(filename) + + # Add the original path. + dst_file = os.path.join(dst_path, filename) + if options['dry']: + print("%s => %s" % (src_file, dst_file)) + else: + os.rename(src_file, dst_file) + + return dst_file + +def list_files(dir): return sorted(reduce(lambda xs, ys: xs + ys, [ glob.glob(os.path.join(glob.escape(dir), '**', f"*.{ext}"), recursive=True) for ext in AUDIO_EXTENSIONS ])) def parse_options(options): for skip in SKIP_KEYS: - options['skip_' + skip] = False - if options['skip'] is not None: - for skip in options['skip'].lower(): - options['skip_' + skip] = True + options['skip_' + skip.lower()] = False + if 'skip' in options and options['skip'] is not None: + for skip in options['skip']: + options['skip_' + skip.lower()] = True return options def merge_metadata(release, track, audio, options): @@ -209,8 +356,11 @@ def artist_name(artist): if 'year' in release and release['year']: audio['date'] = str(release['year']) + return audio + def cli(): fire.Fire({ 'tag': tag, 'copy': copy, + 'rename': rename }) diff --git a/tests/test_discogs_tag.py b/tests/test_discogs_tag.py index ef31514..7b7352e 100644 --- a/tests/test_discogs_tag.py +++ b/tests/test_discogs_tag.py @@ -1,9 +1,9 @@ -from discogs_tag.cli import merge_metadata, apply_metadata, parse_options, get_files +from discogs_tag.cli import merge_metadata, apply_metadata, parse_options, list_files, rename_component, rename_path, rename_file import pytest import json -def test_get_files(): - files = get_files('tests/glob') +def test_list_files(): + files = list_files('tests/glob') assert files == [ 'tests/glob/01.mp3', 'tests/glob/02.flac', @@ -14,8 +14,7 @@ def test_get_files(): ] def test_merge_metadata(): - audio = {} - merge_metadata({ + audio = merge_metadata({ 'year': 2002, }, { 'title': 'Title', @@ -35,7 +34,7 @@ def test_merge_metadata(): 'role': 'Written-By', 'name': 'Composer' }] - }, audio, parse_options({ 'skip': None })) + }, { 'title': 'Some other title' }, parse_options({ 'skip': None })) assert audio['title'] == 'Title' assert audio['artist'] == 'Artist 1, Artist 2, Artist 3, Guitarist' assert audio['discnumber'] == '1' @@ -60,3 +59,98 @@ def test_count_subtracks(): with pytest.raises(Exception) as error: apply_metadata(data, [], parse_options({ 'dry': False, 'ignore': False, 'skip': None })) assert "Expecting 18 files" in str(error.value) + +def test_rename_component(): + assert '1-02 Title' == rename_component({ + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'discnumber': ['1'], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%d-%n %t', parse_options({ 'dry': True, 'ignore': False })) + assert '02 Title' == rename_component({ + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%d-%n %t', parse_options({ 'dry': True, 'ignore': False })) + with pytest.raises(IndexError) as error: + rename_component({ + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'discnumber': [], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%d-%n %t', parse_options({ 'dry': True, 'ignore': False })) + assert "list index out of range" in str(error.value) + +def test_rename_path(): + assert ('/src/path/Album Artist - (2024) Album', '/src/path/Album Artist - (2024) Album') == rename_path('/src/path/from', { + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'discnumber': ['1'], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%z - (%y) %b/%d-%n %t', parse_options({ 'dry': True, 'ignore': False })) + assert ('/src/path/from', '/src/path/from') == rename_path('/src/path/from', { + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'discnumber': ['1'], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%d-%n %t', parse_options({ 'dry': True, 'ignore': False })) + assert ('/src/path/Album Artist/(2024) Album', '/src/path/Album Artist') == rename_path('/src/path/from', { + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'discnumber': ['1'], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%z/(%y) %b/%d-%n %t', parse_options({ 'dry': True, 'ignore': False })) + +def test_rename_file(): + assert '/dest/path/to/1-02 Title.flac' == rename_file('/src/path/from/test.flac', '/dest/path/to', { + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'discnumber': ['1'], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%z - (%y) %b/%d-%n %t', parse_options({ 'dry': True, 'ignore': False })) + assert '/dest/path/to/test.flac' == rename_file('/src/path/from/test.flac', '/dest/path/to', { + 'artist': ['Artist'], + 'albumartist': ['Album Artist'], + 'album': ['Album'], + 'composer': ['Composer'], + 'discnumber': ['1'], + 'genre': ['Genre'], + 'tracknumber': [2], + 'title': ['Title'], + 'date': ['2024'] + }, '%z - (%y) %b/', parse_options({ 'dry': True, 'ignore': False }))