ordigi/ordigi.py

286 lines
9.8 KiB
Python
Raw Normal View History

#!/usr/bin/env python
import os
import re
import sys
from datetime import datetime
import click
from ordigi.config import Config
2021-08-14 21:31:37 +02:00
from ordigi import constants
from ordigi import log
2021-08-13 21:11:24 +02:00
from ordigi.database import Db
2021-08-27 12:45:25 +02:00
from ordigi.collection import Collection
from ordigi.geolocation import GeoLocation
2021-08-14 21:31:37 +02:00
from ordigi.media import Media, get_all_subclasses
2021-08-13 21:11:24 +02:00
from ordigi.summary import Summary
def print_help(command):
click.echo(command.get_help(click.Context(sort)))
@click.command('sort')
@click.option('--debug', default=False, is_flag=True,
help='Override the value in constants.py with True.')
@click.option('--dry-run', default=False, is_flag=True,
help='Dry run only, no change made to the filesystem.')
@click.option('--destination', '-d', type=click.Path(file_okay=False),
default=None, help='Sort files into this directory.')
2021-08-14 21:37:43 +02:00
@click.option('--clean', '-C', default=False, is_flag=True,
help='Clean empty folders')
@click.option('--copy', '-c', default=False, is_flag=True,
help='True if you want files to be copied over from src_dir to\
dest_dir rather than moved')
@click.option('--exclude-regex', '-e', default=set(), multiple=True,
help='Regular expression for directories or files to exclude.')
@click.option('--filter-by-ext', '-f', default=set(), multiple=True, help='''Use filename
extension to filter files for sorting. If value is '*', use
common media file extension for filtering. Ignored files remain in
the same directory structure''' )
@click.option('--ignore-tags', '-i', default=set(), multiple=True,
help='Specific tags or group that will be ignored when\
searching for file data. Example \'File:FileModifyDate\' or \'Filename\'' )
@click.option('--max-deep', '-m', default=None,
help='Maximum level to proceed. Number from 0 to desired level.')
2021-08-27 12:45:25 +02:00
@click.option('--remove-duplicates', '-R', default=False, is_flag=True,
help='True to remove files that are exactly the same in name\
and a file hash')
2021-08-27 12:45:25 +02:00
@click.option('--reset-cache', '-r', default=False, is_flag=True,
help='Regenerate the hash.json and location.json database ')
@click.option('--verbose', '-v', default=False, is_flag=True,
help='True if you want to see details of file processing')
@click.argument('paths', required=True, nargs=-1, type=click.Path())
2021-08-14 21:37:43 +02:00
def _sort(debug, dry_run, destination, clean, copy, exclude_regex, filter_by_ext, ignore_tags,
max_deep, remove_duplicates, reset_cache, verbose, paths):
"""Sort files or directories by reading their EXIF and organizing them
2021-08-13 21:11:24 +02:00
according to ordigi.conf preferences.
"""
if copy:
mode = 'copy'
else:
mode = 'move'
2021-08-14 21:37:43 +02:00
logger = log.get_logger(verbose, debug)
if max_deep is not None:
max_deep = int(max_deep)
cache = True
if reset_cache:
cache = False
2021-08-27 12:45:25 +02:00
if len(paths) > 1:
if not destination:
# Use last path argument as destination
destination = paths[-1]
paths = paths[0:-1]
elif paths:
# Source and destination are the same
destination = paths[0]
else:
2021-08-27 12:45:25 +02:00
logger.error(f'`ordigi sort` need at least one path argument')
sys.exit(1)
paths = set(paths)
2021-08-14 21:37:43 +02:00
filter_by_ext = set(filter_by_ext)
destination = os.path.abspath(os.path.expanduser(destination))
if not os.path.exists(destination):
logger.error(f'Directory {destination} does not exist')
config = Config(constants.CONFIG_FILE)
opt = config.get_options()
# if no exclude list was passed in we check if there's a config
if len(exclude_regex) == 0:
exclude_regex = opt['exclude_regex']
exclude_regex_list = set(exclude_regex)
# Initialize Db
db = Db(destination)
2021-08-27 12:45:25 +02:00
collection = Collection(opt['path_format'], destination, cache,
opt['day_begins'], dry_run, exclude_regex_list, filter_by_ext,
logger, max_deep, mode)
2021-08-27 12:45:25 +02:00
loc = GeoLocation(opt['geocoder'], opt['prefer_english_names'],
opt['timeout'])
2021-08-27 12:45:25 +02:00
summary, has_errors = collection.sort_files(paths, db, loc,
remove_duplicates, ignore_tags)
2021-08-14 21:37:43 +02:00
if clean:
remove_empty_folders(destination, logger)
if verbose or debug:
summary.write()
if has_errors:
sys.exit(1)
2021-08-14 21:37:43 +02:00
def remove_empty_folders(path, logger, remove_root=True):
'Function to remove empty folders'
if not os.path.isdir(path):
return
# remove empty subfolders
files = os.listdir(path)
if len(files):
for f in files:
fullpath = os.path.join(path, f)
if os.path.isdir(fullpath):
remove_empty_folders(fullpath, logger)
# if folder empty, delete it
files = os.listdir(path)
if len(files) == 0 and remove_root:
logger.info(f"Removing empty folder: {path}")
os.rmdir(path)
@click.command('clean')
@click.option('--debug', default=False, is_flag=True,
help='Override the value in constants.py with True.')
2021-08-27 12:45:25 +02:00
@click.option('--dedup-regex', '-d', default=set(), multiple=True,
help='Regex to match duplicate strings parts')
@click.option('--dry-run', default=False, is_flag=True,
help='Dry run only, no change made to the filesystem.')
@click.option('--folders', '-f', default=False, is_flag=True,
help='Remove empty folders')
@click.option('--max-deep', '-m', default=None,
help='Maximum level to proceed. Number from 0 to desired level.')
@click.option('--path-string', '-p', default=False, is_flag=True,
help='Deduplicate path string')
@click.option('--remove-duplicates', '-R', default=False, is_flag=True,
help='True to remove files that are exactly the same in name\
and a file hash')
@click.option('--root', '-r', type=click.Path(file_okay=False),
default=None, help='Root dir of media collection. If not set, use path')
@click.option('--verbose', '-v', default=False,
2021-08-14 21:37:43 +02:00
help='True if you want to see details of file processing')
@click.argument('path', required=True, nargs=1, type=click.Path())
2021-08-27 12:45:25 +02:00
def _clean(debug, dedup_regex, dry_run, folders, max_deep, path_string, remove_duplicates, root, verbose, path):
2021-08-14 21:37:43 +02:00
"""Remove empty folders
Usage: clean [--verbose|--debug] directory [removeRoot]"""
logger = log.get_logger(verbose, debug)
2021-08-27 12:45:25 +02:00
clean_all = False
if not folders:
clean_all = True
if not root:
root = path
2021-08-14 21:37:43 +02:00
2021-08-27 12:45:25 +02:00
if clean_all or folders:
remove_empty_folders(path, logger)
config = Config(constants.CONFIG_FILE)
opt = config.get_options()
if path_string:
# Initialize Db
db = Db(root)
collection = Collection(opt['path_format'], root, dry_run=dry_run, logger=logger, max_deep=max_deep, mode='move')
dedup_regex = list(dedup_regex)
summary, has_errors = collection.dedup_regex(path, dedup_regex, db, logger, remove_duplicates)
if verbose or debug:
summary.write()
if has_errors:
sys.exit(1)
2021-08-14 21:37:43 +02:00
@click.command('generate-db')
@click.option('--path', type=click.Path(file_okay=False),
required=True, help='Path of your photo library.')
@click.option('--debug', default=False, is_flag=True,
help='Override the value in constants.py with True.')
def _generate_db(path, debug):
2021-08-13 21:11:24 +02:00
"""Regenerate the hash.json database which contains all of the sha256 signatures of media files.
"""
2021-08-27 12:45:25 +02:00
# TODO
pass
@click.command('verify')
@click.option('--path', type=click.Path(file_okay=False),
required=True, help='Path of your photo library.')
@click.option('--debug', default=False, is_flag=True,
help='Override the value in constants.py with True.')
def _verify(path, debug):
2021-08-27 12:45:25 +02:00
"""Verify hashes"""
# TODO
pass
@click.command('compare')
@click.option('--debug', default=False, is_flag=True,
help='Override the value in constants.py with True.')
@click.option('--dry-run', default=False, is_flag=True,
help='Dry run only, no change made to the filesystem.')
@click.option('--find-duplicates', '-f', default=False, is_flag=True)
@click.option('--output-dir', '-o', default=False, is_flag=True, help='output\
dir')
@click.option('--remove-duplicates', '-r', default=False, is_flag=True)
@click.option('--revert-compare', '-R', default=False, is_flag=True, help='Revert\
compare')
2021-08-27 12:45:25 +02:00
@click.option('--root', '-r', type=click.Path(file_okay=False),
default=None, help='Root dir of media collection. If not set, use path')
@click.option('--similar-to', '-s', default=False, help='Similar to given\
image')
@click.option('--similarity', '-S', default=80, help='Similarity level for\
images')
@click.option('--verbose', '-v', default=False, is_flag=True,
help='True if you want to see details of file processing')
@click.argument('path', nargs=1, required=True)
def _compare(debug, dry_run, find_duplicates, output_dir, remove_duplicates,
2021-08-27 12:45:25 +02:00
revert_compare, root, similar_to, similarity, verbose, path):
'''Compare files in directories'''
2021-08-14 21:37:43 +02:00
logger = log.get_logger(verbose, debug)
2021-08-27 12:45:25 +02:00
if not root:
root = path
2021-08-27 12:45:25 +02:00
config = Config(constants.CONFIG_FILE)
opt = config.get_options()
# Initialize Db
db = Db(root)
2021-08-08 13:02:15 +02:00
2021-08-27 12:45:25 +02:00
collection = Collection(path_format, root, mode='move', dry_run=dry_run, logger=logger)
if revert_compare:
2021-08-27 12:45:25 +02:00
summary, has_errors = collection.revert_compare(path, db, dry_run)
else:
2021-08-27 12:45:25 +02:00
summary, has_errors = collection.sort_similar_images(path, db,
2021-08-13 19:24:36 +02:00
similarity)
if verbose or debug:
summary.write()
if has_errors:
sys.exit(1)
@click.group()
def main():
pass
2021-08-14 21:37:43 +02:00
main.add_command(_clean)
main.add_command(_compare)
main.add_command(_sort)
main.add_command(_generate_db)
main.add_command(_verify)
if __name__ == '__main__':
main()