2021-07-30 07:41:02 +02:00
|
|
|
#!/usr/bin/env python
|
|
|
|
|
|
|
|
import os
|
|
|
|
import re
|
|
|
|
import sys
|
|
|
|
from datetime import datetime
|
|
|
|
|
|
|
|
import click
|
|
|
|
|
2021-08-24 17:23:51 +02:00
|
|
|
from ordigi.config import Config
|
2021-08-14 21:31:37 +02:00
|
|
|
from ordigi import constants
|
|
|
|
from ordigi import log
|
2021-08-13 21:11:24 +02:00
|
|
|
from ordigi.database import Db
|
2021-08-27 12:45:25 +02:00
|
|
|
from ordigi.collection import Collection
|
2021-08-24 17:23:51 +02:00
|
|
|
from ordigi.geolocation import GeoLocation
|
2021-08-14 21:31:37 +02:00
|
|
|
from ordigi.media import Media, get_all_subclasses
|
2021-08-13 21:11:24 +02:00
|
|
|
from ordigi.summary import Summary
|
2021-07-30 07:41:02 +02:00
|
|
|
|
|
|
|
|
|
|
|
def print_help(command):
|
|
|
|
click.echo(command.get_help(click.Context(sort)))
|
|
|
|
|
|
|
|
|
|
|
|
@click.command('sort')
|
|
|
|
@click.option('--debug', default=False, is_flag=True,
|
|
|
|
help='Override the value in constants.py with True.')
|
|
|
|
@click.option('--dry-run', default=False, is_flag=True,
|
|
|
|
help='Dry run only, no change made to the filesystem.')
|
|
|
|
@click.option('--destination', '-d', type=click.Path(file_okay=False),
|
|
|
|
default=None, help='Sort files into this directory.')
|
2021-08-14 21:37:43 +02:00
|
|
|
@click.option('--clean', '-C', default=False, is_flag=True,
|
|
|
|
help='Clean empty folders')
|
2021-07-30 07:41:02 +02:00
|
|
|
@click.option('--copy', '-c', default=False, is_flag=True,
|
|
|
|
help='True if you want files to be copied over from src_dir to\
|
|
|
|
dest_dir rather than moved')
|
|
|
|
@click.option('--exclude-regex', '-e', default=set(), multiple=True,
|
|
|
|
help='Regular expression for directories or files to exclude.')
|
|
|
|
@click.option('--filter-by-ext', '-f', default=set(), multiple=True, help='''Use filename
|
|
|
|
extension to filter files for sorting. If value is '*', use
|
|
|
|
common media file extension for filtering. Ignored files remain in
|
|
|
|
the same directory structure''' )
|
|
|
|
@click.option('--ignore-tags', '-i', default=set(), multiple=True,
|
|
|
|
help='Specific tags or group that will be ignored when\
|
|
|
|
searching for file data. Example \'File:FileModifyDate\' or \'Filename\'' )
|
|
|
|
@click.option('--max-deep', '-m', default=None,
|
|
|
|
help='Maximum level to proceed. Number from 0 to desired level.')
|
2021-08-27 12:45:25 +02:00
|
|
|
@click.option('--remove-duplicates', '-R', default=False, is_flag=True,
|
2021-07-30 07:41:02 +02:00
|
|
|
help='True to remove files that are exactly the same in name\
|
|
|
|
and a file hash')
|
2021-08-27 12:45:25 +02:00
|
|
|
@click.option('--reset-cache', '-r', default=False, is_flag=True,
|
2021-07-30 07:41:02 +02:00
|
|
|
help='Regenerate the hash.json and location.json database ')
|
|
|
|
@click.option('--verbose', '-v', default=False, is_flag=True,
|
|
|
|
help='True if you want to see details of file processing')
|
|
|
|
@click.argument('paths', required=True, nargs=-1, type=click.Path())
|
2021-08-14 21:37:43 +02:00
|
|
|
def _sort(debug, dry_run, destination, clean, copy, exclude_regex, filter_by_ext, ignore_tags,
|
2021-07-30 07:41:02 +02:00
|
|
|
max_deep, remove_duplicates, reset_cache, verbose, paths):
|
|
|
|
"""Sort files or directories by reading their EXIF and organizing them
|
2021-08-13 21:11:24 +02:00
|
|
|
according to ordigi.conf preferences.
|
2021-07-30 07:41:02 +02:00
|
|
|
"""
|
|
|
|
|
|
|
|
if copy:
|
|
|
|
mode = 'copy'
|
|
|
|
else:
|
|
|
|
mode = 'move'
|
|
|
|
|
2021-08-14 21:37:43 +02:00
|
|
|
logger = log.get_logger(verbose, debug)
|
2021-07-30 07:41:02 +02:00
|
|
|
|
|
|
|
if max_deep is not None:
|
|
|
|
max_deep = int(max_deep)
|
|
|
|
|
|
|
|
cache = True
|
|
|
|
if reset_cache:
|
|
|
|
cache = False
|
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
if len(paths) > 1:
|
|
|
|
if not destination:
|
|
|
|
# Use last path argument as destination
|
|
|
|
destination = paths[-1]
|
|
|
|
paths = paths[0:-1]
|
|
|
|
elif paths:
|
|
|
|
# Source and destination are the same
|
|
|
|
destination = paths[0]
|
2021-07-30 07:41:02 +02:00
|
|
|
else:
|
2021-08-27 12:45:25 +02:00
|
|
|
logger.error(f'`ordigi sort` need at least one path argument')
|
2021-07-30 07:41:02 +02:00
|
|
|
sys.exit(1)
|
|
|
|
|
|
|
|
paths = set(paths)
|
2021-08-14 21:37:43 +02:00
|
|
|
filter_by_ext = set(filter_by_ext)
|
|
|
|
|
2021-07-30 07:41:02 +02:00
|
|
|
destination = os.path.abspath(os.path.expanduser(destination))
|
|
|
|
|
|
|
|
if not os.path.exists(destination):
|
|
|
|
logger.error(f'Directory {destination} does not exist')
|
|
|
|
|
2021-08-24 17:23:51 +02:00
|
|
|
config = Config(constants.CONFIG_FILE)
|
|
|
|
opt = config.get_options()
|
2021-07-30 07:41:02 +02:00
|
|
|
|
|
|
|
# if no exclude list was passed in we check if there's a config
|
|
|
|
if len(exclude_regex) == 0:
|
2021-08-24 17:23:51 +02:00
|
|
|
exclude_regex = opt['exclude_regex']
|
2021-07-30 07:41:02 +02:00
|
|
|
exclude_regex_list = set(exclude_regex)
|
|
|
|
|
|
|
|
# Initialize Db
|
|
|
|
db = Db(destination)
|
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
collection = Collection(opt['path_format'], destination, cache,
|
|
|
|
opt['day_begins'], dry_run, exclude_regex_list, filter_by_ext,
|
|
|
|
logger, max_deep, mode)
|
2021-08-24 17:23:51 +02:00
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
loc = GeoLocation(opt['geocoder'], opt['prefer_english_names'],
|
|
|
|
opt['timeout'])
|
2021-07-30 07:41:02 +02:00
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
summary, has_errors = collection.sort_files(paths, db, loc,
|
|
|
|
remove_duplicates, ignore_tags)
|
2021-07-30 07:41:02 +02:00
|
|
|
|
2021-08-14 21:37:43 +02:00
|
|
|
if clean:
|
|
|
|
remove_empty_folders(destination, logger)
|
|
|
|
|
2021-07-30 07:41:02 +02:00
|
|
|
if verbose or debug:
|
|
|
|
summary.write()
|
|
|
|
|
|
|
|
if has_errors:
|
|
|
|
sys.exit(1)
|
|
|
|
|
|
|
|
|
2021-08-14 21:37:43 +02:00
|
|
|
def remove_empty_folders(path, logger, remove_root=True):
|
|
|
|
'Function to remove empty folders'
|
|
|
|
if not os.path.isdir(path):
|
|
|
|
return
|
|
|
|
|
|
|
|
# remove empty subfolders
|
|
|
|
files = os.listdir(path)
|
|
|
|
if len(files):
|
|
|
|
for f in files:
|
|
|
|
fullpath = os.path.join(path, f)
|
|
|
|
if os.path.isdir(fullpath):
|
|
|
|
remove_empty_folders(fullpath, logger)
|
|
|
|
|
|
|
|
# if folder empty, delete it
|
|
|
|
files = os.listdir(path)
|
|
|
|
if len(files) == 0 and remove_root:
|
|
|
|
logger.info(f"Removing empty folder: {path}")
|
|
|
|
os.rmdir(path)
|
|
|
|
|
|
|
|
|
|
|
|
@click.command('clean')
|
|
|
|
@click.option('--debug', default=False, is_flag=True,
|
|
|
|
help='Override the value in constants.py with True.')
|
2021-08-27 12:45:25 +02:00
|
|
|
@click.option('--dedup-regex', '-d', default=set(), multiple=True,
|
|
|
|
help='Regex to match duplicate strings parts')
|
|
|
|
@click.option('--dry-run', default=False, is_flag=True,
|
|
|
|
help='Dry run only, no change made to the filesystem.')
|
|
|
|
@click.option('--folders', '-f', default=False, is_flag=True,
|
|
|
|
help='Remove empty folders')
|
|
|
|
@click.option('--max-deep', '-m', default=None,
|
|
|
|
help='Maximum level to proceed. Number from 0 to desired level.')
|
|
|
|
@click.option('--path-string', '-p', default=False, is_flag=True,
|
|
|
|
help='Deduplicate path string')
|
|
|
|
@click.option('--remove-duplicates', '-R', default=False, is_flag=True,
|
|
|
|
help='True to remove files that are exactly the same in name\
|
|
|
|
and a file hash')
|
|
|
|
@click.option('--root', '-r', type=click.Path(file_okay=False),
|
|
|
|
default=None, help='Root dir of media collection. If not set, use path')
|
|
|
|
@click.option('--verbose', '-v', default=False,
|
2021-08-14 21:37:43 +02:00
|
|
|
help='True if you want to see details of file processing')
|
|
|
|
@click.argument('path', required=True, nargs=1, type=click.Path())
|
2021-08-27 12:45:25 +02:00
|
|
|
def _clean(debug, dedup_regex, dry_run, folders, max_deep, path_string, remove_duplicates, root, verbose, path):
|
2021-08-14 21:37:43 +02:00
|
|
|
"""Remove empty folders
|
|
|
|
Usage: clean [--verbose|--debug] directory [removeRoot]"""
|
|
|
|
|
|
|
|
logger = log.get_logger(verbose, debug)
|
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
clean_all = False
|
|
|
|
if not folders:
|
|
|
|
clean_all = True
|
|
|
|
if not root:
|
|
|
|
root = path
|
2021-08-14 21:37:43 +02:00
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
if clean_all or folders:
|
|
|
|
remove_empty_folders(path, logger)
|
|
|
|
|
|
|
|
config = Config(constants.CONFIG_FILE)
|
|
|
|
opt = config.get_options()
|
|
|
|
|
|
|
|
if path_string:
|
|
|
|
# Initialize Db
|
|
|
|
db = Db(root)
|
|
|
|
collection = Collection(opt['path_format'], root, dry_run=dry_run, logger=logger, max_deep=max_deep, mode='move')
|
|
|
|
dedup_regex = list(dedup_regex)
|
|
|
|
summary, has_errors = collection.dedup_regex(path, dedup_regex, db, logger, remove_duplicates)
|
|
|
|
|
|
|
|
if verbose or debug:
|
|
|
|
summary.write()
|
|
|
|
|
|
|
|
if has_errors:
|
|
|
|
sys.exit(1)
|
2021-08-14 21:37:43 +02:00
|
|
|
|
|
|
|
|
2021-07-30 07:41:02 +02:00
|
|
|
@click.command('generate-db')
|
|
|
|
@click.option('--path', type=click.Path(file_okay=False),
|
|
|
|
required=True, help='Path of your photo library.')
|
|
|
|
@click.option('--debug', default=False, is_flag=True,
|
|
|
|
help='Override the value in constants.py with True.')
|
|
|
|
def _generate_db(path, debug):
|
2021-08-13 21:11:24 +02:00
|
|
|
"""Regenerate the hash.json database which contains all of the sha256 signatures of media files.
|
2021-07-30 07:41:02 +02:00
|
|
|
"""
|
2021-08-27 12:45:25 +02:00
|
|
|
# TODO
|
|
|
|
pass
|
2021-07-30 07:41:02 +02:00
|
|
|
|
|
|
|
|
|
|
|
@click.command('verify')
|
|
|
|
@click.option('--path', type=click.Path(file_okay=False),
|
|
|
|
required=True, help='Path of your photo library.')
|
|
|
|
@click.option('--debug', default=False, is_flag=True,
|
|
|
|
help='Override the value in constants.py with True.')
|
|
|
|
def _verify(path, debug):
|
2021-08-27 12:45:25 +02:00
|
|
|
"""Verify hashes"""
|
|
|
|
# TODO
|
|
|
|
pass
|
2021-07-30 07:41:02 +02:00
|
|
|
|
|
|
|
|
|
|
|
@click.command('compare')
|
|
|
|
@click.option('--debug', default=False, is_flag=True,
|
|
|
|
help='Override the value in constants.py with True.')
|
|
|
|
@click.option('--dry-run', default=False, is_flag=True,
|
|
|
|
help='Dry run only, no change made to the filesystem.')
|
|
|
|
@click.option('--find-duplicates', '-f', default=False, is_flag=True)
|
|
|
|
@click.option('--output-dir', '-o', default=False, is_flag=True, help='output\
|
|
|
|
dir')
|
|
|
|
@click.option('--remove-duplicates', '-r', default=False, is_flag=True)
|
|
|
|
@click.option('--revert-compare', '-R', default=False, is_flag=True, help='Revert\
|
|
|
|
compare')
|
2021-08-27 12:45:25 +02:00
|
|
|
@click.option('--root', '-r', type=click.Path(file_okay=False),
|
|
|
|
default=None, help='Root dir of media collection. If not set, use path')
|
2021-07-30 07:41:02 +02:00
|
|
|
@click.option('--similar-to', '-s', default=False, help='Similar to given\
|
|
|
|
image')
|
|
|
|
@click.option('--similarity', '-S', default=80, help='Similarity level for\
|
|
|
|
images')
|
|
|
|
@click.option('--verbose', '-v', default=False, is_flag=True,
|
|
|
|
help='True if you want to see details of file processing')
|
|
|
|
@click.argument('path', nargs=1, required=True)
|
|
|
|
def _compare(debug, dry_run, find_duplicates, output_dir, remove_duplicates,
|
2021-08-27 12:45:25 +02:00
|
|
|
revert_compare, root, similar_to, similarity, verbose, path):
|
2021-07-30 07:41:02 +02:00
|
|
|
'''Compare files in directories'''
|
|
|
|
|
2021-08-14 21:37:43 +02:00
|
|
|
logger = log.get_logger(verbose, debug)
|
2021-07-30 07:41:02 +02:00
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
if not root:
|
|
|
|
root = path
|
2021-07-30 07:41:02 +02:00
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
config = Config(constants.CONFIG_FILE)
|
|
|
|
opt = config.get_options()
|
|
|
|
|
|
|
|
# Initialize Db
|
|
|
|
db = Db(root)
|
2021-08-08 13:02:15 +02:00
|
|
|
|
2021-08-27 12:45:25 +02:00
|
|
|
collection = Collection(path_format, root, mode='move', dry_run=dry_run, logger=logger)
|
2021-07-30 07:41:02 +02:00
|
|
|
|
|
|
|
if revert_compare:
|
2021-08-27 12:45:25 +02:00
|
|
|
summary, has_errors = collection.revert_compare(path, db, dry_run)
|
2021-07-30 07:41:02 +02:00
|
|
|
else:
|
2021-08-27 12:45:25 +02:00
|
|
|
summary, has_errors = collection.sort_similar_images(path, db,
|
2021-08-13 19:24:36 +02:00
|
|
|
similarity)
|
2021-07-30 07:41:02 +02:00
|
|
|
|
|
|
|
if verbose or debug:
|
|
|
|
summary.write()
|
|
|
|
|
|
|
|
if has_errors:
|
|
|
|
sys.exit(1)
|
|
|
|
|
|
|
|
|
|
|
|
@click.group()
|
|
|
|
def main():
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
2021-08-14 21:37:43 +02:00
|
|
|
main.add_command(_clean)
|
2021-07-30 07:41:02 +02:00
|
|
|
main.add_command(_compare)
|
|
|
|
main.add_command(_sort)
|
|
|
|
main.add_command(_generate_db)
|
|
|
|
main.add_command(_verify)
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
2021-08-08 11:55:38 +02:00
|
|
|
main()
|