-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathhasher.py
91 lines (73 loc) · 2.39 KB
/
hasher.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
#!/usr/bin/env python
"""
Goal: Implement the entry point for the hash generator
@authors:
Andrei Sura <sura.andrei@gmail.com>
"""
import os
import sys
import time
import argparse
from datetime import timedelta
from multiprocessing import freeze_support
from onefl import logutils
from onefl.config import Config
from onefl.hash_generator import HashGenerator
from onefl.normalized_patient import NormalizedPatient
from onefl.version import __version__
logger = logutils.get_a_logger(__file__)
# The config file is looked up relative to this "root" folder
ROOT_PATH = '.'
DEFAULT_SETTINGS_FILE = 'config/settings_hasher.py'
def main():
"""
Configure the logger object and read the command line arguments
for invoking the generator.
.. seealso::
:meth:`HashGenerator.generate`
"""
HashGenerator.configure_logger(logger)
NormalizedPatient.configure_logger(logger)
parser = argparse.ArgumentParser()
parser.add_argument("-v", "--version",
default=False,
action='store_true',
help="Show the version number")
parser.add_argument("-c", "--config",
default=DEFAULT_SETTINGS_FILE,
help="Application config file")
parser.add_argument(
'-i', '--inputdir',
# required=True,
default='.',
help='input directory name')
parser.add_argument(
'-o', '--outputdir',
# required=True,
default='.',
help='output directory name')
parser.add_argument(
'-a', '--ask', action='store_true', default=False,
help='ask for confirmation to proceed')
args = parser.parse_args()
if args.version:
import sys
print("deduper, version {}".format(__version__))
sys.exit()
config = Config(root_path=ROOT_PATH, defaults={})
config.from_pyfile(args.config)
start = time.monotonic()
success = HashGenerator.generate(config,
args.inputdir,
args.outputdir,
args.ask)
end = time.monotonic()
elapsed = (end - start)
if success:
logger.info("Done. Process duration: {}"
.format(str(timedelta(seconds=elapsed))))
else:
logger.error("Failed!")
if __name__ == '__main__':
freeze_support()
main()