Last active
May 23, 2018 09:55
-
-
Save an0th3rhuman/bc73b2104cf48e3290a95f1b5942b659 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import argparse | |
import gzip | |
import os | |
import shutil | |
import sys | |
import threading | |
def parse_input(): | |
parser = argparse.ArgumentParser() | |
parser.add_argument('-target', nargs=1, required=True, | |
help='Target Backup folder') | |
parser.add_argument('-source', nargs='+', required=True, | |
help='Source Files to be added') | |
parser.add_argument('-compress', nargs=1, type=int, | |
help='Gzip threshold in bytes', default=[100000]) | |
# no input means show me the help | |
if len(sys.argv) == 1: | |
parser.print_help() | |
sys.exit() | |
return parser.parse_args() | |
def size_if_newer(source, target): | |
""" If newer it returns size, otherwise it returns False """ | |
src_stat = os.stat(source) | |
try: | |
target_ts = os.stat(target).st_mtime | |
except FileNotFoundError: | |
try: | |
target_ts = os.stat(target + '.gz').st_mtime | |
except FileNotFoundError: | |
target_ts = 0 | |
# The time difference of one second is necessary since subsecond accuracy | |
# of os.st_mtime is striped by copy2 | |
return src_stat.st_size if (src_stat.st_mtime - target_ts > 1) else False | |
def threaded_sync_file(source, target, compress): | |
size = size_if_newer(source, target) | |
if size: | |
thread = threading.Thread(target=transfer_file, | |
args=(source, target, size > compress)) | |
thread.start() | |
return thread | |
def sync_file(source, target, compress): | |
size = size_if_newer(source, target) | |
if size: | |
transfer_file(source, target, size > compress) | |
def transfer_file(source, target, compress): | |
""" Either copy or compress and copies the file """ | |
try: | |
if compress: | |
with gzip.open(target + '.gz', 'wb') as target_fid: | |
with open(source, 'rb') as source_fid: | |
target_fid.writelines(source_fid) | |
print('Compress {}'.format(source)) | |
else: | |
shutil.copy2(source, target) | |
print('Copy {}'.format(source)) | |
except FileNotFoundError: | |
os.makedirs(os.path.dirname(target)) | |
transfer_file(source, target, compress) | |
def sync_root(root, arg): | |
target = arg.target[0] | |
compress = arg.compress[0] | |
threads = [] | |
for path, _, files in os.walk(root): | |
for source in files: | |
source = path + '/' + source | |
threads.append(threaded_sync_file(source, | |
target + source, compress)) | |
# sync_file(source, target + source, compress) | |
for thread in threads: | |
thread.join() | |
if __name__ == '__main__': | |
arg = parse_input() | |
print('### Start copy ####') | |
for root in arg.source: | |
sync_root(root, arg) | |
print('### Done ###') |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment