summary | refs | log | tree | commit | diff
path: root/megapixels/commands/datasets/download_images.py
diff options
context:
space:
mode:
author adamhrv <adam@ahprojects.com> 2019-09-08 21:32:10 +0200
committer adamhrv <adam@ahprojects.com> 2019-09-08 21:32:10 +0200
commit aed339c29abce0fad683736622c20427da8ad3a6 (patch)
tree d1999418ddf276f36473c828561e02279a809e9b /megapixels/commands/datasets/download_images.py
parent 48d181774888206434d8096770022532bd09af87 (diff)
add flickr search
Diffstat (limited to 'megapixels/commands/datasets/download_images.py')
-rw-r--r-- megapixels/commands/datasets/download_images.py 8
1 files changed, 5 insertions, 3 deletions
diff --git a/megapixels/commands/datasets/download_images.py b/megapixels/commands/datasets/download_images.py
index 45ca8f6e..f2fdfb8f 100644
--- a/megapixels/commands/datasets/download_images.py
+++ b/megapixels/commands/datasets/download_images.py
@@ -10,8 +10,10 @@ import click
help='Number of threads')
@click.option('--wayback', 'opt_wayback', is_flag=True, default=False,
help='Check Wayback archive for URL and download cached image')
+@click.option('--url', 'opt_key_url', default='url', help='Field name for URL', show_default=True)
+@click.option('--filepath', 'opt_key_filepath', default='filepath', help='Field name for filepath', show_default=True)
@click.pass_context
-def cli(ctx, opt_fp_in, opt_fp_out, opt_threads, opt_wayback):
+def cli(ctx, opt_fp_in, opt_fp_out, opt_threads, opt_key_filepath, opt_key_url, opt_wayback):
"""Threaded image downloader"""
"""
@@ -69,11 +71,11 @@ def cli(ctx, opt_fp_in, opt_fp_out, opt_threads, opt_wayback):
pool_items = []
log.debug(f'Initializing multithreaded pool...')
for x in tqdm(records):
- fp_dst = join(opt_fp_out, x['filepath'])
+ fp_dst = join(opt_fp_out, x[opt_key_filepath])
fp_dst_is_file = Path(fp_dst).is_file()
fp_dst_is_err = Path(f'{fp_dst}_error.txt').is_file()
if not fp_dst_is_file and not fp_dst_is_err:
- pool_items.append({'url':x['url'], 'filepath': fp_dst, 'opt_wayback': opt_wayback})
+ pool_items.append({'url':x[opt_key_url], 'filepath': fp_dst, 'opt_wayback': opt_wayback})
num_items = len(pool_items)
log.info(f'Going to download {num_items:,} files')