diff options
| author | Jules Laplace <julescarbon@gmail.com> | 2018-11-03 18:10:49 +0100 |
|---|---|---|
| committer | Jules Laplace <julescarbon@gmail.com> | 2018-11-03 18:10:49 +0100 |
| commit | 723f339cd33288813fb3106b55233c1d1429d481 (patch) | |
| tree | 6c091cc787c0f3ba485d4b9d8cf2a61422deb49a /s2-extract-papers.py | |
| parent | 753e41d819030a62418705fc4484d9303e3e1a00 (diff) | |
| parent | c6f3973534d861d61939b691f1b8c697369f069c (diff) | |
Merge branch 'master' of asdf.us:megapixels_dev
Diffstat (limited to 's2-extract-papers.py')
| -rw-r--r-- | s2-extract-papers.py | 6 |
1 file changed, 6 insertions, 0 deletions
```diff
diff --git a/s2-extract-papers.py b/s2-extract-papers.py
index e84ffd0f..00301433 100644
--- a/s2-extract-papers.py
+++ b/s2-extract-papers.py
@@ -34,10 +34,16 @@ def process_paper(line, ids):
 def load_id_lookup(fn):
     lookup = {}
     ids = read_json(fn)
+    skip_count = 0
+    save_count = 0
     for paper_id in ids:
         path = paper_path(paper_id)
         if not os.path.exists(path):
             lookup[paper_id] = True
+            save_count += 1
+        else:
+            skip_count += 1
+    print("finding {} ids ({} already pulled)".format(save_count, skip_count))
     return lookup
 
 def paper_path(paper_id):
```
