diff options
Diffstat (limited to 's2-fetch-doi.py')
| -rw-r--r-- | s2-fetch-doi.py | 8 |
1 files changed, 5 insertions, 3 deletions
diff --git a/s2-fetch-doi.py b/s2-fetch-doi.py index cd1d7999..4ca0119d 100644 --- a/s2-fetch-doi.py +++ b/s2-fetch-doi.py @@ -20,7 +20,9 @@ def fetch_doi_list(fn): domains = [] for line in lines: paper_id, url = line - domain = fetch_doi(paper_id, url) + if url: + domain = fetch_doi(paper_id, url) + print(domain) print("{} papers processed".format(len(lines))) def fetch_doi(paper_id, url): @@ -30,12 +32,12 @@ def fetch_doi(paper_id, url): txt_fn = make_txt_fn(paper_id) if os.path.exists(doi_fn) or os.path.exists(txt_fn): # return read_json(doi_fn) - return + return None, None size, final_url = s2.fetch_doi(url, doi_fn) if size is None: print("{} empty?".format(paper_id)) time.sleep(random.randint(2, 5)) - return None + return None, None print("{} {} kb".format(paper_id, int(size / 1024))) domain = urlparse(final_url).netloc write_json(url_fn, { |
