diff options
| author | adamhrv <adam@ahprojects.com> | 2019-03-08 21:56:41 +0100 |
|---|---|---|
| committer | adamhrv <adam@ahprojects.com> | 2019-03-08 21:56:41 +0100 |
| commit | 69c4157f599846173362d2a450f58b5f58c0d8d8 (patch) | |
| tree | 342e4e295820f6daaa130032fdb10bdf4ee1f2b7 /scraper/s2-papers.py | |
| parent | 5bcbb24791062b6524c06e2bf2bd4a61965ba6e8 (diff) | |
| parent | 377279bd1fb43d8752f7a664fe0f5c2ae20c0bc3 (diff) | |
Merge branch 'master' of github.com:adamhrv/megapixels_dev
Diffstat (limited to 'scraper/s2-papers.py')
| -rw-r--r-- | scraper/s2-papers.py | 10 |
1 file changed, 8 insertions, 2 deletions
```diff
diff --git a/scraper/s2-papers.py b/scraper/s2-papers.py
index 782dc198..ef7d3d81 100644
--- a/scraper/s2-papers.py
+++ b/scraper/s2-papers.py
@@ -9,11 +9,15 @@ import operator
 import click
 from s2 import SemanticScholarAPI
 from util import *
+from urllib.parse import unquote
+import importlib
+raw_papers_api = importlib.import_module('s2-raw-papers')
 s2 = SemanticScholarAPI()
 @click.command()
-def fetch_papers():
+@click.option('--freshen/--no-freshen', '-f', help='Force it to query the paper API again')
+def fetch_papers(freshen):
   addresses = AddressBook()
   lookup_keys, lines = fetch_google_sheet('citation_lookup')
   report_keys = [
@@ -30,9 +34,11 @@ def fetch_papers():
     paper_id = line[3]
     if paper_id == '':
       continue
-    paper = fetch_paper(s2, paper_id)
+    paper = fetch_paper(s2, paper_id, freshen)
     if paper is None:
       continue
+    if freshen:
+      raw_papers_api.fetch_raw_paper(paper_id, freshen)
     db_paper = load_paper(paper_id)
     pdf_link = db_paper.pdf_link if db_paper else ""
```
