diff options
Diffstat (limited to 'scraper/s2-papers.py')
| -rw-r--r-- | scraper/s2-papers.py | 5 |
1 file changed, 4 insertions, 1 deletion
diff --git a/scraper/s2-papers.py b/scraper/s2-papers.py
index 2e382900..8f318d57 100644
--- a/scraper/s2-papers.py
+++ b/scraper/s2-papers.py
@@ -17,7 +17,8 @@ s2 = SemanticScholarAPI()
 
 @click.command()
 @click.option('--freshen/--no-freshen', '-f', help='Force it to query the paper API again')
-def fetch_papers(freshen):
+@click.option('--dataset', '-d', default=None, help='Specific dataset to query')
+def fetch_papers(freshen, dataset):
     addresses = AddressBook()
     lookup_keys, lines = fetch_google_sheet('citation_lookup')
     report_keys = [
@@ -32,6 +33,8 @@ def fetch_papers(freshen):
         name = line[1]
         title = line[2]
         paper_id = line[3]
+        if dataset is not None and dataset != key:
+            continue
         if paper_id == '':
             continue
         paper = fetch_paper(s2, paper_id, freshen)
