summary | refs | log | tree | commit | diff
path: root/scraper/s2-fetch-doi.py
diff options
context:
space:
mode:
author: Jules Laplace <julescarbon@gmail.com> 2019-02-10 17:15:58 +0100
committer: Jules Laplace <julescarbon@gmail.com> 2019-02-10 17:15:58 +0100
commit: 7fe9d36385a2350c9c4fd5dec105e34d85fe637a (patch)
tree: 313db438bed35e4763df66df6adc89bed85e6616 /scraper/s2-fetch-doi.py
parent: 478903401f480f2284f8f534ac5ef9b99fdc0b1c (diff)
parallelize doi
Diffstat (limited to 'scraper/s2-fetch-doi.py')
-rw-r--r-- scraper/s2-fetch-doi.py 6
1 files changed, 3 insertions, 3 deletions
diff --git a/scraper/s2-fetch-doi.py b/scraper/s2-fetch-doi.py
index ae80036e..5e98d898 100644
--- a/scraper/s2-fetch-doi.py
+++ b/scraper/s2-fetch-doi.py
@@ -17,12 +17,12 @@ s2 = SemanticScholarAPI()
@click.option('--fn', '-i', default='db_paper_doi.csv', help='Filename of CSV (id, url,)')
def fetch_doi_list(fn):
lines = read_csv(fn, keys=False)
- domains = []
+ urls = []
for line in lines:
paper_id, url = line
if url:
- domain = fetch_doi(paper_id, url)
- print(domain)
+ urls.append(line)
+ parallelize(fetch_doi, urls)
print("{} papers processed".format(len(lines)))
def fetch_doi(paper_id, url, replace=False):