summary | refs | log | tree | commit | diff
path: root/scraper/s2-final-report.py
diff options
context:
space:
mode:
author: Jules Laplace <julescarbon@gmail.com> 2019-02-18 13:28:06 +0100
committer: Jules Laplace <julescarbon@gmail.com> 2019-02-18 13:28:06 +0100
commit: b28f65ad5016ba3c3c9f973bd2a64ea3c8a3f84c (patch)
tree: 66cd5ba28f0b3687871d4f7f65078329463fd00c /scraper/s2-final-report.py
parent: 98d7c92f0050ca92ec6b72758a6d5b680f9e4d7f (diff)
get institutions from spreadsheet
Diffstat (limited to 'scraper/s2-final-report.py')
-rw-r--r-- scraper/s2-final-report.py | 5
1 file changed, 3 insertions, 2 deletions
diff --git a/scraper/s2-final-report.py b/scraper/s2-final-report.py
index f08bc748..eff9a736 100644
--- a/scraper/s2-final-report.py
+++ b/scraper/s2-final-report.py
@@ -12,6 +12,7 @@ DIR_PUBLIC_CITATIONS = "../site/datasets/final"
DIR_UNKNOWN_CITATIONS = "../site/datasets/unknown"
addresses = AddressBook()
+paper_location_lookup = fetch_google_lookup('paper_locations')
@click.command()
def s2_final_report():
@@ -90,7 +91,7 @@ def process_single_paper(row, paper_id, addresses, aggregate_citations, unknown_
# res['authors'] = ', '.join(paper.authors)
# res['citations'] = []
- paper_institutions = load_institutions(paper.paper_id)
+ paper_institutions = load_institutions(paper.paper_id, paper_location_lookup)
paper_address = None
for inst in sorted(paper_institutions, key=operator.itemgetter(1)):
# print(inst[1])
@@ -119,7 +120,7 @@ def process_single_paper(row, paper_id, addresses, aggregate_citations, unknown_
if citation is None or citation.data is None:
print("Citation missing! {}".format(cite['paperId']))
continue
- institutions = load_institutions(citationId)
+ institutions = load_institutions(citationId, paper_location_lookup)
geocoded_addresses = []
geocoded_institutions = []
institution = ''