diff options
Diffstat (limited to 'scraper/s2-final-report.py')
| -rw-r--r-- | scraper/s2-final-report.py | 5 |
1 file changed, 3 insertions, 2 deletions
diff --git a/scraper/s2-final-report.py b/scraper/s2-final-report.py index f08bc748..eff9a736 100644 --- a/scraper/s2-final-report.py +++ b/scraper/s2-final-report.py @@ -12,6 +12,7 @@ DIR_PUBLIC_CITATIONS = "../site/datasets/final" DIR_UNKNOWN_CITATIONS = "../site/datasets/unknown" addresses = AddressBook() +paper_location_lookup = fetch_google_lookup('paper_locations') @click.command() def s2_final_report(): @@ -90,7 +91,7 @@ def process_single_paper(row, paper_id, addresses, aggregate_citations, unknown_ # res['authors'] = ', '.join(paper.authors) # res['citations'] = [] - paper_institutions = load_institutions(paper.paper_id) + paper_institutions = load_institutions(paper.paper_id, paper_location_lookup) paper_address = None for inst in sorted(paper_institutions, key=operator.itemgetter(1)): # print(inst[1]) @@ -119,7 +120,7 @@ def process_single_paper(row, paper_id, addresses, aggregate_citations, unknown_ if citation is None or citation.data is None: print("Citation missing! {}".format(cite['paperId'])) continue - institutions = load_institutions(citationId) + institutions = load_institutions(citationId, paper_location_lookup) geocoded_addresses = [] geocoded_institutions = [] institution = '' |
