From b28f65ad5016ba3c3c9f973bd2a64ea3c8a3f84c Mon Sep 17 00:00:00 2001 From: Jules Laplace Date: Mon, 18 Feb 2019 13:28:06 +0100 Subject: get institutions from spreadsheet --- scraper/util.py | 25 +++++++++++++++++++++++-- 1 file changed, 23 insertions(+), 2 deletions(-) (limited to 'scraper/util.py') diff --git a/scraper/util.py b/scraper/util.py index 899089f7..4a43a913 100644 --- a/scraper/util.py +++ b/scraper/util.py @@ -338,8 +338,29 @@ class AddressBook (object): } return None - -def load_institutions(paperId): +def load_institutions(paperId, paper_location_lookup={}): + if paperId in paper_location_lookup: + items = paper_location_lookup[paperId] + result = [] + if items['institution_1']: + result.append([items['institution_1'], '', '']) + if items['institution_2']: + result.append([items['institution_2'], '', '']) + if items['institution_3']: + result.append([items['institution_3'], '', '']) + if items['institution_4']: + result.append([items['institution_4'], '', '']) + if items['institution_5']: + result.append([items['institution_5'], '', '']) + if items['institution_6']: + result.append([items['institution_6'], '', '']) + if items['institution_7']: + result.append([items['institution_7'], '', '']) + if items['institution_8']: + result.append([items['institution_8'], '', '']) + return { + 'institutions': result + } if os.path.exists(file_path('pdf', paperId, 'institutions.json')): return read_json(file_path('pdf', paperId, 'institutions.json'))['institutions'] elif os.path.exists(file_path('doi', paperId, 'institutions.json')): -- cgit v1.2.3-70-g09d2