summary | refs | log | tree | commit | diff
path: root/scraper/util.py
diff options
context:
space:
mode:
Diffstat (limited to 'scraper/util.py')
-rw-r--r-- scraper/util.py 6
1 files changed, 4 insertions, 2 deletions
diff --git a/scraper/util.py b/scraper/util.py
index 65194fd1..05b01fa7 100644
--- a/scraper/util.py
+++ b/scraper/util.py
@@ -308,7 +308,10 @@ class AddressBook (object):
for index, line in enumerate(data):
if line[0] == line[1] or line[0] not in entities:
entities[line[0]] = index
- name = line[1].lower().strip()
+ name = line[0].lower().strip().strip(string.digits)
+ if name not in lookup:
+ lookup[name] = line[0]
+ name = line[1].lower().strip().strip(string.digits)
if name not in lookup:
lookup[name] = line[0]
self.data = data
@@ -347,7 +350,6 @@ def load_institutions(paperId, paper_location_lookup={}):
if paperId in paper_location_lookup:
items = paper_location_lookup[paperId]
result = []
- print(items)
if items['validate_1'] is True or items['validate_1'] == 'TRUE':
result.append(['', items['institution_1'], '', ''])
if items['validate_2'] is True or items['validate_2'] == 'TRUE':