summary | refs | log | tree | commit | diff
path: root/scraper/util.py
diff options
context:
space:
mode:
author: Jules Laplace <julescarbon@gmail.com> 2019-03-28 17:25:28 +0100
committer: Jules Laplace <julescarbon@gmail.com> 2019-03-28 17:25:28 +0100
commit: fd4faf7fb94e7b5cbcf5e232d1fd08822e8825bb (patch)
tree: 060e7ff9b25402e90eb3cab078193155e60b1fcf /scraper/util.py
parent: 7347fb5a2a8b966b9dce79d97a5d2bdf3c6557d1 (diff)
build verified citations report
Diffstat (limited to 'scraper/util.py')
-rw-r--r-- scraper/util.py 14
1 files changed, 14 insertions, 0 deletions
diff --git a/scraper/util.py b/scraper/util.py
index 96ced430..ad7b1f4d 100644
--- a/scraper/util.py
+++ b/scraper/util.py
@@ -452,6 +452,20 @@ def fetch_google_lookup(name, item_key='key'):
lookup[rec[item_key]] = rec
return lookup
def fetch_verified_paper_lookup():
    """Build a nested lookup of verified papers from the 'verifications' sheet.

    Returns a dict keyed by dataset name. Each value is a dict mapping
    paper_id to the full row record (column name -> cell value). Every
    dataset that appears in the sheet gets an entry (possibly empty), but
    only rows whose 'uses_dataset' cell stringifies to '1' are stored.
    """
    columns, sheet_rows = fetch_google_sheet('verifications')
    papers_by_dataset = {}
    for cells in sheet_rows:
        # Index by position (not zip) so a row shorter than the header
        # raises IndexError instead of being silently truncated.
        record = {column: cells[pos] for pos, column in enumerate(columns)}
        # Register the dataset even when this row turns out not to count.
        dataset_papers = papers_by_dataset.setdefault(record['dataset'], {})
        if str(record['uses_dataset']) != '1':
            continue
        dataset_papers[record['paper_id']] = record
    return papers_by_dataset
+
def update_or_append_worksheet(name, form):
worksheet = fetch_worksheet(name)
keys = worksheet.row_values(1)