diff options
| author | jules@lens <julescarbon@gmail.com> | 2019-02-20 18:36:25 +0100 |
|---|---|---|
| committer | jules@lens <julescarbon@gmail.com> | 2019-02-20 18:36:25 +0100 |
| commit | 2116027843edad22d87e6a56269b26cd6aafb8e8 (patch) | |
| tree | ae15c70898a3ee28668a154ccdc1e600af51834c /scraper/s2-citation-report.py | |
| parent | 1ef0b07c0bbd779f3ab9b618a0edb768b927816e (diff) | |
updating all reports
Diffstat (limited to 'scraper/s2-citation-report.py')
| -rw-r--r-- | scraper/s2-citation-report.py | 7 |
1 file changed, 6 insertions, 1 deletion
```diff
diff --git a/scraper/s2-citation-report.py b/scraper/s2-citation-report.py
index e4e41478..c515ec37 100644
--- a/scraper/s2-citation-report.py
+++ b/scraper/s2-citation-report.py
@@ -184,6 +184,10 @@ def process_paper(row, addresses, success):
   address_count = 0
 
   fn = file_path('papers', row['paper_id'], 'paper.json')
+  if not os.path.exists(fn):
+    print("not found: {}".format(fn))
+    print(row)
+    return
   with open(fn, 'r') as f:
     data = json.load(f)
 
@@ -364,7 +368,8 @@ def load_megapixels_queries():
     rec = {}
     for index, key in enumerate(keys):
       rec[key] = row[index]
-    recs.append(rec)
+    if rec['verified'] == '1':
+      recs.append(rec)
   return recs
 
 #def load_institutions(paperId):
```
