summary | refs | log | tree | commit | diff
path: root/scraper/s2-search.py
diff options
context:
space:
mode:
author Jules Laplace <julescarbon@gmail.com> 2018-12-16 16:29:04 +0100
committer Jules Laplace <julescarbon@gmail.com> 2018-12-16 16:29:04 +0100
commit 05fc975a313aa38483d904cb9ad07a029641d086 (patch)
tree 85f3d4fdf3688c2779d3ca3ba9c59910a48d1df9 /scraper/s2-search.py
parent 110f3a34f1f36d0ea999d4aa34bbe66d5f2a01da (diff)
rebuild
Diffstat (limited to 'scraper/s2-search.py')
-rw-r--r-- scraper/s2-search.py 20
1 files changed, 11 insertions, 9 deletions
diff --git a/scraper/s2-search.py b/scraper/s2-search.py
index 9ec20cc9..d9b1beca 100644
--- a/scraper/s2-search.py
+++ b/scraper/s2-search.py
@@ -38,22 +38,24 @@ def fetch_entries(index, refresh):
if len(clean_title) < 2:
continue
dump_fn = './datasets/s2/dumps/{}.json'.format(key)
- entry_fn = './datasets/s2/entries/{}.json'.format(key)
result = None
- if not refresh and os.path.exists(entry_fn):
- result = read_json(entry_fn)
+ if not refresh and os.path.exists(dump_fn):
+ results = read_json(dump_fn)
else:
results = s2.search(clean_title)
write_json(dump_fn, results)
- if len(results['results']) == 0:
- print("- {}".format(title))
- else:
- print("+ {}".format(title))
- result = results['results'][0]
- write_json(entry_fn, result)
+
+ if len(results['results']) == 0:
+ print("- {}".format(title))
+ else:
+ print("+ {}".format(title))
+ result = results['results'][0]
+
if result:
paper_id = result['id']
paper = fetch_paper(s2, paper_id)
+ entry_fn = './datasets/s2/entries/{}.json'.format(paper_id)
+ write_json(entry_fn, result)
citation_lookup.append([key, name, title, paper_id])
write_csv("datasets/citation_lookup.csv", keys=['key', 'name', 'title', 'paper_id'], rows=citation_lookup)