diff options
| author | Jules Laplace <julescarbon@gmail.com> | 2019-02-08 19:22:35 +0100 |
|---|---|---|
| committer | Jules Laplace <julescarbon@gmail.com> | 2019-02-08 19:22:35 +0100 |
| commit | 6059ce2eb68a931a4cbb12049c202c3299e4966b (patch) | |
| tree | 54713073be1c9e8b84fbe14c1b70e3d08a09b627 /scraper | |
| parent | c3ef46181d95f57f72d32e713b732e3875aafc08 (diff) | |
script to aggregate citations from multiple papers
Diffstat (limited to 'scraper')
| -rw-r--r-- | scraper/s2-final-report.py | 5 |
1 file changed, 4 insertions, 1 deletion
```diff
diff --git a/scraper/s2-final-report.py b/scraper/s2-final-report.py
index 207b7abe..a958e4bc 100644
--- a/scraper/s2-final-report.py
+++ b/scraper/s2-final-report.py
@@ -80,7 +80,10 @@ def process_single_paper(row, addresses, aggregate_citations):
   res['title'] = paper.title
   res['journal'] = paper.journal
   res['report_link'] = 'papers/{}.html'.format(paper.paper_id)
-  res['pdf_link'] = paper.pdf_link
+  pdf_link = paper.pdf_link
+  if type(pdf_link) == dict and 'url' in pdf_link:
+    pdf_link = pdf_link['url']
+  res['pdf_link'] = pdf_link
   # res['authors'] = ', '.join(paper.authors)
   # res['citations'] = []
```
