From b248ce4f21a94e4d081d93328961aca5942ac8f0 Mon Sep 17 00:00:00 2001 From: Jules Laplace Date: Sun, 10 Feb 2019 16:16:24 +0100 Subject: citation files --- scraper/s2-final-report.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) (limited to 'scraper/s2-final-report.py') diff --git a/scraper/s2-final-report.py b/scraper/s2-final-report.py index f81d1835..e20b3d98 100644 --- a/scraper/s2-final-report.py +++ b/scraper/s2-final-report.py @@ -24,12 +24,14 @@ def s2_final_report(): def process_paper(row, addresses): aggregate_citations = {} papers = [] + print(row['paper_ids']) for paper_id in row['paper_ids']: - res = process_single_paper(row, addresses, aggregate_citations) + res = process_single_paper(row, paper_id, addresses, aggregate_citations) if res: papers.append(res) if not len(papers): return + print(papers) with open('{}/{}.json'.format(DIR_PUBLIC_CITATIONS, row['key']), 'w') as f: json.dump({ 'id': papers[0]['paper_id'], @@ -39,7 +41,7 @@ def process_paper(row, addresses): 'citations': [aggregate_citations[key] for key in aggregate_citations.keys()], }, f) -def process_single_paper(row, addresses, aggregate_citations): +def process_single_paper(row, paper_id, addresses, aggregate_citations): res = { 'paper_id': '', 'key': '', @@ -62,7 +64,6 @@ def process_single_paper(row, addresses, aggregate_citations): pdf_count = 0 doi_count = 0 address_count = 0 - paper_id = row['paper_id'] fn = file_path('papers', paper_id, 'paper.json') -- cgit v1.2.3-70-g09d2