diff options
Diffstat (limited to 'scraper/s2-final-report.py')
| -rw-r--r-- | scraper/s2-final-report.py | 7 |
1 files changed, 4 insertions, 3 deletions
diff --git a/scraper/s2-final-report.py b/scraper/s2-final-report.py index f81d1835..e20b3d98 100644 --- a/scraper/s2-final-report.py +++ b/scraper/s2-final-report.py @@ -24,12 +24,14 @@ def s2_final_report(): def process_paper(row, addresses): aggregate_citations = {} papers = [] + print(row['paper_ids']) for paper_id in row['paper_ids']: - res = process_single_paper(row, addresses, aggregate_citations) + res = process_single_paper(row, paper_id, addresses, aggregate_citations) if res: papers.append(res) if not len(papers): return + print(papers) with open('{}/{}.json'.format(DIR_PUBLIC_CITATIONS, row['key']), 'w') as f: json.dump({ 'id': papers[0]['paper_id'], @@ -39,7 +41,7 @@ def process_paper(row, addresses): 'citations': [aggregate_citations[key] for key in aggregate_citations.keys()], }, f) -def process_single_paper(row, addresses, aggregate_citations): +def process_single_paper(row, paper_id, addresses, aggregate_citations): res = { 'paper_id': '', 'key': '', @@ -62,7 +64,6 @@ def process_single_paper(row, addresses, aggregate_citations): pdf_count = 0 doi_count = 0 address_count = 0 - paper_id = row['paper_id'] fn = file_path('papers', paper_id, 'paper.json') |
