diff options
| author | jules@lens <julescarbon@gmail.com> | 2019-02-16 15:19:13 +0100 |
|---|---|---|
| committer | jules@lens <julescarbon@gmail.com> | 2019-02-16 15:19:13 +0100 |
| commit | 68a3a4a479f326fc1446d565510f01cb9d6fa86b (patch) | |
| tree | 86fdaa683206ac89b75458bd5e405437946d62dd /scraper/s2-pdf-report.py | |
| parent | 1ed1e140cbdff2eb1168d35a043f67cbb897264d (diff) | |
updating doi report
Diffstat (limited to 'scraper/s2-pdf-report.py')
| -rw-r--r-- | scraper/s2-pdf-report.py | 2 |
1 file changed, 2 insertions, 0 deletions
```diff
diff --git a/scraper/s2-pdf-report.py b/scraper/s2-pdf-report.py
index cdb340f5..d9d70514 100644
--- a/scraper/s2-pdf-report.py
+++ b/scraper/s2-pdf-report.py
@@ -29,6 +29,8 @@ def s2_pdf_report():
   for fn in glob.iglob('{}/**/*.txt'.format(PDF_DIR), recursive=True):
     paper_id = fn.replace(PDF_DIR, '').split('/')[2]
     paper = load_paper(paper_id)
+    if paper is None or paper.data is None:
+      continue
     total_count += 1
     # print(paper_id)
     headings, found_abstract = read_headings(fn, paper)
```
