diff options
| author | Jules Laplace <julescarbon@gmail.com> | 2018-12-07 22:05:55 +0100 |
|---|---|---|
| committer | Jules Laplace <julescarbon@gmail.com> | 2018-12-07 22:05:55 +0100 |
| commit | 61c2add5fe0cb914f09ab33e63ce801002d59c86 (patch) | |
| tree | 8d77733cc767d34d31f9e78110947f7cb4cf3791 /scraper/s2-dump-db-pdf-urls.py | |
| parent | ddafbb5da870aa7a3cd1e1efda3671f1a0595968 (diff) | |
s2-dump-db-pdf-urls.py
Diffstat (limited to 'scraper/s2-dump-db-pdf-urls.py')
| -rw-r--r-- | scraper/s2-dump-db-pdf-urls.py | 2 |
1 file changed, 1 insertion, 1 deletion
```diff
diff --git a/scraper/s2-dump-db-pdf-urls.py b/scraper/s2-dump-db-pdf-urls.py
index 608248e9..ae8faede 100644
--- a/scraper/s2-dump-db-pdf-urls.py
+++ b/scraper/s2-dump-db-pdf-urls.py
@@ -21,7 +21,7 @@ def s2_dump_pdf_urls():
   domains = {}
   pdf = []
   doi = []
-  for fn in glob.iglob('./datasets/s2/*_paper/**/paper.json', recursive=True):
+  for fn in glob.iglob('./datasets/s2/*_papers/**/paper.json', recursive=True):
     if 'db_paper' in fn:
       row = process_db_paper(fn)
     elif 'raw_paper' in fn:
```
