index
:
megapixels_dev.git
master
Unnamed repository; edit this file 'description' to name the repository.
git daemon user
summary
refs
log
tree
commit
diff
log msg
author
committer
range
path:
root
/
scraper
Mode
Name
Size
-rw-r--r--
.gitignore
111
log
plain
-rw-r--r--
README.md
5070
log
plain
-rw-r--r--
__init__.py
0
log
plain
-rw-r--r--
check-counts.py
888
log
plain
d---------
client
351
log
plain
-rw-r--r--
content-script.crx
26845
log
plain
-rw-r--r--
content-script.pem
1708
log
plain
d---------
content-script
471
log
plain
d---------
datasets
272
log
plain
-rw-r--r--
db_paper_doi.csv
2446622
log
plain
-rw-r--r--
db_paper_pdf.csv
3586062
log
plain
-rw-r--r--
db_paper_pdf_list.csv
8536115
log
plain
-rw-r--r--
expand-uni-lookup.py
1033
log
plain
-rw-r--r--
ids.json
1603624
log
plain
-rw-r--r--
missing.csv
68376
log
plain
-rw-r--r--
pdf_dump_all.sh
380
log
plain
-rw-r--r--
pdf_dump_first_page.sh
300
log
plain
d---------
reports
1935
log
plain
-rw-r--r--
requirements.txt
35
log
plain
-rw-r--r--
s2-citation-report.py
12377
log
plain
-rw-r--r--
s2-doi-report.py
9210
log
plain
-rw-r--r--
s2-dump-db-pdf-urls.py
3558
log
plain
-rw-r--r--
s2-dump-ids.py
736
log
plain
-rw-r--r--
s2-dump-missing-paper-ids.py
1270
log
plain
-rw-r--r--
s2-extract-papers.py
1590
log
plain
-rw-r--r--
s2-extract-pdf-txt.py
693
log
plain
-rw-r--r--
s2-fetch-doi.py
2083
log
plain
-rw-r--r--
s2-fetch-google-sheet.py
70
log
plain
-rw-r--r--
s2-fetch-pdf.py
1248
log
plain
-rw-r--r--
s2-final-report.py
5991
log
plain
-rw-r--r--
s2-geocode-server.py
1649
log
plain
-rw-r--r--
s2-geocode-spreadsheet.py
2467
log
plain
-rw-r--r--
s2-geocode.py
2352
log
plain
-rw-r--r--
s2-merge-csv.py
664
log
plain
-rw-r--r--
s2-papers.py
2681
log
plain
-rw-r--r--
s2-pdf-first-pages.py
4164
log
plain
-rw-r--r--
s2-pdf-report.py
3814
log
plain
-rw-r--r--
s2-raw-papers.py
1174
log
plain
-rw-r--r--
s2-scrape.sh
384
log
plain
-rw-r--r--
s2-search.py
1607
log
plain
-rw-r--r--
s2-tar-papers.sh
219
log
plain
-rw-r--r--
s2.py
6609
log
plain
d---------
samples
185
log
plain
-rw-r--r--
scholar-fetch.py
1086
log
plain
-rw-r--r--
split-csv.py
1263
log
plain
-rw-r--r--
util.py
11089
log
plain
d---------
vendor
38
log
plain