diff options
| author | Jules Laplace <julescarbon@gmail.com> | 2018-11-02 21:35:09 +0100 |
|---|---|---|
| committer | Jules Laplace <julescarbon@gmail.com> | 2018-11-02 21:35:09 +0100 |
| commit | 1a5effec286e4753dfdd8e8279abbbdf1ce8e0d2 (patch) | |
| tree | 1136e5231a758b8503785a2be66b558510ea2ea6 /fetch-entries.py | |
| parent | ec63582b349eaa23a9e22fc160ab3a3d621c4f47 (diff) | |
s2 scripts
Diffstat (limited to 'fetch-entries.py')
| -rw-r--r-- | fetch-entries.py | 44 |
1 files changed, 0 insertions, 44 deletions
```diff
diff --git a/fetch-entries.py b/fetch-entries.py
deleted file mode 100644
index e206b058..00000000
--- a/fetch-entries.py
+++ /dev/null
@@ -1,44 +0,0 @@
-import os
-import sys
-import csv
-import subprocess
-import time
-import random
-import re
-import click
-
-@click.command()
-@click.option('--index', '-n', default=1, help='Index of CSV.')
-def fetch_entries(index):
-  keys, lines = read_citation_list(index)
-
-  for line in lines:
-    label = line[0]
-    title = line[1]
-    entries_fn = './datasets/scholar/entries/{}.csv'.format(title)
-    # print(entries_fn)
-    if not os.path.exists(entries_fn):
-      with open(entries_fn, 'w') as f:
-        t = re.sub(r'[^-0-9a-zA-Z ]+', '', title)
-        print(t)
-        subprocess.call([
-          './vendor/scholar.py',
-          '-t', '-A', t, '--csv',
-        ], stdout=f)
-      time.sleep(random.randint(30, 60))
-
-
-def read_citation_list(index):
-  filename = './datasets/citations.csv'
-  # fn, ext = os.path.splitext(filename)
-  # in_fn = fn + '-' + str(index) + ext
-  # with open(in_fn, 'r') as f:
-  with open(filename, 'r') as f:
-    reader = csv.reader(f)
-    lines = list(reader)
-    keys = lines[0]
-    lines = lines[1:]
-    return keys, lines
-
-if __name__ == '__main__':
-  fetch_entries()
```
