summaryrefslogtreecommitdiff
path: root/megapixels/commands/datasets/pull_spreadsheet.py
diff options
context:
space:
mode:
authoradamhrv <adam@ahprojects.com>2019-03-19 12:20:38 +0100
committeradamhrv <adam@ahprojects.com>2019-03-19 12:20:38 +0100
commit53f6e26015e65b8696ed1a6e5c74bdfef14b3ac2 (patch)
tree8bf8b0019ff604b2165bc66e3b5deaba355b46af /megapixels/commands/datasets/pull_spreadsheet.py
parent389f1f162720b577fcc652c95620eadd5e77ec43 (diff)
add cmds
Diffstat (limited to 'megapixels/commands/datasets/pull_spreadsheet.py')
-rw-r--r--megapixels/commands/datasets/pull_spreadsheet.py6
1 files changed, 3 insertions, 3 deletions
diff --git a/megapixels/commands/datasets/pull_spreadsheet.py b/megapixels/commands/datasets/pull_spreadsheet.py
index 0094ea59..b8b68094 100644
--- a/megapixels/commands/datasets/pull_spreadsheet.py
+++ b/megapixels/commands/datasets/pull_spreadsheet.py
@@ -20,7 +20,7 @@ from app.utils.logger_utils import Logger
log = Logger.getLogger()
-opt_sheets = ['datasets', 'relationships', 'funding', 'references', 'sources', 'tags', 'citations', 'legal', ]
+opt_sheets = ['datasets', 'relationships', 'funding', 'references', 'sources', 'tags', 'citations', 'legal']
@click.command()
@click.option('-n', '--name', 'opt_spreadsheets', multiple=True,
@@ -65,14 +65,14 @@ def clean_datasets_sheet_ft(df):
# clean data for FT
df = df[df['ft_share'] == 'Y']
keys = ['key', 'name_short', 'name_full', 'url', 'downloaded', 'purpose', 'wild']
- keys += ['campus', 'year_start', 'year_end', 'year_published', 'images', 'videos', 'identities', 'faces', 'youtube', 'flickr', 'google', 'bing', 'comment']
+ keys += ['campus', 'year_start', 'year_end', 'year_published', 'images', 'videos', 'identities', 'faces_or_persons', 'youtube', 'flickr', 'google', 'bing', 'comment']
return df[keys]
def clean_datasets_sheet_nyt(df):
# clean data for FT
df = df[df['ft_share'] == 'Y']
keys = ['key', 'name_short', 'name_full', 'url', 'downloaded', 'purpose', 'wild']
- keys += ['campus', 'year_start', 'year_end', 'year_published', 'images', 'videos', 'identities', 'faces', 'youtube', 'flickr', 'google', 'bing', 'comment']
+ keys += ['campus', 'year_start', 'year_end', 'year_published', 'images', 'videos', 'identities', 'faces_or_persons', 'youtube', 'flickr', 'google', 'bing', 'comment']
return df[keys]
def fetch_spreadsheet():