1 files changed, 57 insertions, 0 deletions
diff --git a/cli/app/commands/bigbigan/fetch.py b/cli/app/commands/bigbigan/fetch.py
new file mode 100644
index 0000000..5b6c102
--- /dev/null
+++ b/cli/app/commands/bigbigan/fetch.py
@@ -0,0 +1,57 @@
+import click
+
+from app.utils import click_utils
+from app.settings import app_cfg
+
+from os.path import join
+from subprocess import call
+
+@click.command('')
+# @click.option('-i', '--input', 'opt_dir_in', required=True, 
+#   help='Path to input image glob directory')
+# @click.option('-r', '--recursive', 'opt_recursive', is_flag=True)
+@click.pass_context
+def cli(ctx):
+  """
+  """
+
+  # app_cfg.MODELZOO_CFG
+  import gensim
+  
+  # from nltk.corpus import wordnet as wn
+  # synsets = wordnet.synsets("fir_tree")
+  # synonyms = [ lemma.name() for lemma in synsets[0].lemmas() ]
+
+  imagenet = Imagenet()
+
+  sentence = "The quick brown fox jumps over the lazy dog"
+  tokens = gensim.utils.simple_preprocess(sentence)
+
+class Imagenet:
+  def __init__():
+    tokens = {}
+    with open(app_cfg.FP_IMAGENET_WORDS, "r") as fp:
+      for line in fp.readlines():
+        wordnet_id, word_list = line.split('\t')
+        words = [word.trim() for word in word_list.split(',')]
+        for word in words:
+          tokens[word] = wordnet_id
+    self.tokens = tokens
+ 
+  def get_wordnet_ids_for_words(tokens):
+    # for token in tokens:
+      # if token in tokens:
+    pass
+
+  def images_from_wordnet_id(wordnet_id):
+    """
+    Given a Wordnet ID, download images for this class
+    """
+    call([
+      "python",
+      join(app_cfg.DIR_APP, "../ImageNet-Datasets-Downloader/downloader.py"),
+      '-data_root', app_cfg.FP_IMAGENET,
+      '-use_class_list', 'True',
+      '-class_list', wordnet_id,
+      '-images_per_class', app_cfg.IMAGENET_IMAGES_PER_CLASS
+    ])