summaryrefslogtreecommitdiff
path: root/app/client/dataset/dataset.loader.js
blob: f6b8d211aa585b4436fb31a74d8d7ca6ca8f4e0a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
import actions from '../actions'

const unsortedFolders = {}

export const unsortedFolder = (module, instantiate=false) => {
  if (!unsortedFolders[module] || instantiate) {
    const folder = {
      id: 0,
      module,
      name: 'unsorted',
      files: [],
      datasets: [],
    }
    unsortedFolders[module] = folder
  }
  return unsortedFolders[module]
}

export const emptyDataset = (module, datasetLookup, name, folder) => {
  const dataset = {
    name,
    input: [],
    checkpoints: [],
    output: [],
  }
  datasetLookup[name] = dataset
  folder = folder || unsortedFolder(module)
  folder.datasets.push(name)
  return dataset
}

export const getDataset = (module, datasetLookup, name, folder, date) => {
  let dataset = datasetLookup[name] || emptyDataset(module, datasetLookup, name, folder)
  // folder = folder || unsortedFolder(module)
  if (date) {
    dataset.date = (dataset.date && ! isNaN(dataset.date)) ? Math.max(+new Date(date), dataset.date) : +new Date(date)
  }
  return dataset
}

export const load = module => {
  console.log(module)
  return Promise.all([
    actions.folder.index({ module, limit: 0 }),
    actions.file.index({ module, limit: 0 }),
    actions.task.index({ module }),
  ]).then(res => {
    const [folders, files, tasks] = res

    let datasetLookup = {}
    let folderLookup = {}
    let fileLookup = {}

    let resultsFolder = {}

    // take all of the folders and put them in a lookup
    folderLookup = folders.reduce((folderLookup, folder) => {
      folderLookup[folder.id] = {
        id: folder.id,
        name: folder.name,
        folder,
        files: [],
        datasets: [],
      }
      resultsFolder = resultsFolder || (folder.name === 'results' && folder)
      return folderLookup
    }, {
      unsorted: unsortedFolder(module, true)
    })

    if (! resultsFolder) {
      console.log('creating results folder...')
      actions.folder.create({
        module,
        name: 'results',
        activity: 'results',
      }).then(folder => {
        console.log('created folder', folder)
        folderLookup.results = folder
      })
    }
    else {
      console.log('got results folder', resultsFolder)
    }

    // prepare the files by splitting into two groups
    const generatedFiles = files.filter(file => file.generated)
    const ungeneratedFiles = files.filter(file => !file.generated)

    // build the initial dataset lookup table using the ungenerated files
    ungeneratedFiles.reduce((datasetLookup, file) => {
      fileLookup[file.id] = file
      if (! file.name) {
        if (file.opt && file.opt.media && file.opt.media.token) {
          file.name = file.opt.media.token
        }
        else {          
          file.name = file.url.replace(/^https?:\/\/(www.)?/,'').replace(/[^a-zA-Z0-9_]/g, '_').replace(/_+/g, '_') || 'unknown_' + Math.floor(1000*Math.random())
        }
      }
      const name = (file.name || 'unsorted').split('.')[0]
      const folder = folderLookup[file.folder_id] || unsortedFolder(module)
      const dataset = getDataset(module, datasetLookup, file.dataset || name, folder, file.date || file.created_at)
      if (file.url.match(file.name)) file.persisted = true
      dataset.input.push(file.id)
      folder.files.push(file.id)
      return datasetLookup
    }, datasetLookup)

    // go over the generated files and add addl datasets (if the files were deleted)
    generatedFiles.map(file => {
      fileLookup[file.id] = file
      const pair = file.name.split('.')[0].split('-')
      const folder = folderLookup[file.folder_id] || unsortedFolder(module)
      const dataset = getDataset(module, datasetLookup, file.dataset || pair[0], folder, file.date || file.created_at)
      dataset.output.push(file.id)
      folder.files.push(file.id)
      file.epoch = file.epoch || pair[1]
    })

    return {
      folderLookup,
      fileLookup,
      datasetLookup,
      folders,
      files,
      unsortedFolder: folderLookup.unsorted,
      resultsFolder,
    }
  }).catch(e => {
    console.error(e)
  })
}