2014-11-12 05:48:26 +03:00
|
|
|
/**********************************************************************
|
|
|
|
|
*
|
|
|
|
|
*
|
|
|
|
|
*
|
|
|
|
|
**********************************************************************/
|
|
|
|
|
|
2014-12-28 03:47:44 +03:00
|
|
|
var pathlib = require('path')
|
2014-12-16 04:50:34 +03:00
|
|
|
var events = require('events')
|
|
|
|
|
|
|
|
|
|
var fse = require('fs.extra')
|
|
|
|
|
var glob = require('glob')
|
2014-12-31 05:42:28 +03:00
|
|
|
var Promise = require('promise')
|
|
|
|
|
|
|
|
|
|
var guaranteeEvents = require('guarantee-events')
|
2014-11-14 21:57:55 +03:00
|
|
|
|
|
|
|
|
|
2014-11-12 05:48:26 +03:00
|
|
|
define(function(require){ var module = {}
|
|
|
|
|
// Debug trace: printed each time this module's define(..) callback body runs.
console.log('>>> file')
|
|
|
|
|
|
|
|
|
|
//var DEBUG = DEBUG != null ? DEBUG : true
|
|
|
|
|
|
2014-11-14 21:57:55 +03:00
|
|
|
var tasks = require('lib/tasks')
|
2014-11-12 05:48:26 +03:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2014-11-14 21:57:55 +03:00
|
|
|
/*********************************************************************/
|
2014-11-12 05:48:26 +03:00
|
|
|
|
2014-11-14 21:57:55 +03:00
|
|
|
// Name of the index directory.
//
// Used by listIndexes(..) to build the glob pattern and by loadIndex(..)
// to tell if the given path already points at an index.
var INDEX_DIR = '.ImageGrid'
|
2014-11-12 05:48:26 +03:00
|
|
|
|
|
|
|
|
|
2014-12-28 23:49:42 +03:00
|
|
|
|
2014-12-16 04:50:34 +03:00
|
|
|
/*********************************************************************/
|
|
|
|
|
// Queue
|
|
|
|
|
//
|
|
|
|
|
// Task
|
|
|
|
|
//
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2014-11-12 05:48:26 +03:00
|
|
|
/*********************************************************************/
|
2014-12-28 23:49:42 +03:00
|
|
|
// helpers...
|
|
|
|
|
|
|
|
|
|
// Make a glob emitter safe to subscribe to late...
//
// The 'match' and 'end' events of the given glob object are passed
// through guaranteeEvents(..), the intent being that:
//	- an 'end' handler always gets the full result set, no matter when
//	  it was registered,
//	- a 'match' handler gets called for every match found, including
//	  the matches that happened before it was registered.
//
// This way a handler can not miss the event it is waiting for, which is
// similar to how Promise/Deferred treat their callbacks.
//
var guaranteeGlobEvents =
module.guaranteeGlobEvents =
function(glob){
	var GUARANTEED_EVENTS = 'match end'

	return guaranteeEvents(GUARANTEED_EVENTS, glob)
}
|
2014-12-28 20:46:06 +03:00
|
|
|
|
2014-12-28 23:49:42 +03:00
|
|
|
|
|
|
|
|
|
|
|
|
|
/*********************************************************************/
|
|
|
|
|
// Reader...
|
|
|
|
|
|
|
|
|
|
|
2014-12-28 20:46:06 +03:00
|
|
|
// List the index directories (INDEX_DIR) located anywhere below base...
//
// Returns the glob emitter wrapped with guaranteeGlobEvents(..).
//
// XXX should this return a promise instead of an event emitter (???)
// XXX glob on its own has a problem: if a match happens before we get
//		to register a 'match' handler that match (or several) gets
//		missed...
function listIndexes(base){
	var pattern = base +'/**/'+ INDEX_DIR
	var search = glob(pattern)

	return guaranteeGlobEvents(search)
}
|
2014-11-12 05:48:26 +03:00
|
|
|
|
|
|
|
|
|
2014-12-28 20:46:06 +03:00
|
|
|
// List the .json files in path with names matching pattern...
//
// pattern is a glob pattern for the file name without the '.json'
// extension, if it is not given (or is falsy) '*' is used.
//
// Returns the glob emitter wrapped with guaranteeGlobEvents(..).
//
// XXX should this return a promise instead of an event emitter (???)
function listJSON(path, pattern){
	var name = (pattern || '*') +'.json'
	var search = glob(path +'/'+ name)

	return guaranteeGlobEvents(search)
}
|
|
|
|
|
|
|
|
|
|
|
2014-12-31 05:42:28 +03:00
|
|
|
// Promise-returning version of fse.readFile(..), built with
// Promise.denodeify(..).
//
// Used by loadJSON(..) to read the file before parsing it.
var loadFile = Promise.denodeify(fse.readFile)
|
2014-12-28 20:46:06 +03:00
|
|
|
|
|
|
|
|
|
|
|
|
|
// Read the file at path and parse its contents as JSON...
//
// Returns a promise of the parsed data.
//
// NOTE: read and parse errors are not handled here, they are left to
//		the user of the returned promise...
// XXX handle errors...
function loadJSON(path){
	return loadFile(path)
		.then(function(text){
			return JSON.parse(text)
		})
}
|
|
|
|
|
|
|
|
|
|
|
2014-12-29 18:47:27 +03:00
|
|
|
// Load index(s)...
//
//	loadIndex(path)
//		-> promise(data)
//
//	loadIndex(path, logger)
//		-> promise(data)
//
//
// If path points at an index directory (i.e. ends with INDEX_DIR,
// optionally followed by slashes) that index is loaded, otherwise all
// the indexes found in the sub-tree of path are loaded.
//
//
// Procedure:
//	- locate indexes in path given
//	- per each index
//		- get all .json files
//		- get and load latest base file per keyword
//		- merge all later than loaded base diff files per keyword
//
//
// Index format (input):
//	.ImageGrid/
//		+- [<timestamp>-]<keyword>[-diff].json
//		+- ...
//
//
// Output format:
//	{
//		// one per index found...
//		<path>/<sub-path>: {
//			<keyword>: <kw-data>,
//			...
//		},
//		...
//	}
//
//
// Events emitted on logger if passed:
//	- queued <path>			- json file path queued for loading
//	- loaded <path>			- done loading json file path
//	- index <path> <data>	- done loading index at path
//	- error <err>			- an error occurred...
//
//
// Errors:
//	- a listing (glob) error or a base file that fails to load rejects
//	  the returned promise,
//	- a diff that fails to load is reported via logger and skipped,
//	- when loading a sub-tree, an index that fails to load is left out
//	  of the result, its error is reported via logger by the nested
//	  loadIndex(..) call.
//
//
// NOTE: this is fairly generic and does not care about the type of data
//		or its format as long as it's JSON and the file names comply
//		with the scheme above...
// NOTE: the returned promise is resolved only after all the files of all
//		the indexes involved are loaded and merged.
//
// XXX add support for sharding...
// XXX test with:
//		requirejs(['file'],
//			function(m){
//				f = m.loadIndex("L:/mnt/hdd15 (photo)/NTFS1/media/img/others") })
//			.done(function(d){ console.log(d) })
// XXX should a failed diff abort loading its index (???)


// Group index file paths into per-keyword load chains...
//
//	groupIndexFiles(files[, logger])
//		-> { <keyword>: [<path>, ..], .. }
//
// Each chain is ordered newest first and ends with the file used as
// base, i.e. the latest non-diff file or, if there is none, the oldest
// diff. Files older than the base are not included.
//
// A 'queued' event is emitted on logger for each path put in a chain.
//
// NOTE: files is not modified...
function groupIndexFiles(files, logger){
	// NOTE: keywords come from file names, so keep the maps clear of
	//		Object.prototype members...
	var chains = Object.create(null)
	var root = Object.create(null)

	var queue = function(keyword, is_diff, path){
		var chain = chains[keyword]

		// new keyword...
		if(chain == null){
			chain = chains[keyword] = []

		// do not add anything past the latest non-diff for each keyword...
		} else if(!chain[chain.length-1].diff){
			return
		}

		chain.push({diff: is_diff, path: path})
		logger && logger.emit('queued', path)
	}

	// group by keyword, newest first...
	files
		.slice()
		.sort()
		.reverse()
		.forEach(function(path){
			var name = pathlib.basename(path)
			var parts = name.split(/[-.]/g).slice(0, -1)

			// <keyword>.json / non-diff
			// NOTE: this is a special case, we keep these in a separate
			//		index and add them to the chains below if needed...
			if(parts.length == 1){
				root[parts[0]] = path

			// <timestamp>-<keyword>[-diff].json / diff / non-diff
			} else {
				queue(parts[1], parts[2] == 'diff', path)
			}
		})

	// add the un-timestamped base files where no later base was found...
	Object.keys(root)
		.forEach(function(keyword){
			queue(keyword, false, root[keyword])
		})

	var res = Object.create(null)
	Object.keys(chains)
		.forEach(function(keyword){
			res[keyword] = chains[keyword]
				.map(function(e){ return e.path })
		})
	return res
}


// Load and merge the files of a single keyword...
//
//	loadKeyword(chain[, logger])
//		-> promise(data)
//
// chain is a list of paths as built by groupIndexFiles(..).
//
// The files are read in parallel but merged only after all of them are
// read, base first and then the diffs oldest to newest, so the result
// does not depend on the order in which the reads complete.
//
// A 'loaded' event is emitted on logger for each merged file, a diff
// that fails to load is reported with an 'error' event and skipped, a
// base that fails to load rejects the returned promise.
function loadKeyword(chain, logger){
	// marks a diff that failed to load...
	var FAILED = {}
	// base first, then diffs oldest to newest...
	var paths = chain.slice().reverse()

	return Promise
		.all(paths.map(function(path, i){
			var loading = loadJSON(path)

			return i == 0 ?
				loading
				: loading.catch(function(err){
					logger && logger.emit('error', err)
					return FAILED
				})
		}))
		.then(function(loaded){
			var data = loaded[0]

			loaded.slice(1)
				.forEach(function(json, i){
					if(json === FAILED){
						return
					}

					// merge...
					for(var k in json){
						data[k] = json[k]
					}

					logger && logger.emit('loaded', paths[i+1])
				})

			logger && logger.emit('loaded', paths[0])

			return data
		})
}


var loadIndex =
module.loadIndex =
function(path, logger){
	var p = path.split(INDEX_DIR)
	var last = p.slice(-1)[0].trim()

	return new Promise(function(resolve, reject){
		// settle the promise first so that it can not be left pending if
		// the logger throws (e.g. no 'error' handlers set)...
		var fail = function(err){
			reject(err)
			logger && logger.emit('error', err)
		}

		// we've got an index...
		if(p.length > 1 && /^\/*$/.test(last)){
			listJSON(path)
				.on('error', fail)
				.on('end', function(files){
					var index = groupIndexFiles(files, logger)
					var keywords = Object.keys(index)

					// load...
					Promise
						.all(keywords.map(function(keyword){
							return loadKeyword(index[keyword], logger)
						}))
						.then(function(loaded){
							var res = {}
							keywords.forEach(function(keyword, i){
								res[keyword] = loaded[i]
							})

							logger && logger.emit('index', path, res)

							var d = {}
							d[path] = res

							resolve(d)
						})
						.catch(fail)
				})

		// no explicit index given -- find all in sub tree...
		} else {
			var res = {}
			var pending = {}

			// start loading an index as soon as it is found but never
			// more than once...
			var loadOnce = function(index_path){
				if(pending[index_path] == null){
					pending[index_path] = loadIndex(index_path, logger)
						.then(
							function(obj){
								res[index_path] = obj[index_path]
							},
							// the nested call has already reported the
							// error via logger, leave the index out...
							function(){})
				}
				return pending[index_path]
			}

			listIndexes(path)
				.on('error', fail)
				// collect the found indexes...
				.on('match', loadOnce)
				// done searching, wait for the indexes to load...
				.on('end', function(paths){
					paths.forEach(function(index_path){
						loadOnce(index_path)
					})

					Promise
						.all(Object.keys(pending).map(function(index_path){
							return pending[index_path]
						}))
						.then(function(){
							resolve(res)
						})
						.catch(fail)
				})
		}
	})
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2014-12-28 23:49:42 +03:00
|
|
|
/*********************************************************************/
|
|
|
|
|
// Writer...
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2014-12-16 04:50:34 +03:00
|
|
|
|
2014-11-12 05:48:26 +03:00
|
|
|
/**********************************************************************
|
|
|
|
|
* vim:set ts=4 sw=4 : */
|
|
|
|
|
return module })
|