ImageGrid/index.py

#=======================================================================

__version__ = '''0.0.01'''
__sub_version__ = '''20111110194845'''
__copyright__ = '''(c) Alex A. Naanou 2011'''


#-----------------------------------------------------------------------

import os
import json
import uuid

from itertools import izip, izip_longest

from pli.logictypes import ANY, OR

from pprint import pprint


#-----------------------------------------------------------------------

CONFIG_NAME = 'test_config.json'

# Load the configuration once, at import time.
# NOTE: the file is opened via a context manager so that the handle is
#       closed right after parsing instead of being left open until
#       the garbage collector gets to it.
# NOTE: CONFIG_NAME is a relative name, so it is resolved against the
#       current working directory of the process.
with open(CONFIG_NAME) as _config_file:
	config = json.load(_config_file)

# Extension matchers, one per supported class of files.
# Each matcher lists the upper- and lower-case spelling of every
# extension explicitly (no leading dot); mixed-case spellings are not
# listed.
# NOTE(review): OR comes from pli.logictypes; judging by how the
#               matchers are used in this file (``ext == type`` in
#               list_files(..)) it presumably compares equal to any one
#               of its arguments -- confirm against the pli sources.

# camera raw formats...
RAW = OR(
	'NEF', 'nef', 
	'CRW', 'crw',
	'CR2', 'cr2',
	'X3F', 'x3f'
)

# JPEG images...
JPEG = OR(
	'JPG', 'jpg', 
	'JPEG', 'jpeg'
)

# Photoshop documents...
PSD = OR(
	'PSD', 'psd'
)

# TIFF images...
TIFF = OR(
	'TIFF', 'tiff', 
	'TIF', 'tif'
)

# XMP files...
XMP = OR(
	'XMP', 'xmp'
)

# any of the above; this is the default filter of list_files(..)
ITEM = OR(RAW, JPEG, PSD, TIFF, XMP)

# normalized type name -> extension matcher.
# This is used by index_by_name(..) to replace an extension with its
# type name and by split_images(..) to tell type fields from the other
# fields of an image group.
TYPES = {
	'raw': RAW,
	'jpeg': JPEG,
	'psd': PSD,
	'tiff': TIFF,
	'xmp': XMP,
}


# The default value of the sub_trees argument of list_files(..), which
# does not use it at this point.
# NOTE(review): presumably maps a sub-directory name to the class of
#               files kept in it -- TODO confirm the intended use.
SUBTREE_CLASSES = {
	'preview': 'preview', 
	'preview (RAW)': 'RAW preview', 
}


#-----------------------------------------------------------------------

##!!! we will need to normalize the paths to one single scheme (either relative or absolute)...
def list_files(root, sub_trees=SUBTREE_CLASSES, type=ITEM):
	'''
	Walk the tree under root and yield each file with a matching extension.

	A file is reported if its extension (without the leading dot) 
	compares equal to type.

	Each item yielded is a (path, name, ext) tuple, where:
		path	- the directory containing the file, split on 
				  os.path.sep into a list of components.
		name	- the file name without the extension.
		ext		- the extension without the leading dot, spelled 
				  exactly as it is on disk.

	NOTE: all the files of one directory share the same path list 
		  object.
	NOTE: sub_trees is accepted but not used at this point.
	'''
	for dir_name, _, file_names in os.walk(root):
		path = dir_name.split(os.path.sep)
		for file_name in file_names:
			name, dotted_ext = os.path.splitext(file_name)
			# drop the leading dot...
			ext = dotted_ext[1:]
			# skip everything that is not of the requested type...
			# NOTE: the extension is kept on the left side of the 
			# 		comparison as type may be a matcher object and 
			# 		not a plain string.
			if not (ext == type):
				continue
			yield path, name, ext


# XXX need to split duplicate named raw files and corresponding
# 	  previews...
# XXX we are losing the real extension here...
def index_by_name(file_list, types=TYPES.items()):
	'''
	Group files by name and then by normalized type.

	file_list is an iterable of (path, name, ext) tuples, in the form 
	yielded by list_files(..).

	types is a list of (type name, extension matcher) pairs.

	format:
		{
			<name>: {
				<type>: [
					(<path>, <ext>),
					...
				],
				...
			},
			...
		}

	NOTE: <type> is the name of the first pair in types found by 
		  looking up (ANY, ext) via list.index(..), this relies on 
		  the way ANY and the matchers compare to plain values.
	NOTE: <ext> is the extension exactly as it was passed in.
	NOTE: an extension that is not found in types will raise a 
		  ValueError.
	'''
	index = {}
	for path, name, orig_ext in file_list:
		# normalize the extension to a type name...
		position = types.index((ANY, orig_ext))
		type_name = types[position][0]
		# create the name and type levels on demand and add the file...
		by_type = index.setdefault(name, {})
		by_type.setdefault(type_name, []).append((path, orig_ext))
	return index


# for this to work correctly it must:
# 	- return unique paths
# 	- none of the returned paths can be a strict subset of any other...
##!!!
def split_common(paths):
	'''
	Cut each path right after its first element that is unique to it.

	paths is a list of paths, each path being a sequence of path 
	elements.

	Paths are compared position by position, an element is considered 
	shared if at least one other path has an equal element at the same 
	position.

	This returns a list of lists, one per input path and in the same 
	order, each containing the leading shared elements of the path 
	capped by the first element that is not shared.

	A path that ends before any difference is found is returned whole 
	(as a copy), e.g.:

		split_common([['a'], ['a', 'b', 'c']])
			-> [['a'], ['a', 'b']]

	NOTE: identical paths are returned as-is, i.e. the result may 
		  contain duplicates.
	NOTE: the paths passed in are not modified.
	'''
	paths = [list(p) for p in paths]
	depth = max(len(p) for p in paths) if paths else 0
	# pass 1: collect the elements found at each position...
	# NOTE: paths that are too short simply do not contribute to a 
	# 		position, so no placeholders can leak into the result...
	columns = [
		[p[k] for p in paths if k < len(p)]
		for k in range(depth)]
	# pass 2: cap each common section with a unique element...
	res = []
	for p in paths:
		# if the path ends before we find a unique element we keep 
		# all of it...
		cut = len(p)
		for k, e in enumerate(p):
			if columns[k].count(e) < 2:
				cut = k + 1
				break
		res.append(p[:cut])
	return res

# in essence this needs to replace the image name with a GID and split up
# images that are identically named into separate GIDs...
def _match_target(path, common):
	'''
	Return the index of the element of common that best matches path.

	An element of common matches if it is a head of path, if more 
	than one element matches the longest one wins.

	This will raise an Exception if nothing matches or if the two 
	longest matches are of the same length.
	'''
	matches = [
		(len(c), i)
		for i, c in enumerate(common)
		# use matching path head to match targets...
		if path[:len(c)] == c]
	if not matches:
		##!!! XXX ungrouped files...
		raise Exception('still got ungrouped files...')
	# longest match wins...
	matches.sort(key=lambda e: e[0], reverse=True)
	if len(matches) > 1 and matches[0][0] == matches[1][0]:
		# XXX we could try and use a different strategy...
		##!!! do a better error...
		raise Exception('got two targets with same score, can\'t decide where to put the file.')
	return matches[0][1]


def split_images(index):
	'''
	This will split groups that contain multiple raw files.

	index is a dict in the format returned by index_by_name(..).

	This is a generator yielding (gid, group) pairs, where gid is a 
	freshly generated uuid4 string and group is a dict containing the 
	'gid', the image 'name' and a list of (path, ext) pairs per file 
	type.

	Groups containing more than one raw file are split to contain one 
	raw each.

	Each file of such a group is put with the raw that has the longest 
	matching sub-path, starting from root (sub-paths are generated by 
	split_common(..) from the raw paths).

	Groups containing one raw file or no raw files at all are yielded 
	as-is, with 'name' and 'gid' added.

	This will raise an Exception for any file that:
		- matches none of the raw sub-paths, i.e. lives in a common 
		  sub-path of two or more raw files.
		- matches two raw sub-paths of the same length.

	NOTE: in the case there are two raw files in one path, then we will 
		  favor the deeper / longer match.
	NOTE: the groups in index are updated in-place.
	'''
	for name, data in index.items():
		# this will not let us lose the name of the image...
		data['name'] = name
		# NOTE: a name may have no raw files at all, e.g. a lone jpeg...
		raw = data.get('raw', [])
		if len(raw) < 2:
			# nothing to split...
			gid = data['gid'] = str(uuid.uuid4())
			yield gid, data
			continue

		# split images via closeness to one of the raw files...
		# XXX the simple way to split files is to remove the
		# 	  common part of the path between two raw files and
		# 	  then split the other files by root of the
		# 	  subtree.
		# 	  this will not work in one case:
		# 	  	- at least two of the raw files are in a deeper
		# 	  	  subtree than the other accompanying files.
		# 	  	  in this case we can not use the topology to
		# 	  	  decide which is which and need either to use
		# 	  	  some other means or to go inside the image...
		common = split_common([path for path, ext in raw])

		# prepare the return structure, one group per raw file...
		# NOTE: the groups are in the same order as common...
		groups = [{
				'gid': str(uuid.uuid4()),
				'name': name,
				'raw': [r],
			} for r in raw]

		# start splitting the data...
		for t, paths in data.items():
			# skip non-type fields and the raw files we already placed...
			if t not in TYPES or t == 'raw':
				continue
			for path, ext in paths:
				group = groups[_match_target(path, common)]
				group.setdefault(t, []).append((path, ext))

		# yield the results...
		for group in groups:
			yield group['gid'], group


#-----------------------------------------------------------------------
if __name__ == '__main__':
	# walk the archive once and reuse the listing for all the stages 
	# below, walking the tree is the slow part...
	lst = list(list_files(config['ARCHIVE_ROOT']))

	# NOTE: print(..) with a single argument outputs the same thing on 
	# 		both Python 2 and 3...
	print(len(lst))

	index = index_by_name(lst)

	print(len(index))

	# NOTE: split_images(..) updates the groups of the index passed to 
	# 		it in-place, so the name count is printed before this 
	# 		point...
	index = list(split_images(index))

	print(len(index))

	# make sure the result is flushed and the file is closed...
	with open(os.path.join('test', 'filelist.json'), 'w') as f:
		json.dump(index, f)


#=======================================================================
#                                            vim:set ts=4 sw=4 nowrap :
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00			`#=======================================================================`

			`__version__ = '''0.0.01'''`
now why is UUID is not serializable to json... JUST HATE IT WHEN PYTHON DOES THINGS LIKE THESE\! Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:50:58 +04:00			`__sub_version__ = '''20111110194845'''`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00			`__copyright__ = '''(c) Alex A. Naanou 2011'''`


			`#-----------------------------------------------------------------------`

			`import os`
			`import json`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`import uuid`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`from itertools import izip, izip_longest`

			`from pli.logictypes import ANY, OR`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00
fixed a bug. and discovered that we effectively lost the actual extension of a file in the indexing process... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:17:38 +04:00			`from pprint import pprint`

started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00
			`#-----------------------------------------------------------------------`

got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`CONFIG_NAME = 'test_config.json'`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00
			`config = json.load(open(CONFIG_NAME))`

got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`RAW = OR(`
			`'NEF', 'nef',`
			`'CRW', 'crw',`
			`'CR2', 'cr2',`
			`'X3F', 'x3f'`
			`)`

			`JPEG = OR(`
			`'JPG', 'jpg',`
			`'JPEG', 'jpeg'`
			`)`

			`PSD = OR(`
			`'PSD', 'psd'`
			`)`

			`TIFF = OR(`
			`'TIFF', 'tiff',`
			`'TIF', 'tif'`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00			`)`

got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`XMP = OR(`
			`'XMP', 'xmp'`
			`)`

			`ITEM = OR(RAW, JPEG, PSD, TIFF, XMP)`

			`TYPES = {`
			`'raw': RAW,`
			`'jpeg': JPEG,`
			`'psd': PSD,`
			`'tiff': TIFF,`
			`'xmp': XMP,`
			`}`


started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00			`SUBTREE_CLASSES = {`
			`'preview': 'preview',`
			`'preview (RAW)': 'RAW preview',`
			`}`


			`#-----------------------------------------------------------------------`

got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`##!!! we will need to normalize the paths to one single scheme (either relative or absolute)...`
			`def list_files(root, sub_trees=SUBTREE_CLASSES, type=ITEM):`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00			`'''`
			`'''`
			`for path, dirs, files in os.walk(root):`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`path = path.split(os.path.sep)`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00			`# process files...`
			`for f in files:`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`name, ext = os.path.splitext(f)`
			`# we need the extension wothout the dot...`
			`ext = ext[1:]`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00			`# filter by ext...`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`if ext == type:`
			`yield path, name, ext`


			`# XXX need to split duplicate named raw files and corresponding`
			`# previews...`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`# XXX we are loosing the real extension here...`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`def index_by_name(file_list, types=TYPES.items()):`
			`'''`
			`format:`
			`{`
			`<name>: {`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`<type>: [`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`<path>,`
			`...`
			`],`
			`...`
			`},`
			`...`
			`}`
			`'''`
			`res = {}`
			`for path, name, ext in file_list:`
			`# normalize extension...`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`orig_ext, ext = ext, types[types.index((ANY, ext))][0]`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`if name not in res:`
			`# create a name...`
			`res[name] = {}`
			`if ext not in res[name]:`
			`# create an extension...`
			`res[name][ext] = []`
			`# general case...`
			`## res[name][ext] += [(path, name, ext)]`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`res[name][ext] += [(path, orig_ext)]`
			`## res[name][ext] += [path]`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`return res`


			`# for this to work correctly it must:`
			`# - return unique paths`
			`# - non of the returnd paths can be a strict subset of any other...`
			`##!!!`
			`def split_common(paths):`
			`'''`
			`'''`
			`# pass 1: build list of common paths (None for all differences)`
			`# NOTE: we may have stray common path elements but we do`
			`# not care abut anything after a None...`
			`index = izip_longest(*paths)`
			`common = []`
			`for s in index:`
			`next = []`
			`for i in s:`
			`if s.count(i) > 1:`
			`next += [i]`
			`else:`
			`next += [None]`
			`common += [next]`
			`# pass 2: cap each common section with a unique element...`
			`common = [ list(e) for e in izip(*common)]`
			`for c, p in izip(common, paths):`
			`if None in c:`
			`i = c.index(None)`
			`if len(p) <= i:`
			`# NOTE: this is the case when we have a None`
			`# because a path just ended... i.e. there`
			`# was no different element to split at...`
			`# XXX do we need to break here?`
			`# XXX one way to go here is to simply ignore`
			`# such paths...`
grouping almost done, still needs cleaningup and revising... (also think of better strategies to resolve and test corner cases) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:02:26 +04:00			`del c[i]`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`continue`
			`# in-place update and truncate the common path...`
			`c[i] = p[i]`
			`del c[i+1:]`
			`return common`

			`# in essance this need to replace image name with a GID and split up`
			`# images that are identically named into seporate GIDs...`
			`def split_images(index):`
			`'''`
added docs and fixed a minor bug... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:47:45 +04:00			`This will split groups that contain multiple raw files.`

			`Groups are split to contain one raw each.`

			`Each image will be grouped to the raw that containse the ragest`
			`matching sub-path, starting from root.`

			`Resulting groups will have a gid as it's key`

			`This will fail for any files that live in a common sub-path of any`
			`two or more raw files.`


			`NOTE: in the case there are two raw files in one path, then we will`
			`favor the deeper / longer mathch.`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`'''`
			`for name, data in index.items():`
			`# this will not let us lose the name of the image...`
			`data['name'] = name`
			`raw = data['raw']`
			`if len(raw) > 1:`
			`# split the images...`
			`# split images via closeness to one of the raw files...`
			`# XXX the simple way to split files is to remove the`
			`# common part of the path between two raw files and`
			`# then split the other files by root of the`
			`# subtree.`
			`# this will not work in one case:`
			`# - at least two of the raw files are in a deeper`
			`# subtree than the other accompanying files.`
			`# in this case wa can not use the topology to`
			`# decide which is wich and need either to use`
			`# some other means or to go inside the image...`
			`#`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`common = split_common([r for r, e in raw])`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00
			`# prepare the return structure...`
			`res = []`
			`for path in raw:`
			`##!!!`
			`res += [{`
now why is UUID is not serializable to json... JUST HATE IT WHEN PYTHON DOES THINGS LIKE THESE\! Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:50:58 +04:00			`'gid': str(uuid.uuid4()),`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`'name': name,`
fixed a bug. and discovered that we effectively lost the actual extension of a file in the indexing process... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:17:38 +04:00			`'raw': [path],`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`}]`
			`# start splitting the data...`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`for t, paths in data.items():`
grouping almost done, still needs cleaningup and revising... (also think of better strategies to resolve and test corner cases) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:02:26 +04:00			`# skip non-type fields...`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`if t not in TYPES:`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`continue`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`if t == 'raw':`
fixed a bug. and discovered that we effectively lost the actual extension of a file in the indexing process... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:17:38 +04:00			`continue`
			`# start the work...`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`for path, ext in paths:`
grouping almost done, still needs cleaningup and revising... (also think of better strategies to resolve and test corner cases) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:02:26 +04:00			`matches = []`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`for i, c in enumerate(common):`
fixed a bug. and discovered that we effectively lost the actual extension of a file in the indexing process... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:17:38 +04:00			`# use matching path head to match targets...`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`if path[:len(c)] == c:`
grouping almost done, still needs cleaningup and revising... (also think of better strategies to resolve and test corner cases) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:02:26 +04:00			`matches += [(len(c), i)]`
			`# multiple matches...`
			`if len(matches) > 1:`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`# longest match wins...`
grouping almost done, still needs cleaningup and revising... (also think of better strategies to resolve and test corner cases) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:02:26 +04:00			`matches.sort(key=lambda e: e[0])`
			`if matches[0][0] == matches[1][0]:`
			`# XXX we could try and use a different`
			`# strategy...`
			`##!!! do a better error...`
			`raise Exception, 'got two targets with same score, can\'t decide where to put the file.'`
			`del matches[1:]`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`if len(matches) == 1:`
grouping almost done, still needs cleaningup and revising... (also think of better strategies to resolve and test corner cases) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:02:26 +04:00			`i = matches[0][1]`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`# we found a location...`
grouping appears to be working correctly. still need more tests and to check for corner cases... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:38:43 +04:00			`if t not in res[i]:`
			`res[i][t] = []`
			`res[i][t] += [(path, ext)]`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`else:`
fixed a bug. and discovered that we effectively lost the actual extension of a file in the indexing process... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:17:38 +04:00			`##!!! XXX ungrouped files...`
grouping almost done, still needs cleaningup and revising... (also think of better strategies to resolve and test corner cases) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:02:26 +04:00			`raise Exception, 'still got ungrouped files...'`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00
			`# yield the results...`
			`for e in res:`
fixed a bug. and discovered that we effectively lost the actual extension of a file in the indexing process... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:17:38 +04:00			`yield e['gid'], e`
got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`else:`
now why is UUID is not serializable to json... JUST HATE IT WHEN PYTHON DOES THINGS LIKE THESE\! Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:50:58 +04:00			`gid = data['gid'] = str(uuid.uuid4())`
added docs and fixed a minor bug... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:47:45 +04:00			`yield gid, data`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00


			`#-----------------------------------------------------------------------`
			`if __name__ == '__main__':`
			`lst = list(list_files(config['ARCHIVE_ROOT']))`

			`print len(lst)`

got the grouping mostly working. corner cases still fail (run index.py to see the ungrouped files) Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 18:43:46 +04:00			`index = index_by_name(list_files(config['ARCHIVE_ROOT']))`

			`print len(index)`

			`index = list(split_images(index_by_name(list_files(config['ARCHIVE_ROOT']))))`

			`print len(index)`
started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00
now why is UUID is not serializable to json... JUST HATE IT WHEN PYTHON DOES THINGS LIKE THESE\! Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-10 19:50:58 +04:00			`json.dump(index, file(os.path.join('test', 'filelist.json'), 'w'))`


started work on indexing... Signed-off-by: Alex A. Naanou <alex.nanou@gmail.com> 2011-11-03 01:11:10 +03:00

			`#=======================================================================`
			`# vim:set ts=4 sw=4 nowrap :`