# xmpgen.py

#!/bin/env python
#=======================================================================

# module metadata...
# NOTE: __version__ is what --version reports (see load_commandline).
__version__ = '''0.1.09'''
# NOTE(review): looks like a YYYYMMDDhhmmss build timestamp -- confirm.
__sub_version__ = '''20120908235504'''
__copyright__ = '''(c) Alex A. Naanou 2011'''


#-----------------------------------------------------------------------

import shutil, sys, os, os.path
from itertools import chain, imap, islice
import json

from pli.functional import curry
from pli.logictypes import OR

# compatibility with Python 2.5
if sys.version_info < (2, 6):
	from xmpgen_legacy import izip_longest
else:
	from itertools import izip_longest


metadata = None
# NOTE: I prefer freedom as in free, to freedom as in forced
# 		to be free...
# XXX add plugin metadata writers...
# 		an example using command-line exiv2:
# 			exiv2 -M "set Xmp.xmp.Rating 2" DSC_0055.XMP
try:
	# this is optional...
	import pyexiv2 as metadata
except ImportError:
	pass


#-----------------------------------------------------------------------
#
#
#-----------------------------------------------------------------------
# helpers...
#----------------------------------------------------------------join---
def join(*p, **n):
	'''
	join path components, ignoring the "path" keyword argument.

	this has the same call signature as getfilepath(...) as used by
	generate(...), so it can be passed as a getpath callback; the path
	hint is dropped and the rest is handed to os.path.join(...).
	'''
	if 'path' in n:
		del n['path']
	return os.path.join(*p, **n)
	

#--------------------------------------------------------------locate---
def locate(name, locations=(), default=None):
	'''
	locate an entity in locations and if none are available use a default.

	name is a file name, locations is an ordered sequence of directories
	to try; the contents of the first readable match are returned.
	if no location contains a readable file, default is returned.

	NOTE: this will read the contents of the file.
	NOTE: a leading "~" in a location is expanded to the user's home
	      directory, open(...) will not do this for us.
	'''
	for l in locations:
		target = os.path.join(os.path.expanduser(l), name)
		try:
			# NOTE: the handle is closed explicitly, we do not rely on
			# 		the garbage collector to do this...
			with open(target, 'r') as f:
				return f.read()
		except IOError:
			# missing or unreadable here, try the next location...
			continue
	return default


#-----------------------------------------------------------------------
# config data and defaults...
# locations searched for CONFIG_NAME and XMP_TEMPLATE_NAME, after ROOT_DIR
# (see: load_config_file(...))...
HOME_CFG = '~'
LOCAL_CFG = '.'

# names of the optional user-supplied template and config files...
XMP_TEMPLATE_NAME = 'TEMPLATE.XMP'
CONFIG_NAME = '.xmpgen'

# backup file extensions, the plain one is tried first, then the
# numbered template (see: get_backup_name(...))...
BACKUP_EXT_TPL = '.bak%03d'
BACKUP_EXT = '.bak'

# default configuration, these values are overridden by the config
# file and then by the command line (see: run(...))...
DEFAULT_CFG = {
	# root of the directory tree we are working at...
	'ROOT_DIR': '.',
	# name of the directory containing previews...
	'INPUT_DIR': 'preview (RAW)',
	# NOTE: we do not need a default output dir as it will default to
	# 		ROOT_DIR...
	#'OUTPUT_DIR': None,
	# name of the directory used to traverse to the next level...
	'TRAVERSE_DIR': 'fav',

	'RAW_EXTENSION': '.NEF',
	# percentage, divided by 100 in rate(...)...
	'THRESHOLD': 5,
	# ratings in the order they are handed out by rate(...)...
	'RATINGS': [
		# basic ratings...
		5, 4, 3, 2, 1,
	],
	# NOTE: these are placed before RATINGS if USE_LABELS is set
	# 		(see: run(...))...
	'LABELS': [
		# default labels...
		# yellow
		'Second',
		# blue
		'Review',
	],
	# NOTE: this is only used as the default for the label_cfg argument
	# 		of rcollect(...) and collect(...)...
	'LABEL_CFG': '.label',

	# NOTE: this is %-formatted with the "rating" and "label" keys
	# 		(see: generate(...))...
	'XMP_TEMPLATE': '''\
<x:xmpmeta xmlns:x="adobe:ns:meta/">
	<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#">
		<rdf:Description rdf:about="" xmlns:xap="http://ns.adobe.com/xap/1.0/">
			<xap:CreatorTool>XMPGen</xap:CreatorTool>
			<xap:Rating>%(rating)s</xap:Rating>
			<xap:Label>%(label)s</xap:Label>
		</rdf:Description>
	</rdf:RDF>
</x:xmpmeta>''',

	'RATE_TOP_LEVEL': False,
	'SEARCH_INPUT': True,
	'SEARCH_OUTPUT': True,
	# -1 is mute, 0 is quiet, 1 is the default and 2 is verbose
	# (see the -m, -q and -v options in load_commandline(...))...
	'VERBOSITY': 1,
	'USE_LABELS': False,
	# directory names skipped when searching for RAW files...
	'SKIP': ['preview (RAW)',],

	# for available options see: HANDLE_OVERFLOW_OPTIONS
	'OVERFLOW_STRATEGY': 'merge-bottom',
	# for available options see: HANDLE_EXISTING_XMP_OPTIONS
	'HANDLE_EXISTING_XMP': 'rewrite',
	'SKIP_UNKNOWN_DESTINATIONS': False,
	'CONFIG_SAVE_LOCAL': False,
	# preview file extensions, given without the leading dot...
	'INPUT_EXT': ['jpg', 'JPG']
}

# accepted values for --overflow-strategy (validated in
# load_commandline(...)), the commented out entries are not enabled...
HANDLE_OVERFLOW_OPTIONS = [
	'abort',
##	'skip-top',
	'skip-bottom',
##	'merge-top',
	'merge-bottom',
##	'increase-threshold',
##	'growing-threshold',
##	'use-labels',
]

# accepted values for --handle-existing-xmp (validated in
# load_commandline(...) and dispatched in handle_existing_xmp(...))...
HANDLE_EXISTING_XMP_OPTIONS = [
	'abort',
	'skip',
	# NOTE: this will fail on RO files... ##!!! is this correct?
	'rewrite',
]

# NOTE: these depend on an optional .xmp editor...
# NOTE: if the editor is available 'update' also becomes the default
# 		strategy...
if metadata is not None:
	HANDLE_EXISTING_XMP_OPTIONS += [
		'update',
		'highest',
		'lowest',
	]
	DEFAULT_CFG['HANDLE_EXISTING_XMP'] = 'update'


#-----------------------------------------------------------------------
#----------------------------------------------------load_commandline---
def load_commandline(config, default_cfg=DEFAULT_CFG):
	'''
	load configuration data from command-line arguments.

	config is the base configuration, its values are used as defaults
	for the command-line options. default_cfg is only used to print the
	defaults for --config-defaults-print.

	returns a (config, options) pair, where config is an updated copy
	of the input (the input is not modified) and options is the parsed
	optparse options object.

	raises ValueError if --overflow-strategy or --handle-existing-xmp
	get an unsupported value, and SystemExit after printing if any of
	the --config-*-print flags is set.

	NOTE: the arguments are read from sys.argv by optparse.
	NOTE: --config-save-local writes ROOT/CONFIG_NAME as a side-effect.
	NOTE: --clear-labels drops the labels that came from config, only
	      the labels given explicitly via --label are kept.
	'''
	from optparse import OptionParser, OptionGroup

	parser = OptionParser(
			usage='Usage: %prog [options]',
			version='%prog ' + __version__,
			epilog='NOTEs: xmpgen will overwrite existing .XMP files (will be fixed soon). '
			'xmpgen will search for both INPUT and OUTPUT so explicit declaration is needed '
			'only in non-standard cases and for fine control.')
	parser.add_option('--root',
			default=config['ROOT_DIR'],
			help='root of the directory tree we will be working at (default: "%default").',
			metavar='PATH')
	parser.add_option('--input',
			default=config['INPUT_DIR'],
			help='name of directory containing previews (default: "%default").\n'
			'NOTE: this directory tree can not be used for output.',
			metavar='DIR_NAME')
	parser.add_option('--output',
			help='name of directory to store .XMP files. if --no-search '
			'is not set this is where we search for relevant files (default: ROOT).',
			metavar='DIR_NAME')
	# verbosity level...
	# NOTE: all three flags share one destination, the last one given
	# 		on the command line wins...
	parser.add_option('-v', '--verbose',
			dest='verbosity',
			action='store_const',
			const=2,
			default=config['VERBOSITY'],
			help='increase output verbosity.')
	parser.add_option('-q', '--quiet',
			dest='verbosity',
			action='store_const',
			const=0,
			default=config['VERBOSITY'],
			help='decrease output verbosity.')
	parser.add_option('-m', '--mute',
			dest='verbosity',
			action='store_const',
			const=-1,
			default=config['VERBOSITY'],
			help='mute output.')

	ratings_n_labels = OptionGroup(parser, 'Ratings & Labels')
	ratings_n_labels.add_option('--use-labels',
			action='store_true',
			default=config['USE_LABELS'],
			help='if set, use both labels and ratings.')
	ratings_n_labels.add_option('--clear-labels',
			action='store_true',
			default=False,
			help='clear list of labels, shorthand to removing all '
			'the labels one by one.')
	# NOTE: optparse appends to the default list, so we pass a copy to
	# 		keep the original config intact...
	ratings_n_labels.add_option('--label',
			action='append',
			default=config['LABELS'][:],
			help='add label to list of labels (default: %default). '
			'NOTE: the order in which labels are added is '
			'significant - first is higher priority last lower.',
			metavar='LABEL')
	ratings_n_labels.add_option('--remove-label',
			action='append',
			default=[],
			help='remove label from list of labels (default: %default).',
			metavar='LABEL')
	ratings_n_labels.add_option('--rate-top-level',
			action='store_true',
			default=config['RATE_TOP_LEVEL'],
			help='if set, also rate top level previews.')
	ratings_n_labels.add_option('--group-threshold',
			default=config['THRESHOLD'],
			help='percentage of elements unique to a level below which '
			'the level will be merged with the next one (default: "%default").',
			metavar='THRESHOLD')
	ratings_n_labels.add_option('--overflow-strategy',
			default=config['OVERFLOW_STRATEGY'],
			help='the way to handle tree depth greater than the number '
			'of given ratings (default: %default). '
			'available options are: ' + str(tuple(HANDLE_OVERFLOW_OPTIONS)),
			metavar='STRATEGY')
	parser.add_option_group(ratings_n_labels)

	advanced = OptionGroup(parser, 'Advanced options')
	advanced.add_option('--no-search-input',
			dest='search_input',
			action='store_false',
			default=config['SEARCH_INPUT'],
			help='if set, this will disable searching for input directories, '
			'otherwise ROOT/INPUT will be used directly.\n'
			'NOTE: this will find all matching INPUT directories, '
			'including nested ones.')
	advanced.add_option('--no-search-output',
			dest='search_output',
			action='store_false',
			default=config['SEARCH_OUTPUT'],
			help='if set, this will disable searching for RAW files, '
			'and XMPs will be stored directly in the OUTPUT directory.')
	advanced.add_option('-s', '--skip',
			action='append',
			default=config['SKIP'][:],
			help='list of directories to skip from searching for RAW '
			'files (default: %default)',
			metavar='DIR_NAME')
	advanced.add_option('--traverse-dir-name',
			default=config['TRAVERSE_DIR'],
			help='directory used to traverse to next level (default: "%default").',
			metavar='DIR_NAME')
	##!!! do we need a clear/remove here??
	advanced.add_option('--input-ext',
			action='append',
			default=config['INPUT_EXT'][:],
			help='add extension to list of ext\'s to be searched (default: %default).',
			metavar='INPUT_EXT')
	##!!! add '.' if not present...
	advanced.add_option('--raw-extension',
			default=config['RAW_EXTENSION'],
			help='use as the extension for RAW files (default: "%default").',
			metavar='EXTENSION')
	advanced.add_option('--xmp-template',
			help='use XMP_TEMPLATE instead of the internal template.',
			metavar='PATH')
	advanced.add_option('--handle-existing-xmp',
			default=config['HANDLE_EXISTING_XMP'],
			help='the way to handle existing xmp files (default: %default). '
			'available options are: ' + str(tuple(HANDLE_EXISTING_XMP_OPTIONS)),
			metavar='STRATEGY')
	##!!! need to resolve this situation - not every one is shooting RAW...
	advanced.add_option('--skip-unknown-destinations',
			action='store_true',
			default=config['SKIP_UNKNOWN_DESTINATIONS'],
			help='if set, skip generating .XMP files for targets that '
			'can not be located. this can happen for example when '
			'rating a file that was shot in JPEG or was processed in cammera.')
	parser.add_option_group(advanced)

	runtime = OptionGroup(parser, 'Runtime options')
	runtime.add_option('--dry-run',
			action='store_true',
			default=False,
			help='run but do not create any files.')
	parser.add_option_group(runtime)

	configuration = OptionGroup(parser, 'Configuration options')
	configuration.add_option('--config-print',
			action='store_true',
			default=False,
			help='print current configuration and exit.')
	configuration.add_option('--config-defaults-print',
			action='store_true',
			default=False,
			help='print default configuration and exit.')
	configuration.add_option('--config-save-local',
			action='store_true',
			default=False,
			help='save current configuration at the root location. '
			'this is a shorthand for: '
			'xmpgen ... --config-print > ROOT/.xmpgen; xmpgen ...')
	parser.add_option_group(configuration)

	options, args = parser.parse_args()

	# resolve the label list...
	labels = options.label
	if options.clear_labels:
		# the configured labels are always at the head of the list
		# (they are the default that --label appends to), so dropping
		# that many items leaves only the explicitly given labels...
		labels = labels[len(config['LABELS']):]
	labels = [ l for l in labels if l not in options.remove_label ]

	# load the template...
	if options.xmp_template:
		with open(options.xmp_template, 'r') as f:
			xmp_template = f.read()
	else:
		xmp_template = config['XMP_TEMPLATE']

	# be polite and save the original config data...
	config = config.copy()

	# prune and write the data...
	config.update({
			'ROOT_DIR': options.root,
			'INPUT_DIR': options.input,
			'OUTPUT_DIR': options.output if options.output else options.root,
			'TRAVERSE_DIR': options.traverse_dir_name,
			'RAW_EXTENSION': options.raw_extension,
			'THRESHOLD': options.group_threshold,
			'LABELS': labels,
			'XMP_TEMPLATE': xmp_template,
			'RATE_TOP_LEVEL': options.rate_top_level,
			'SEARCH_INPUT': options.search_input,
			'SEARCH_OUTPUT': options.search_output,
			'VERBOSITY': options.verbosity,
			'USE_LABELS': options.use_labels,
			# NOTE: the input directory is always skipped...
			'SKIP': list(set(options.skip + [options.input])),
			'SKIP_UNKNOWN_DESTINATIONS': options.skip_unknown_destinations,
			'CONFIG_SAVE_LOCAL': options.config_save_local,
			'INPUT_EXT': options.input_ext,
			})

	if options.overflow_strategy not in HANDLE_OVERFLOW_OPTIONS:
		raise ValueError('OVERFLOW_STRATEGY value %s unsupported '
				'(use --help flag for list of options).' % options.overflow_strategy)
	config['OVERFLOW_STRATEGY'] = options.overflow_strategy

	if options.handle_existing_xmp not in HANDLE_EXISTING_XMP_OPTIONS:
		raise ValueError('HANDLE_EXISTING_XMP value %s unsupported '
				'(use --help flag for list of options).' % options.handle_existing_xmp)
	config['HANDLE_EXISTING_XMP'] = options.handle_existing_xmp

	# configuration stuff...
	# write a local configuration...
	if options.config_save_local:
		with open(os.path.join(config['ROOT_DIR'], CONFIG_NAME), 'w') as f:
			f.write(json.dumps(config, sort_keys=True, indent=4))

	# print configuration data...
	if options.config_defaults_print or options.config_print:
		# the titles are only needed to tell the two dumps apart...
		print_prefix = bool(options.config_defaults_print and options.config_print)
		if options.config_print:
			if print_prefix:
				print('Current Configuration:')
			print(json.dumps(config, sort_keys=True, indent=4))
			print('')
		if options.config_defaults_print:
			if print_prefix:
				print('Default Configuration:')
			print(json.dumps(default_cfg, sort_keys=True, indent=4))
			print('')
		raise SystemExit

	return config, options


#----------------------------------------------------load_config_file---
# TODO search for config within the root topology (???)
def load_config_file(config, default_cfg=DEFAULT_CFG):
	'''
	load configuration data from config file

	config is only used to find the root directory to search (its
	ROOT_DIR value, '.' if missing). the result is a copy of default_cfg
	updated with the contents of the first CONFIG_NAME file found in
	ROOT_DIR, LOCAL_CFG or HOME_CFG (in that order).

	the XMP template is replaced with the contents of the first
	XMP_TEMPLATE_NAME file found in the same kind of locations, if any.

	NOTE: an empty config file is the same as no config file.
	NOTE: a config file that is not valid JSON will still raise a
	      ValueError from json.loads(...).
	'''
	raw = locate(
			CONFIG_NAME,
			(config.get('ROOT_DIR', '.'), LOCAL_CFG, HOME_CFG),
			default='{}')
	# json.loads(...) does not like empty input, so we treat an empty
	# file as an empty configuration...
	if not raw.strip():
		raw = '{}'
	user_config = json.loads(raw)

	config = default_cfg.copy()
	config.update(user_config)

	# NOTE: here ROOT_DIR may already be the one set in the config file...
	config['XMP_TEMPLATE'] = locate(
			XMP_TEMPLATE_NAME,
			(config.get('ROOT_DIR', '.'), LOCAL_CFG, HOME_CFG),
			default=config['XMP_TEMPLATE'])
	return config


#-----------------------------------------------------------------------
#------------------------------------------------------------rcollect---
# XXX make this read/locate .label files at the bottom of the tree...
def rcollect(root, next_dir=DEFAULT_CFG['TRAVERSE_DIR'],
		collect_base=True, ext=OR(*DEFAULT_CFG['INPUT_EXT']), 
		label_cfg=DEFAULT_CFG['LABEL_CFG']):
	'''
	generator to collect all the files in the topology, top down.

	yield:
		# one list per level, containing a (root, name) pair for each
		# file with a matching extension. name is the file name
		# without its extension.
		[...]

	NOTE: the pairs contain the root passed in and not the directory
	      the file was found in, this makes the same file name on
	      different levels compare equal.
	NOTE: if collect_base is false the first directory visited is not
	      collected.
	NOTE: levels with no matching files are not yielded.
	NOTE: label_cfg is not used yet.
	'''
	for _, subdirs, names in os.walk(root):
		if not collect_base:
			# skip this directory only, collect the rest...
			collect_base = True
		else:
			level = []
			for fname in names:
				parts = fname.split('.')
				if parts[-1] == ext:
					level.append((root, '.'.join(parts[:-1])))
			# skip empty levels...
			# NOTE(review): this also skips the pruning below, so all
			# 		the sub-directories of an empty level get walked,
			# 		confirm this is intended.
			if len(level) == 0:
				continue
			yield level
		# only descend into the traverse directory, if it exists...
		subdirs[:] = [next_dir] if next_dir in subdirs else []

#-------------------------------------------------------------collect---
def collect(root, next_dir=DEFAULT_CFG['TRAVERSE_DIR'], 
		collect_base=True, ext=OR(*DEFAULT_CFG['INPUT_EXT']),
		label_cfg=DEFAULT_CFG['LABEL_CFG']):
	'''
	same as rcollect(...), but the levels come deepest first.

	yield:
		same as rcollect(...) but in reverse order...

	NOTE: the whole tree is collected before the first level is yielded.
	NOTE: label_cfg is not passed on to rcollect(...).
	'''
	##!!! STUB
	levels = list(rcollect(root, next_dir, collect_base, ext))
	levels.reverse()
	for level in levels:
		yield level


#---------------------------------------------------------------index---
##!!! this does not split items that are the same but with different extensions...
def index(collection):
	'''
	generator to index the collection.

	for each non-empty level this yields the items that were not in the
	previous non-empty level, along with the size of the level itself.

	NOTE: duplicate items within a level will be merged.
	NOTE: empty levels are skipped and are not used for diffing.

	yield:
		{
			# set of the items of the level that are not in the
			# previous level...
			'items': set([...]),
			# original number of elements in the level...
			'total count': N,
		}
	'''
	previous = None
	for level in collection:
		unique = set(level)
		if len(level) == 0:
			continue
		if previous is not None:
			unique -= set(previous)
		previous = level
		yield {
			'items': unique,
			'total count': len(level),
		}


#----------------------------------------------------------------rate---
def rate(index, ratings=DEFAULT_CFG['RATINGS'], 
		threshold=DEFAULT_CFG['THRESHOLD'], 
		overflow_strategy=DEFAULT_CFG['OVERFLOW_STRATEGY']):
	'''
	generator to rate the indexed elements.

	this also combines similar levels.

	index is an iterable of levels as yielded by index(...), ratings is
	the ordered list of ratings to hand out, threshold is a percentage
	and overflow_strategy is one of HANDLE_OVERFLOW_OPTIONS.

	NOTE: if the count of non-intersecting elements relative to the total 
	      number of elements is below the threshold, the level will be 
	      merged with the next. such levels are called "similar".
	NOTE: when we run out of ratings 'skip-*' will drop the rest of
	      the levels, anything else will merge them into the last
	      rating.
	NOTE: levels left over at the end are given the last rating.

	yield:
		(
			# rating...
			N,
			# list of levels, each same as returned by index(...)...
			(...)
		)

	raises NotImplementedError for "*-top" strategies and ValueError
	for 'abort' when there are more distinct levels than ratings.

	NOTE: the ValueError is raised after everything is yielded.
	'''
	threshold = float(threshold)/100

	if overflow_strategy.endswith('-top'):
		##!!! reversing the ratings and the index here will break the
		##!!! threshold mechanics...
		raise NotImplementedError('"*-top" strategies not yet implemented.')

	i = 0
	buf = ()
	# set when a distinct level takes the last rating...
	last_taken = False
	# set when one more distinct level shows up after that...
	overflow = False
	for level in index:
		buf += (level,)
		# skip empty levels or levels that do not pass the threshold...
		if level['total count'] <= 0 or float(len(level['items']))/level['total count'] <= threshold:
			continue
		# merge levels when we run out of ratings ('merge-bottom' or
		# 'merge-top')...
		if len(ratings) == i+1:
			if overflow_strategy.startswith('skip-'):
				yield ratings[i], buf
				return
			# NOTE: the first level here is not an overflow, it just
			# 		uses up the last rating...
			if last_taken:
				overflow = True
			last_taken = True
			continue
		yield ratings[i], buf
		buf = ()
		i += 1
	# the buffer is not yet empty, so we need to flush the results...
	if buf != ():
		yield ratings[-1], buf
		# XXX might be good not to write anything in this situation...
		if overflow and overflow_strategy == 'abort':
			raise ValueError('number of levels is greater than the number '
					'of ratings, use more labels or a different strategy.')


#-----------------------------------------------------------------------
#--------------------------------------------------------action_dummy---
def action_dummy(path, rating, label, data, config):
	'''
	placeholder action, ignores its arguments and lets the chain go on.

	NOTE: generate(...) skips this action without calling it.
	'''
	result = True
	return result


#----------------------------------------------------------filewriter---
##!!! check if file already exists...
def action_filewriter(path, rating, label, data, config):
	'''
	action to write a file.

	if path does not exist, data is written to it. if it does, the
	decision is delegated to handle_existing_xmp(...).

	returns True if the file was written or updated and False if it
	was left alone (this stops the rest of the actions for the file).

	NOTE: if the handler reports success but the file is no longer at
	      path (it was moved to a backup), data is written to path.
	      if the file is still there it was updated in place and we do
	      not touch it.
	'''
	if os.path.isfile(path):
		if not handle_existing_xmp(path, rating, label, data, config):
			return False
		if os.path.isfile(path):
			# updated in place, nothing more to do...
			return True
	# NOTE: the handle is closed explicitly so the data is on disk
	# 		when we return...
	with open(path, 'w') as f:
		f.write(data)
	return True


#-------------------------------------------------------action_logger---
def action_logger(path, rating, label, data, config):
	'''
	action to log the current processed file.

	at verbosity 1 this prints a dot per file, at verbosity 2 a line
	with the path, rating and label, otherwise nothing.

	always returns True so the rest of the actions are executed.

	NOTE: the dots are flushed right away so they show up as progress
	      and not all at once when the line is finished.
	'''
	verbosity = config['VERBOSITY']
	if verbosity == 1:
		sys.stdout.write('. ')
		sys.stdout.flush()
	elif verbosity == 2:
		print('%s (%s, %s)' % (path, rating, label))
	return True


#--------------------------------------------------------action_break---
def action_break(path, rating, label, data, config):
	'''
	action that stops the chain, no action after it is executed for
	the current file.
	'''
	result = False
	return result


def get_backup_name(path):
	'''
	return the first free backup file name for path.

	path + BACKUP_EXT is tried first, then path + BACKUP_EXT_TPL with
	a counter starting from 1, until a name is found that is not an
	existing file.

	NOTE: this does not create the file.
	'''
	candidate = path + BACKUP_EXT
	n = 0
	while os.path.isfile(candidate):
		n += 1
		candidate = path + (BACKUP_EXT_TPL % n)
	return candidate

#-------------------------------------------------handle_existing_xmp---
##!!! do we just create a file with a .bak extension or move to a backup dir...
def handle_existing_xmp(path, rating, label, data, config):
	'''
	handle the situations when the .XMP file already exists...

	the strategy is taken from config['HANDLE_EXISTING_XMP']:
		'abort'		- raise ValueError.
		'skip'		- leave the file alone.
		'rewrite'	- if the contents differ from data, move the file
					  to a backup so that a new one can be written.
		'update'	- backup, then set rating and label in place.
		'highest'	- same as 'update' but keep the higher rating.
		'lowest'	- same as 'update' but keep the lower rating.

	the last three are only available if the metadata module is.

	returns True if the caller should go on with the file and False if
	there is nothing more to do with it.

	raises ValueError for 'abort' and TypeError for an unknown (or
	unavailable) strategy.

	NOTE: an empty label never overwrites an existing one.
	'''
	action = config['HANDLE_EXISTING_XMP']
	if action == 'abort':
		raise ValueError('file "%s" already exists.' % path)
	if action == 'skip':
		return False
	# XXX backup needs more testing...
	if action == 'rewrite':
		# NOTE: this will fail for RO files...
		# check if we need to backup...
		# NOTE: the file is closed before we try to move it...
		with open(path) as f:
			unchanged = f.read() == data
		if unchanged:
			# we need to do nothing...
			return False
		# do a backup...
		shutil.move(path, get_backup_name(path))
		# now we can continue...
		return True
	# these will update the xmp...
	##!!! need testing...
	if metadata is not None and action in ('update', 'highest', 'lowest'):
		# do a backup...
		shutil.copy2(path, get_backup_name(path))
		# load metadata...
		im = metadata.ImageMetadata(path)
		im.read()
		if action != 'update':
			# NOTE(review): we assume a missing tag raises KeyError,
			# 		confirm against the metadata library. in this case
			# 		there is nothing to compare to and the new rating
			# 		is used.
			try:
				existing = im['Xmp.xmp.Rating'].value
			except KeyError:
				existing = None
			if existing is not None:
				pick = max if action == 'highest' else min
				rating = pick(existing, rating)
		im['Xmp.xmp.Rating'] = rating
		##!!! can't order-compare labels...
		if label != '':
			im['Xmp.xmp.Label'] = label
		##!!! do we need to check for RO flag here???
		im.write()
		return True
	raise TypeError('unknown handling strategy: "%s"' % action)


#------------------------------------------------------------generate---
def generate(ratings, root, getpath=join, 
		actions=(action_filewriter,), template=DEFAULT_CFG['XMP_TEMPLATE'],
		skip_not_found=DEFAULT_CFG['SKIP_UNKNOWN_DESTINATIONS'], config=DEFAULT_CFG):
	'''
	generate XMP files.

	ratings is an iterable of (rating, levels) pairs as yielded by
	rate(...). for each item in the levels the target path is resolved
	via getpath(root, name, path=...) with '.XMP' added, then the
	actions are called in order with (path, rating, label, data,
	config) until one of them returns a false value.

	NOTE: a string rating is taken to be a label, the numeric rating
	      is then set to 5.
	NOTE: a KeyError from getpath means the target was not found, the
	      item is skipped if skip_not_found is set, otherwise the
	      error is propagated.
	NOTE: action_dummy is never called.
	'''
	for rating, data in ratings:
		label = ''
		if type(rating) in (str, unicode):
			label, rating = rating, 5
		xmp_data = template % {'rating': rating, 'label': label}
		items = reduce(list.__add__, [ list(s['items']) for s in data ])
		for p, name in items:
			try:
				path = getpath(root, name, path=p) + '.XMP'
			except KeyError:
				if not skip_not_found:
					raise
				continue
			for action in actions:
				if action is not action_dummy \
						and not action(path, rating, label, xmp_data, config):
					break

#-----------------------------------------------------------------------
#------------------------------------------------------buildfilecache---
def buildfilecache(root, ext=DEFAULT_CFG['RAW_EXTENSION'], 
		skip_dirs=(DEFAULT_CFG['INPUT_DIR'],)):
	'''
	build a cache of all files in a tree with an extension ext.

	the cache is indexed by file name without extension, each value is
	a list of (directory, file name) pairs, one for each file found.

	NOTE: ext may be given with or without the leading dot.
	NOTE: directories named in skip_dirs are not descended into.
	NOTE: if more than one file with the same name is in the tree all
	      of them are kept, picking one is up to getfilepath(...).
	'''
	if not ext.startswith('.'):
		ext = '.' + ext
	res = {}
	for path, dirs, files in os.walk(root): 
		if path in skip_dirs:
			continue
		if len(skip_dirs) > 0:
			# NOTE: this is done in-place to make os.walk(...) skip
			# 		the directories...
			dirs[:] = [ d for d in dirs if d not in skip_dirs ]
		for f in files:
			if f.endswith(ext):
				base = '.'.join(f.split('.')[:-1])
				res.setdefault(base, []).append((path, f))
	return res


#-------------------------------------------------------bestpathmatch---
def bestpathmatch(source, paths, split=None):
	'''
	select closest path to source.

	source and each of the paths are compared element by element, if
	split is given it is used to break each of them into elements
	first. the result is the winning path in its split form.

	here we use two criteria to judge closeness:
		- depth/size of sub-tree.
		  a tree at a deeper location (smaller) beats the more general
		  (larger) sub-tree.
		  e.g. max length of identical path section starting from root 
		  wins.

		            A
		           / \          path AB is closer to AB(T) than A (obvious)
		          /   B
		         /   / \        path ABD is closer to AB(T) than AC
		        C   D  (T)

		- within a minimal sub-tree the shortest distance to sub-tree 
		  root wins.

		            A
		           /|\
		          / | \
		         B  C (T)       path AB is closer to T than ACD
		            |
		            D

	raises ValueError if there are no paths to choose from or if the
	choice is ambiguous.

	NOTE: we can not decide by our selves if two paths produce identical
		  scores.
		  e.g. paths AB and AC in the above diagram are at the same 
		  distance from T.
	NOTE: paths that share nothing with source are still candidates,
		  they just lose to any path that does.
	'''
	if split is not None:
		source = split(source)
	# NOTE: -1 is the score of a path that has nothing in common with
	# 		source...
	final_score = -1
	res = [] 

	for path in paths:
		score = -1
		if split is not None:
			path = split(path)
		# go through path components top down...
		for i, (a, b) in enumerate(zip(path, source)):
			if a != b:
				# miss/stop..
				break
			score = i
		# index results with max score...
		if score > final_score:
			final_score = score
			res = [path]
		# multiple possible matches (resolve on next stage)...
		elif score == final_score:
			res += [path]
	if len(res) == 0:
		raise ValueError('no candidate paths to match against source %s.' % (source,))
	if len(res) > 1:
		# we have two+ paths and we need to decide which is a better
		# match via length...
		l = [ len(p) for p in res ]
		if l.count(min(l)) > 1:
			raise ValueError('we have more than one %s candidate directories with identical priorities relative to source %s.' % (res, source))
		res = [res[l.index(min(l))]]
	return res[0]


#---------------------------------------------------------getfilepath---
def _splitpath(path):
	'''
	split a path into a list of its components.

	NOTE: the path is made absolute and normalized first so that paths
	      written in different ways can be compared.
	'''
	return os.path.normpath(os.path.abspath(path)).split(os.sep)


##!!! test for multiple matches...
def getfilepath(root, name, path=None, cache=None):
	'''
	find a file in a directory tree via cache and return it's path.

	cache is as returned by buildfilecache(...). path is the location
	of the thing we are looking a target for, it is used to pick the
	closest match if there is more than one (see: bestpathmatch(...)),
	if it is not given root is used.

	the result is the matching path without the file extension.

	raises KeyError if name is not in the cache and ValueError if
	there is more than one match that is equally close.

	NOTE: name should be given without an extension.
	NOTE: this ignores extensions.
	'''
	t_names = cache.get(name, ())
	if len(t_names) == 0:
		raise KeyError('file %s not found.' % name)
	if len(t_names) == 1:
		p, n = t_names[0]
	else:
		# select best path match...
		source = path if path is not None else root
		# NOTE: bestpathmatch(...) returns the path in split form, so we
		# 		index the candidates by it to get the original back...
		candidates = dict(
				(tuple(_splitpath(d)), (d, f)) 
					for d, f in t_names)
		best = bestpathmatch(_splitpath(source), list(candidates))
		p, n = candidates[tuple(best)]
	return os.path.join(p, '.'.join(n.split('.')[:-1]))


#-------------------------------------------------------builddircache---
def builddircache(root, name):
	'''
	build directory cache.

	walk the tree at root and collect the full paths of all the
	directories that are equal to name, indexed by directory name.

	NOTE: for simple name patterns this will return a single item.
	'''
	res = {}
	for path, dirs, _ in os.walk(root): 
		matching = [ d for d in dirs if d == name ]
		for d in matching:
			res.setdefault(d, []).append(os.path.join(path, d))
	return res


#----------------------------------------------------------getdirpath---
def getdirpaths(root, name, cache=None):
	'''
	generator to yield the directories cached under name.

	cache is as returned by builddircache(...), if name is not in it
	nothing is yielded.

	NOTE: root is not used.
	'''
##	# make this compatible with name patterns...
##	##!!! this seams to yield odd results -- fails with --search-input...
##	for d in chain(cache[n] for n in (k for k in cache.keys() if k == name)):
	if name in cache:
		for d in cache[name]:
			yield d


#-----------------------------------------------------------------------
#-----------------------------------------------------------------run---
def run():
	'''
	prepare configuration data and run.
	'''
	# setup config data...
	config, runtime_options = load_commandline(load_config_file(DEFAULT_CFG))

	# cache some names...
	output = config['OUTPUT_DIR']
	root = config['ROOT_DIR']
	input = config['INPUT_DIR']
	traverse_dir = config['TRAVERSE_DIR']
	threshold = config['THRESHOLD']
	raw_ext = config['RAW_EXTENSION']
	rate_top_level = config['RATE_TOP_LEVEL']
	search_input = config['SEARCH_INPUT']
	search_output = config['SEARCH_OUTPUT']
	verbosity = config['VERBOSITY']
	skip = config['SKIP']
	use_labels = config['USE_LABELS']
	overflow_strategy = config['OVERFLOW_STRATEGY']
	in_ext = OR(*config['INPUT_EXT'])

	# runtime options...
	dry_run = runtime_options.dry_run

	ratings = (config['LABELS'] if use_labels else []) + config['RATINGS']

	# prepare to count created files...
	files_written = [0]
	def action_count(*p, **n):
		files_written[0] += 1
		return True
	
	# do the actaual dance...
	res = generate(
		rate(
			index(
				# chose weather we need to skip the last element...
					collect(os.path.join(root, input), traverse_dir, rate_top_level, in_ext) 
						if not search_input 
						# locate correct preview dirs...
						else (reduce(list.__add__, l) 
									for l 
									in izip_longest(
											fillvalue=[], 
											*(collect(d, traverse_dir, rate_top_level, in_ext) 
										for d 
										in getdirpaths(
												root, 
												input, 
												builddircache(root, input)))))), 
			ratings=ratings,
			threshold=threshold,
			overflow_strategy=overflow_strategy), 
		output, 
		# find a location for each output file...
		##!!! we do not need to do this if collect returned no results...
		getpath=(curry(getfilepath, cache=buildfilecache(output, raw_ext, skip_dirs=skip)) 
					if search_output 
					# just write to ROOT...
					else join),
		# actions to perform per XMP file...
		actions=(
			action_logger,
			action_break if dry_run else action_dummy,
			action_filewriter,
			action_count,
		),
		template=config['XMP_TEMPLATE'],
		skip_not_found=config['SKIP_UNKNOWN_DESTINATIONS'],
		config=config)

	if verbosity >= 0:
		if verbosity == 1:
			print
		print 'Written %s files.' % files_written[0]

	return res

	
#-----------------------------------------------------------------------
# only run if executed as a script, importing the module does nothing...
if __name__ == '__main__':
	run()


#=======================================================================
#                                            vim:set ts=4 sw=4 nowrap :