#!/usr/bin/python import os,re,sys,math,string from optparse import OptionParser, Option # ----------------------------- class extendableOption(Option): # ----------------------------- # used for definition of new option parser action 'extend', which enables to take multiple option arguments # taken from online tutorial http://docs.python.org/library/optparse.html ACTIONS = Option.ACTIONS + ("extend",) STORE_ACTIONS = Option.STORE_ACTIONS + ("extend",) TYPED_ACTIONS = Option.TYPED_ACTIONS + ("extend",) ALWAYS_TYPED_ACTIONS = Option.ALWAYS_TYPED_ACTIONS + ("extend",) def take_action(self, action, dest, opt, value, values, parser): if action == "extend": lvalue = value.split(",") values.ensure_value(dest, []).extend(lvalue) else: Option.take_action(self, action, dest, opt, value, values, parser) def L2(object): return math.sqrt(sum([x*x for x in object])) # -------------------------------------------------------------------- # MAIN # -------------------------------------------------------------------- parser = OptionParser(option_class=extendableOption, usage='%prog options [file[s]]', description = """ Add column(s) containing norm of requested column(s) being either vectors or tensors. """ + string.replace('$Id$','\n','\\n') ) parser.add_option('-m','--memory', dest='memory', action='store_true', \ help='load complete file into memory [%default]') parser.add_option('-v','--vector', dest='vector', action='extend', type='string', \ help='heading of columns containing vector field values') parser.add_option('-t','--tensor', dest='tensor', action='extend', type='string', \ help='heading of columns containing tensor field values') parser.set_defaults(memory = False) parser.set_defaults(vector = []) parser.set_defaults(tensor = []) (options,filenames) = parser.parse_args() if len(options.vector) + len(options.tensor) == 0: parser.error('no data column specified...') datainfo = { # list of requested labels per datatype 'vector': {'len':3, 'label':[]}, 'tensor': {'len':9, 'label':[]}, } if options.vector != None: datainfo['vector']['label'] += options.vector if options.tensor != None: datainfo['tensor']['label'] += options.tensor # ------------------------------------------ setup file handles --------------------------------------- files = [] if filenames == []: files.append({'name':'STDIN', 'input':sys.stdin, 'output':sys.stdout}) else: for name in filenames: if os.path.exists(name): files.append({'name':name, 'input':open(name), 'output':open(name+'_tmp','w')}) # ------------------------------------------ loop over input files --------------------------------------- for file in files: print file['name'] # get labels by either read the first row, or - if keyword header is present - the last line of the header firstline = file['input'].readline() m = re.search('(\d+)\s*head', firstline.lower()) if m: headerlines = int(m.group(1)) passOn = [file['input'].readline() for i in range(1,headerlines)] headers = file['input'].readline().split() else: headerlines = 1 passOn = [] headers = firstline.split() if options.memory: data = file['input'].readlines() else: data = [] for i,l in enumerate(headers): if l.startswith('1_'): if re.match('\d+_',l[2:]) or i == len(headers)-1 or not headers[i+1].endswith(l[2:]): headers[i] = l[2:] active = {} column = {} head = [] for datatype,info in datainfo.items(): for label in info['label']: key = {True :'1_%s', False:'%s' }[info['len']>1]%label if key not in headers: sys.stderr.write('column %s not found...\n'%key) else: if datatype not in active: active[datatype] = [] if datatype not in column: column[datatype] = {} active[datatype].append(label) column[datatype][label] = headers.index(key) head.append('norm(%s)'%label) # ------------------------------------------ assemble header --------------------------------------- output = '%i\theader'%(headerlines+1) + '\n' + \ ''.join(passOn) + \ string.replace('$Id$','\n','\\n')+ '\t' + \ ' '.join(sys.argv[1:]) + '\n' + \ '\t'.join(headers + head) + '\n' # build extended header if not options.memory: file['output'].write(output) output = '' # ------------------------------------------ read file --------------------------------------- for line in {True : data, False : file['input']}[options.memory]: items = line.split()[:len(headers)] if len(items) < len(headers): continue output += '\t'.join(items) for datatype,labels in active.items(): for label in labels: theNorm = L2(map(float,items[column[datatype][label]: column[datatype][label]+datainfo[datatype]['len']])) output += '\t%f'%theNorm output += '\n' if not options.memory: file['output'].write(output) output = '' file['input'].close() # ------------------------------------------ output result --------------------------------------- if options.memory: file['output'].write(output) if file['name'] != 'STDIN': file['output'].close os.rename(file['name']+'_tmp',file['name'])