#!/usr/bin/env python import os,re,sys,math,string,damask from optparse import OptionParser, Option # ----------------------------- class extendableOption(Option): # ----------------------------- # used for definition of new option parser action 'extend', which enables to take multiple option arguments # taken from online tutorial http://docs.python.org/library/optparse.html ACTIONS = Option.ACTIONS + ("extend",) STORE_ACTIONS = Option.STORE_ACTIONS + ("extend",) TYPED_ACTIONS = Option.TYPED_ACTIONS + ("extend",) ALWAYS_TYPED_ACTIONS = Option.ALWAYS_TYPED_ACTIONS + ("extend",) def take_action(self, action, dest, opt, value, values, parser): if action == "extend": lvalue = value.split(",") values.ensure_value(dest, []).extend(lvalue) else: Option.take_action(self, action, dest, opt, value, values, parser) # -------------------------------------------------------------------- # MAIN # -------------------------------------------------------------------- parser = OptionParser(option_class=extendableOption, usage='%prog options [file[s]]', description = """ Add column(s) with derived values according to user defined arithmetic operation between column(s). Columns can be specified either by label or index. Use ';' for ',' in functions. Example: distance to IP coordinates -- "math.sqrt( #ip.x#**2 + #ip.y#**2 + round(#ip.z#;3)**2 )" """ + string.replace('$Id$','\n','\\n') ) parser.add_option('-l','--label', dest='labels', action='extend', type='string', \ help='(list of) new column labels', metavar='') parser.add_option('-f','--formula', dest='formulas', action='extend', type='string', \ help='(list of) formulas corresponding to labels', metavar='') parser.set_defaults(labels= []) parser.set_defaults(formulas= []) (options,filenames) = parser.parse_args() if len(options.labels) != len(options.formulas): parser.error('number of labels (%i) and formulas (%i) do not match'%(len(options.labels),len(options.formulas))) for i in xrange(len(options.formulas)): options.formulas[i]=options.formulas[i].replace(';',',') # ------------------------------------------ setup file handles --------------------------------------- files = [] if filenames == []: files.append({'name':'STDIN', 'input':sys.stdin, 'output':sys.stdout}) else: for name in filenames: if os.path.exists(name): files.append({'name':name, 'input':open(name), 'output':open(name+'_tmp','w')}) # ------------------------------------------ loop over input files --------------------------------------- for file in files: if file['name'] != 'STDIN': print file['name'] specials = { \ '_row_': 0, } table = damask.ASCIItable(file['input'],file['output'],False) # make unbuffered ASCII_table table.head_read() # read ASCII header info table.info_append(string.replace('$Id$','\n','\\n') + \ '\t' + ' '.join(sys.argv[1:])) column = {} evaluator = {} for label,formula in zip(options.labels,options.formulas): table.labels_append(label) interpolator = [] for position,operand in enumerate(set(re.findall(r'#(.+?)#',formula))): formula = formula.replace('#'+operand+'#','{%i}'%position) if operand in specials: interpolator += ['specials["%s"]'%operand] elif operand.isdigit(): if len(table.labels) > int(operand): interpolator += ['float(table.data[%i])'%(int(operand))] else: parser.error('column %s not present...\n'%operand) else: try: interpolator += ['float(table.data[%i])'%table.labels.index(operand)] except: parser.error('column %s not found...\n'%operand) evaluator[label] = "'" + formula + "'.format(" + ','.join(interpolator) + ")" # ------------------------------------------ assemble header --------------------------------------- table.head_write() # ------------------------------------------ process data --------------------------------------- outputAlive = True while outputAlive and table.data_read(): # read next data line of ASCII table specials['_row_'] += 1 # count row for label in options.labels: table.data_append(eval(eval(evaluator[label]))) outputAlive = table.data_write() # output processed line # ------------------------------------------ output result --------------------------------------- outputAlive and table.output_flush() # just in case of buffered ASCII table file['input'].close() # close input ASCII table if file['name'] != 'STDIN': file['output'].close() # close output ASCII table os.rename(file['name']+'_tmp',file['name']) # overwrite old one with tmp new