Home | History | Annotate | Download | only in utils
      1 #! /usr/bin/python
      2 
      3 #changelog: 
      4 #10/13/2005b: replaced the # in tmp(.#*)* with alphanumeric and _, this will then remove
      5 #nodes such as %tmp.1.i and %tmp._i.3
      6 #10/13/2005: exntended to remove variables of the form %tmp(.#)* rather than just 
      7 #%tmp.#, i.e. it now will remove %tmp.12.3.15 etc, additionally fixed a spelling error in
      8 #the comments
      9 #10/12/2005: now it only removes nodes and edges for which the label is %tmp.# rather
     10 #than removing all lines for which the lable CONTAINS %tmp.#
     11 import re
     12 import sys
     13 if( len(sys.argv) < 3 ):
     14 	print 'usage is: ./DSAclean <dot_file_to_be_cleaned> <out_put_file>'
     15 	sys.exit(1)
     16 #get a file object
     17 input = open(sys.argv[1], 'r')
     18 output = open(sys.argv[2], 'w')
     19 #we'll get this one line at a time...while we could just put the whole thing in a string
     20 #it would kill old computers
     21 buffer = input.readline()
     22 while buffer != '':
     23 	if re.compile("label(\s*)=(\s*)\"\s%tmp(.\w*)*(\s*)\"").search(buffer):
     24 		#skip next line, write neither this line nor the next
     25 		buffer = input.readline()
     26 	else:
     27 		#this isn't a tmp Node, we can write it
     28 		output.write(buffer)
     29 	#prepare for the next iteration
     30 	buffer = input.readline()
     31 input.close()
     32 output.close()
     33