| #! /usr/bin/python |
| |
| #changelog: |
| #10/13/2005b: replaced the # in tmp(.#*)* with alphanumeric and _, this will then remove |
| #nodes such as %tmp.1.i and %tmp._i.3 |
| #10/13/2005: exntended to remove variables of the form %tmp(.#)* rather than just |
| #%tmp.#, i.e. it now will remove %tmp.12.3.15 etc, additionally fixed a spelling error in |
| #the comments |
| #10/12/2005: now it only removes nodes and edges for which the label is %tmp.# rather |
| #than removing all lines for which the lable CONTAINS %tmp.# |
| import re |
| import sys |
| if( len(sys.argv) < 3 ): |
| print 'usage is: ./DSAclean <dot_file_to_be_cleaned> <out_put_file>' |
| sys.exit(1) |
| #get a file object |
| input = open(sys.argv[1], 'r') |
| output = open(sys.argv[2], 'w') |
| #we'll get this one line at a time...while we could just put the whole thing in a string |
| #it would kill old computers |
| buffer = input.readline() |
| while buffer != '': |
| if re.compile("label(\s*)=(\s*)\"\s%tmp(.\w*)*(\s*)\"").search(buffer): |
| #skip next line, write neither this line nor the next |
| buffer = input.readline() |
| else: |
| #this isn't a tmp Node, we can write it |
| output.write(buffer) |
| #prepare for the next iteration |
| buffer = input.readline() |
| input.close() |
| output.close() |