1e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#! /usr/bin/python
2e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao
3e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#changelog:
4e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#10/13/2005b: replaced the # in tmp(.#*)* with alphanumeric and _, this will then remove
5e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#nodes such as %tmp.1.i and %tmp._i.3
6e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#10/13/2005: exntended to remove variables of the form %tmp(.#)* rather than just
7e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#%tmp.#, i.e. it now will remove %tmp.12.3.15 etc, additionally fixed a spelling error in
8e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#the comments
9e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#10/12/2005: now it only removes nodes and edges for which the label is %tmp.# rather
10e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#than removing all lines for which the lable CONTAINS %tmp.#
11e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaoimport re
12e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaoimport sys
13e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaoif( len(sys.argv) < 3 ):
14e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao	print 'usage is: ./DSAclean <dot_file_to_be_cleaned> <out_put_file>'
15e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao	sys.exit(1)
16e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#get a file object
17e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaoinput = open(sys.argv[1], 'r')
18e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaooutput = open(sys.argv[2], 'w')
19e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#we'll get this one line at a time...while we could just put the whole thing in a string
20e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao#it would kill old computers
21e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaobuffer = input.readline()
22e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaowhile buffer != '':
23e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao	if re.compile("label(\s*)=(\s*)\"\s%tmp(.\w*)*(\s*)\"").search(buffer):
24e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao		#skip next line, write neither this line nor the next
25e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao		buffer = input.readline()
26e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao	else:
27e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao		#this isn't a tmp Node, we can write it
28e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao		output.write(buffer)
29e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao	#prepare for the next iteration
30e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liao	buffer = input.readline()
31e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaoinput.close()
32e264f62ca09a8f65c87a46d562a4d0f9ec5d457Shih-wei Liaooutput.close()
33