sedsed

#!/usr/bin/env python
# sedsed - the SED mastering script
# Since 27 November 2001, by Aurelio Marinho Jargas
# For ChangeLog and Documentation, see http://sedsed.sf.net

import sys, re, os, getopt, string, tempfile

myname    = 'sedsed'
myversion = '1.0'
myhome    = 'http://sedsed.sf.net'


#-------------------------------------------------------------------------------
#                              User Configuration
#-------------------------------------------------------------------------------

# Default config - Changeable, but you won't need to do it
sedbin = 'sed'                # name (or full path) of the sed program
color = 1                     # colored output or not? (--color, --nocolor)
dump_debug = 0                # dump debug script to screen? (--dump-debug)
indent_prefix = ' '*4         # default indent prefix for blocks (--prefix)
debug_prefix = '\t\t'         # default prefix for debug commands
action = 'indent'             # default action if none specified (-d,-i,-t,-H)
DEBUG = 0                     # set developper's debug level [0-3]
EMUDEBUG = 0                  # emulator have it's own debug [0-3]

# HTML colors for --htmlize
# You may edit here to change the default colors
html_colors = {
  'addr1'    : '#8080ff',
  'addr1flag': '#ff6060',
  'addr2'    : '#8080ff',
  'addr2flag': '#ff6060',
  'lastaddr' : '',
  'modifier' : '#ff6060',
  'id'       : '#ffff00',
  'content'  : '#ff00ff',
  'delimiter': '#ff6060',
  'pattern'  : '#8080ff',
  'replace'  : '',
  'flag'     : '#00ff00',
  'extrainfo': '',
  'comment'  : '#00ffff',
  'escape'   : '#ff6060',
  'special'  : '#00ff00',
  'pattmeta' : '#ff00ff',
  'plaintext': '',
  'branch'   : '',
  'BGCOLOR'  : '#000000',
  'TEXT'     : '#ffffff',
  'LINK'     : '#ff00ff',
  'ALINK'    : '#ff00ff',
  'VLINK'    : '#ff00ff'
}


#-------------------------------------------------------------------------------
#                              General Functions
#-------------------------------------------------------------------------------

def printUsage(exitcode=1):
	print """
Usage: sedsed OPTION [-e sedscript] [-f sedscriptfile] [inputfile]

OPTIONS:

     -f, --file          add file contents to the commands to be parsed
     -e, --expression    add the script to the commands to be parsed
     -n, --quiet         suppress automatic printing of pattern space
         --silent        alias to --quiet

     -d, --debug         debug the sed script
         --hide          hide some debug info (options: PATT,HOLD,COMM)
         --color         shows debug output in colors (default: ON)
         --nocolor       no colors on debug output
         --dump-debug    dumps to screen the debugged sed script

         --emu           emulates GNU sed (INCOMPLETE)
         --emudebug      emulates GNU sed debugging the sed script (INCOMPLETE)

     -i, --indent        script beautifier, prints indented and
                         one-command-per-line output do STDOUT
         --prefix        indent prefix string (default: 4 spaces)

     -t, --tokenize      script tokenizer, prints extensive
                         command by command information
     -H, --htmlize       converts sed script to a colorful HTML page

     -V, --version       prints the program version and exit
     -h, --help          prints this help message and exit


NOTE: The --emu and --emudebug options are still INCOMPLETE and must
      be used with care. Mainly regexes and address $ (last line)
      are not handled right by the emulator.
"""
	print "Homepage: %s\n"%myhome
	sys.exit(exitcode)

def Error(msg):
	"All error messages are handled by me"
	print 'ERROR:',msg ; sys.exit(1)

def echo(msg): print "\033[33;1m%s\033[m"%msg

def Debug(msg, level=1):
	if DEBUG and DEBUG >= level: print '+++ DEBUG%d: %s'%(level,msg)

def read_file(file):
	"Reads a file into a list, removing line breaks"
	if file == '-':
		try: data = sys.stdin.readlines()
		except: Error('I was expecting data on STDIN!')
	else:
		try: f = open(file); data = f.readlines() ; f.close()
		except: Error("Cannot read file: %s"%file)
	return map(lambda x:re.sub('[\n\r]+$','',x), data)

def write_file(file, lines=[]):
	"Writes a list contents into file, adding correct line breaks"
	try: f = open(file, 'wb')
	except: Error("Cannot open file for writing: %s"%file)
	#TODO maybe use os.linesep? - all this is really necessary?
	# ensuring line break
	lines = map(lambda x:re.sub('\n$','',x)+'\n', lines)
	f.writelines(lines); f.close()

def runCommand(cmd): # Returns a (#exit_code, program_output[]) tuple
	#TODO dont use popen()
	list = [] ; fd = os.popen(cmd)
	for line in fd.readlines():
		list.append(string.rstrip(line))  # stripping \s*\n
	ret = fd.close()
	if ret: ret = ret/256  # 16bit number
	return ret, list


#-------------------------------------------------------------------------------
#                           Command line & Config
#-------------------------------------------------------------------------------

# Here's all the valid command line options
short_options = 'he:f:ditVHn'
long_options = [
  'debug', 'tokenize', 'htmlize', 'indent',                     # actions
  'version', 'help', 'file=', 'expression=', 'silent', 'quiet', # sed-like
  'nocolor', 'color', 'hide=', 'prefix=', 'emu', 'emudebug',    # misc
  'dump-debug',                                                 # other
  '_debuglevel=','_emudebuglevel=','_stdout-only', 'dumpcute']  # admin

# Check it!
try: opt, args = getopt.getopt(sys.argv[1:], short_options, long_options)
except getopt.error, errmsg: Error("%s (try --help)"%errmsg)

# Turn color OFF on Windows because ANSI.SYS is not installed by default.
# Windows users who have ANSY.SYS configured, can use the --color option
# or comment the following line.
# ANSY.SYS ressources:
#   http://www.evergreen.edu/biophysics/technotes/program/ansi_esc.htm#notes
#   http://www3.sympatico.ca/rhwatson/dos7/v-ansi-escseq.html
if os.name == 'nt': color = 0

# Command Line is OK, now let's parse its values
action_modifiers = []             # --hide contents and others
sedscript = []                    # join all scripts found here
script_file = ''                  # old sedscript filename for --htmlize
quiet_flag = 0                    # tell if the #n is needed or not

for o in opt:
	if   o[0] in ('-d', '--debug')     : action = 'debug'
	elif o[0] in ('-i', '--indent')    : action = 'indent'; color = 0
	elif o[0] in ('-t', '--tokenize')  : action = 'token' ; color = 0
	elif o[0] in ('-H', '--htmlize')   : action = 'html'  ; color = 0
	elif o[0] in ('-n', '--quiet')     : quiet_flag = 1
	elif o[0] in ('-e', '--expression'): sedscript.append(o[1])
	elif o[0] in ('-f', '--file')      :
		sedscript.extend(read_file(o[1]))
		script_file = o[1]
	elif o[0] in ('-h', '--help')      : printUsage(0)
	elif o[0] in ('-V', '--version')   :
		print '%s v%s'%(myname,myversion)
		sys.exit(0)
	elif o[0] == '--emu'       : action = 'emu'
	elif o[0] == '--emudebug'  : action = 'emudebug'
	elif o[0] == '--dump-debug': action = 'debug' ; dump_debug=1 ; color=0
	elif o[0] == '--nocolor'   : color = 0
	elif o[0] == '--color'     : color = 1
	elif o[0] == '--hide':                        # get hide options
		for hide in string.split(o[1], ','):  # save as no<OPT>
			hide_me = string.lower(string.strip(hide))
			action_modifiers.append('no'+hide_me)
	elif o[0] == '--prefix':
		if re.sub('\s', '', o[1]):            # prefix is valid?
			Error("--prefix: must be spaces and/or TABs")
		indent_prefix = o[1]
	# not documented admin options
	elif o[0] == '--_debuglevel'   : DEBUG = int(o[1])
	elif o[0] == '--_emudebuglevel': EMUDEBUG = int(o[1])
	elif o[0] == '--_stdout-only':
		action = 'debug'
		action_modifiers.append(o[0][2:])
	elif o[0] == '--dumpcute':
		action = 'dumpcute'; DEBUG = 0; color = 1

# Now all Command Line options were sucessfuly parsed


#-------------------------------------------------------------------------------
#                              Sanity Checkings
#-------------------------------------------------------------------------------

# There's a SED script?
if not sedscript:
	if args:          # the script is the only argument (echo | sed 's///')
		sedscript.append(args.pop(0))
	else:             # :(
		Error("there's no SED script to parse! (try --help)")

# Get all text files, if none, use STDIN (-)
textfiles = args or ['-']

# On --debug, check the given script syntax, runnig SED with it.
# We will not debug a broken script.
#XXX there is a problem with popen() and win9x machines
#    so i'm skipping this check for those machines
#TODO redo this check using !runCommand
if action == 'debug' and os.name != 'nt':
	tmpfile = tempfile.mktemp()
	write_file(tmpfile, sedscript)
	ret, msg = runCommand("%s -f '%s' /dev/null"%(sedbin,tmpfile))
	if ret:
		msg = 'syntax error on your SED script, please fix it before.'
		Error('#%d: %s' % (ret,msg))
	os.remove(tmpfile)


#-------------------------------------------------------------------------------
#                    Internal Config Adjustments and Magic
#-------------------------------------------------------------------------------

# Add the leading #n to the sed script, when using -n
if quiet_flag: sedscript.insert(0, '#n')

# Add the terminal escapes for color (or not)
if color:
	color_YLW = '\033[33;1m'  # yellow text
	color_RED = '\033[31;1m'  # red text
	color_REV = '\033[7m'     # reverse video
	color_NO  = '\033[m'      # back to default
else:
	color_YLW = color_RED = color_REV = color_NO = ''


### The SED debugger magic lines
#
# Here is where the 'magic' lives. The heart of this program are the
# following lines, which are the special SED commands responsable for
# the DEBUG behaviour. For *each* command of the original script,
# several commands are added before, to show buffers and command
# contents. Some tricks are needed to preserve script's original
# behaviour, they are explained ahead.
#
# 1. Show PATTERN SPACE contents:
#    The 'PATT:' prefix is added, then the 'l' command shows the
#    buffer contents, then the prefix is removed.
#
# 2. Show HOLD SPACE contents:
#    Similar to PATTERN SPACE, but use the 'x' command to access and
#    restore the HOLD buffer contents. The prefix used is 'HOLD:'.
#
# 3. Show current SED COMMAND:
#    Uses a single 'i' command to show the full 'COMM:' line, as it
#    does not depend on execution data. The color codes are added or
#    not, depending on user options.
#
# 4. 'Last Address' trick:
#    On SED, the empty address // refers to the last address matched.
#    As this behaviour can be affected when several DEBUG lines are
#    inserted before the command, sedsed uses a trick to force it.
#    The last address used on the original script is repeated with a
#    null command (/last-address/ y/!/!/). This way sedsed repeat the
#    addressing, ensuring the next command will have it as the right
#    'last' address.
#
# 5. 't Status' trick:
#    The 't' command behaviour, from SED manual page:
#
#        If a s/// has done a successful substitution since the last
#        input line was read and since the last t command, then branch
#        to label
#
#    As all the DEBUG commands use lots of 's///' commands, the 't'
#    status is always true. The trick here is to add fake labels
#    between *any* command and fake 't' commands to jump to them:
#
#        <last command, possibly s///>
#        t zzset001
#        ... debug commands ...
#        t zzclr001
#        : zzset001
#        ... debug commands ...
#        : zzclr001
#        <next command, possibly t>
#
#    The DEBUG commands are repeated and placed into two distinct
#    blocks: 'zzset' and 'zzclr', which represents the 't' status
#    of the last command. The execution order follows:
#
#       zzset: 1st jump (t), then debug (s///), t status is ON
#       zzclr: 1st debug (s///), then jump (t), t status is OFF
#
#    The 001 count is incremented on each command to have unique
#    labels.
#
#
#                   --- THANK YOU VERY MUCH ---
#
# - Paolo Bonzini (GNU sed 4.x maintainer) for the idea of the
#   't status' trick.
#
# - Thobias Salazar Trevisan for the idea of using the 'i'
#   command for the COMM: lines.
#

# show pattern space, show hold space, show sed command
# null sed command to restore last address, 't' status trick
showpatt = [     's/^/PATT:/', 'l', 's/^PATT://'     ]
showhold = ['x', 's/^/HOLD:/', 'l', 's/^HOLD://', 'x']
showcomm = ['i\\','COMM:%s\a%s'%(color_YLW, color_NO)]
nullcomm = ['y/!/!/']
save_t   = ['t zzset\a\n#DEBUG#', 't zzclr\a',
            ':zzset\a\n#DEBUG#' , ':zzclr\a' ]

def format_debugcmds(cmds):
	"One per line, with prefix (spaces)"
	return debug_prefix + string.join(cmds, '\n'+debug_prefix) + '\n'

showpatt = format_debugcmds(showpatt)
showhold = format_debugcmds(showhold)
save_t   = format_debugcmds(save_t  )
showcomm = debug_prefix+string.join(showcomm, '\n')+'\n'
nullcomm = nullcomm[0]


# If user specified --hide, unset DEBUG commands for them
if action_modifiers.count('nopatt'): showpatt = ''    # don't show!
if action_modifiers.count('nohold'): showhold = ''    # don't show!
if action_modifiers.count('nocomm'): showcomm = ''    # don't show!


# Compose HTML page header and footer info for --htmlize.
# The SCRIPTNAME is added then removed from html_colors for
# code convenience only.
#
html_colors['SCRIPTNAME'] = os.path.basename(script_file)
html_data = {
                   'header': """\
<html>
<head><meta name="Generator" content="sedsed --htmlize">
<title>Colorized %(SCRIPTNAME)s</title></head>
<body bgcolor="%(BGCOLOR)s" text="%(TEXT)s"
      link="%(LINK)s" alink="%(ALINK)s" vlink="%(VLINK)s">
<pre>
"""%html_colors,
                   'footer': """
<font color="%s"><b>### colorized by <a \
href="http://sedsed.sf.net">sedsed</a>, a SED script \
debugger/indenter/tokenizer/HTMLizer</b></font>\n
</pre></body></html>\
"""%html_colors['comment']
}
del html_colors['SCRIPTNAME']


#-------------------------------------------------------------------------------
#                              SED Machine Data
#-------------------------------------------------------------------------------

# All SED commands grouped by kind
sedcmds = {
  'file' : 'rw'            ,
  'addr' : '/$0123456789\\',
  'multi': 'sy'            ,
  'solo' : 'nNdDgGhHxpPlq=',
  'text' : 'aci'           ,
  'jump' : ':bt'           ,
  'block': '{}'            ,
  'flag' : 'gpIi0123456789w'
}

# Regex patterns to identify special entities
patt = {
  'jump_label': r'[^\s;}#]*'             ,  # _any_ char except those, or None
  'filename'  : r'[^\s]+'                ,  # _any_ not blank char (strange..)
  'flag'      : r'[%s]+'%sedcmds['flag'] ,  # list of all flags
  'topopts'   : r'#!\s*/[^\s]+\s+-([nf]+)'  # options on #!/bin/sed header
}

# All fields used by the internal SED command dictionary
cmdfields = [
  'linenr',
  'addr1', 'addr1flag', 'addr2', 'addr2flag', 'lastaddr', 'modifier',
  'id', 'content', 'delimiter', 'pattern', 'replace', 'flag',
  'extrainfo', 'comment'
]
#XXX Don't change the order! There is a piggy cmdfields[6:] ahead


#-------------------------------------------------------------------------------
#                         Auxiliar Functions - Tools
#-------------------------------------------------------------------------------

def escapeTextCommandsSpecials(str):
	str = string.replace(str, '\\', '\\\\')         # escape escape
	return str

def isOpenBracket(str):
	# bracket open:  [   \\[   \\\\[ ...
	# not bracket : \[  \\\[  \\\\\[ ...
	isis = 0
	delim = '['
	str = re.sub('\[:[a-z]+:]', '', str)            # del [:charclasses:]
	if string.find(str, delim) == -1: return 0      # hey, no brackets!

	# Only the last two count
	patterns = string.split(str, delim)[-2:]
	Debug('bracketpatts: %s'%patterns,3)
	possibleescape, bracketpatt = patterns

	# Maybe the bracket is escaped, and is not a metachar?
	m = re.search(r'\\+$', possibleescape)          # escaped bracket
	if m and len(m.group(0))%2:                     # odd number of escapes
		Debug('bracket INVALID! - escaped',2)
		isis = 0
	elif string.find(bracketpatt, ']') == -1:       # not closed by ]
		Debug('bracket OPEN! - found! found!',2)
		isis = 1                                # it is opened! &:)

	return isis

def paintHtml(id, txt=''):
	# Escape HTML special chars
	if txt:
		txt = string.replace(txt, '&', '&amp;')
		txt = string.replace(txt, '>', '&gt;')
		txt = string.replace(txt, '<', '&lt;')
	# Some color adjustments and emphasis
	if   id == 'id' and txt in sedcmds['block']:
		id = 'delimiter'
	elif id == 'id' and txt == ':':
		id = 'content'
	elif id == 'replace':   # highlight \n, & and \$
		newtxt = paintHtml('special', '\\'+linesep)
		txt = string.replace(txt, '\\'+linesep, newtxt)
		txt = re.sub(
		      '(\\\\[1-9]|&amp;)', paintHtml('special', '\\1'), txt)
	elif id == 'pattern':   # highlight ( and |
		txt = re.sub(
		      '(\\\\)([(|])', '\\1'+paintHtml('pattmeta', '\\2'), txt)
	elif id == 'plaintext': # highlight \$
		newtxt = paintHtml('special', '\\'+linesep)
		txt = string.replace(txt, '\\'+linesep, newtxt)
	elif id == 'branch':    # nice link to the label!
		txt = '<a href="#%s">%s</a>'%(txt,txt)
	elif id == 'target':    # link target
		txt = '<a name="%s">%s</a>'%(txt,txt)
		id = 'content'
	# Paint it!
	if html_colors.get(id) and txt:
		font_color = html_colors[id]
		txt = '<font color="%s"><b>%s</b></font>'%(font_color, txt)
	return txt


#-------------------------------------------------------------------------------
#                 SedCommand class - Know All About Commands
#-------------------------------------------------------------------------------

# TIP: SedCommand already receives lstrip()ed data and data != None
class SedCommand:
	def __init__(self, abcde):
		self.id = abcde[0]   # s
		self.content = ''    # txt, filename
		self.modifier = ''   # !
		self.full = ''       # !s/abc/def/g

		# for s/// & y///
		self.pattern = ''    # abc
		self.replace = ''    # def
		self.delimiter = ''  # /
		self.flag = ''       # g

		self.isok = 0
		self.comment = ''
		self.rest = self.junk = abcde
		self.extrainfo = ''

		if self.id == '!':
			self.modifier = self.id                  # set modifier
			self.junk = string.lstrip(self.junk[1:]) # del !@junk
			self.id = self.junk[0]                   # set id again
		self.junk = self.junk[1:]                     # del id@junk

		#self.setId()
		self.doItAll()

	def doItAll(self):
		# here, junk arrives without the id, but not lstripped (s///)
		id = self.id

		#TODO put pending comment on the previous command (h ;#comm)
		if id == '#':
			Debug('type: comment',3)
			self.comment = self.id+self.junk
			self.junk = ''
			self.isok = 1

		elif id in sedcmds['solo']:
			Debug('type: solo',3)
			self.isok = 1
		elif id in sedcmds['block']:
			Debug('type: block',3)
			self.isok = 1
		elif id in sedcmds['text']:
			Debug('type: text',3)
			if self.junk[-1] != '\\': # if not \ at end, finished
				# ensure \LineSep at begining
				self.content = re.sub(
				               r'^\\%s'%linesep, '', self.junk)
				self.content = '\\%s%s'%(linesep,self.content)
				self.isok = 1

		elif id in sedcmds['jump']:
			Debug('type: jump',3)
			self.junk = string.lstrip(self.junk)
			m = re.match(patt['jump_label'], self.junk)
			if m:
				self.content = m.group()
				self.junk = self.junk[m.end():]
				self.isok = 1

		elif id in sedcmds['file']:
		#TODO deal with valid cmds like 'r bla;bla' and 'r bla ;#comm'
		#TODO spaces and ; are valid as filename chars
			Debug('type: file',3)
			self.junk = string.lstrip(self.junk)
			m = re.match(patt['filename'], self.junk)
			if m:
				self.content = m.group()
				self.junk = self.junk[m.end():]
				self.isok = 1

		elif id in sedcmds['multi']:                  # s/// & y///
			Debug('type: multi',3)
			self.delimiter = self.junk[0]
			ps = SedAddress(self.junk)
			hs = ''
			if ps.isok:
				self.pattern = ps.pattern
				self.junk = ps.rest
				# 'replace' opt to avoid openbracket check,
				# because 's/bla/[/' is ok
				hs = SedAddress(self.delimiter+self.junk,
				                'replace')
				if hs.isok:
					self.replace = hs.pattern
					self.junk = string.lstrip(hs.rest)

					# great, s/patt/rplc/ sucessfully taken

			if hs and hs.isok and self.junk:    # there are flags?
				Debug('possible s/// flag: %s'%self.junk,3)
				m = re.match('(%s\s*)+'%patt['flag'],self.junk)
				if m:
					self.flag = m.group()
					self.junk = string.lstrip(
					   self.junk[m.end():]) # del flag
					self.flag = re.sub(
					   '\s','',self.flag)  # del blanks@flag
					Debug('FOUND s/// flag: %s'%(
					   string.strip(self.flag)))

					### now we've got flags also

				if 'w' in self.flag:         # write file flag
					m = re.match(patt['filename'],self.junk)
					if m:
						self.content = m.group()
						Debug('FOUND s///w filename: %s'%self.content)
						self.junk = string.lstrip(
						            self.junk[m.end():])

						### and now, s///w filename
						### is saved also

			if hs and hs.isok: self.isok = 1

		else:
			Error("invalid SED command '%s' at line %d"%(id,linenr))

		if self.isok:
			self.full = composeSedCommand(vars(self))
			self.full = string.replace(self.full, '\n', linesep)
			self.rest = string.lstrip(self.junk)
			Debug('FOUND command: %s'%self.full)
			Debug('rest left: %s'%self.rest,2)

			possiblecomment = self.rest
			if possiblecomment and possiblecomment[0] == '#':
				self.comment = possiblecomment
				Debug('FOUND comment: %s'%self.comment)
		Debug('SedCommand: %s'%vars(self),3)


#-------------------------------------------------------------------------------
#                 SedAddress class - Know All About Addresses
#-------------------------------------------------------------------------------

#TIP an address is NOT multiline
class SedAddress:
	def __init__(self, abcde, context='addr'):
		self.delimiter = ''
		self.pattern = ''
		self.flag = ''
		self.full = ''
		self.html = ''

		self.isline = 0
		self.isok = 0
		self.escape = ''
		self.rest = self.junk = abcde
		self.context = context

		self.setType()                           # numeric or pattern?
		self.doItAll()
		Debug('SedAddress: %s'%vars(self),3)

	def doItAll(self):
		if self.isline: self.setLineAddr()
		else          : self.setPattAddr()

		if self.isok:
			self.full = '%s%s%s%s'%(
			            self.escape,
			            self.delimiter,
			            self.pattern,
			            self.delimiter)
			if action == 'html':
				self.html = '%s%s%s%s'%(
				   paintHtml('escape'   , self.escape   ),
				   paintHtml('delimiter', self.delimiter),
				   paintHtml('pattern'  , self.pattern  ),
				   paintHtml('delimiter', self.delimiter))
			Debug('FOUND addr: %s'%self.full)

			cutlen = len(self.full)+len(self.flag)
			self.rest = self.rest[cutlen:]      # del junk's addr
			self.flag = string.strip(self.flag) # del flag's blank
			Debug('rest left: %s'%self.rest,2)
		else:
			Debug('OH NO! partial addr: %s'%self.rest)

	def setType(self):
		id = self.junk[0]
		if re.match('[0-9$]', id):        # numeric addr, easy!
			self.isline = 1
		else:                             # oh no, pattern
			if id == '\\':                # strange delimiter (!/)
				self.escape = '\\'
				self.junk = self.junk[1:] # del escape
			self.delimiter = self.junk[0] # set delimiter
			self.junk = self.junk[1:]     # del delimiter@junk

	def setLineAddr(self):
		m = re.match(r'[0-9]+|\$', self.junk)
		self.pattern = m.group(0)
		self.isok = 1

	def setPattAddr(self):
		###
		# similar to command finder:
		# - split at pattern delimiter
		# - if address not terminated, join with next split chunk (loop)
		# - address found, return it
		#
		# We can deal with really catchy valid addresses like:
		#   /\/[/]\\/   and   \;\;[;;]\\;
		incompleteaddr = ''

		Debug('addr delimiter: '+self.delimiter,2)
		patterns = string.split(self.junk, self.delimiter)
		Debug('addr patterns: %s'%patterns,2)

		while patterns:
			possiblepatt = patterns.pop(0)

			# if address not terminated, join next
			if incompleteaddr:
				possiblepatt = string.join(
				               [incompleteaddr, possiblepatt],
				               self.delimiter)
				incompleteaddr = ''
			Debug('possiblepatt: '+possiblepatt,2)

			# maybe splitted at a (valid) escaped delimiter?
			if re.search(r'\\+$', possiblepatt):
				m = re.search(r'\\+$', possiblepatt)
				if len(m.group(0))%2:
					Debug('address INCOMPLETE! - ends with \\ alone')
					incompleteaddr = possiblepatt
					continue

			if self.context != 'replace':
				# maybe splitted at a delimiter inside
				# char class []?
				# BUG: []/[] is not catched - WONTFIX
				if isOpenBracket(possiblepatt):
					Debug('address INCOMPLETE! - open bracket')
					incompleteaddr = possiblepatt
					continue

			break                          # it's an address!

		if patterns:                      # must have something left
			if patterns[0]:                # the rest is a flag?
				Debug('possible addr flag: %s'%patterns[0],3)
				m = re.match('\s*I\s*', patterns[0])
				if m:                       # yes, a flag!
					self.flag = m.group()    # set addr flag
					Debug('FOUND addr flag: %s'%(
					      string.strip(self.flag)))
			self.pattern = possiblepatt
			self.isok = 1


#-------------------------------------------------------------------------------
#                 Hardcore Address/Command Composer Functions
#-------------------------------------------------------------------------------

def composeSedAddress(dict):
	addr1 = ''
	if action == 'html':
		if dict['addr1']: addr1 = dict['addr1html']
		if dict['addr2']: addr2 = dict['addr2html']
	else:
		addr1 = '%s%s'%(dict['addr1'],dict['addr1flag'])
		if dict['addr2']:
			addr2 = '%s%s'%(dict['addr2'],dict['addr2flag'])

	if dict['addr2']: addr = '%s,%s'%(addr1,addr2)
	else: addr = addr1

	if addr: addr = '%s '%(addr)  # visual addr/cmd separation
	return addr

def composeSedCommand(dict):
	if dict['delimiter']:         # s///
		if action != 'html':
			cmd = '%s%s%s%s%s%s%s%s'%(
			    dict['modifier'] ,dict['id'],
			    dict['delimiter'],dict['pattern'],
			    dict['delimiter'],dict['replace'],
			    dict['delimiter'],dict['flag'])
			if dict['content']:   # s///w filename
				cmd = cmd+' '+dict['content']
		else:
			cmd = """%s%s%s%s%s%s%s%s"""%(
			    paintHtml('modifier' , dict['modifier'] ),
			    paintHtml('id'       , dict['id']       ),
			    paintHtml('delimiter', dict['delimiter']),
			    paintHtml('pattern'  , dict['pattern']  ),
			    paintHtml('delimiter', dict['delimiter']),
			    paintHtml('replace'  , dict['replace']  ),
			    paintHtml('delimiter', dict['delimiter']),
			    paintHtml('flag'     , dict['flag']     ))
			if dict['content']:   # s///w filename
				painted = paintHtml('content', dict['content'])
				cmd = '%s %s'%(cmd, painted)
	else:
		idsep=''
		# spacer on r,w,b,t commands only
		spaceme = sedcmds['file']+sedcmds['jump']
		spaceme = string.replace(spaceme,':','') # : label (no space!)
		if dict['id'] in spaceme: idsep=' '
		cmd = '%s%s%s%s'%(
		      dict['modifier'],
		      dict['id'],
		      idsep,
		      dict['content'])
		if action == 'html':
			if   dict['id'] in sedcmds['text']:
				content_type = 'plaintext'
			elif dict['id'] in 'bt':
				content_type = 'branch'
			elif dict['id'] == ':':
				content_type = 'target'
			else:
				content_type = 'content'

			cmd = '%s%s%s%s'%(
			       paintHtml('modifier'  , dict['modifier']),
			       paintHtml('id'        , dict['id']      ),
			       idsep,
			       paintHtml(content_type, dict['content'] ))
	cmd = string.replace(cmd, linesep, '\n')
	return cmd


#-------------------------------------------------------------------------------
#                    The dump* Functions - They 4mat 4you!
#-------------------------------------------------------------------------------

def dumpKeyValuePair(datalist):
	"Shows field:value command data line by line (lots of lines!)"
	for data in datalist[1:]:                         # skip headers at 0
		if not data['id']: continue                   # blank line
		for key in datalist[0]['fields']:
			if key == 'replace':
				data[key] = string.replace(
				            data[key],
				            linesep,
				            newlineshow)
			print "%10s:%s"%(key,data[key])
		print

# Format: line:ad1:ad1f:ad2:ad2f:mod:cmd:content:delim:patt:rplc:flag:comment
def dumpOneliner(datalist, fancy=0):
	"Shows a command per line, elements separated by : (looooong lines)"
	r = n = ''
	if fancy: r = '\033[7m'; n = '\033[m'
	for data in datalist[1:]:                         # skip headers at 0
		outline = data['linenr']
		if data['id']:
			for key in datalist[0]['fields'][1:]:     # skip linenr
				outline = '%s:%s%s%s'%(outline,r,data[key],n)
		print outline

def dumpCute(datalist):
	"Shows a strange representation of SED commands. Use --dumpcute."
	r = color_REV; n = color_NO
	for data in datalist[1:]:                         # skip headers at 0
		if not data['id']:
			print '%40s'%'[blank]'
		elif data['id'] == '#' :
			print data['comment']
		else:
			idsep=''
			if data['id'] in 'bt': idsep=' '
			cmd = '%s%s%s%s'%(
			      data['modifier'],
			      data['id'],
			      idsep,
			      data['content'])
			if data['delimiter']:
				cmd = '%s%s%s%s%s%s%s'%(cmd,
				    data['delimiter'],data['pattern'],
				    data['delimiter'],data['replace'],
				    data['delimiter'],data['flag'])
			cmd = string.replace(cmd, linesep, n+newlineshow+r)
			print '%s'%'-'*40
			print 'adr: %s%s%s%s  :::  %s%s%s%s'%(
			       r,data['addr1'],data['addr1flag'],n,
			       r,data['addr2'],data['addr2flag'],n)
			print 'cmd: %s%s%s   [%s]'%(r,cmd,n,data['comment'])

# dumpScript: This is a handy function, used by --indent AND --htmlize
# It formats the SED script in a humam-friendly way, with one command
# per line and adding spaces on the right places. If --htmlize, it
# also adds the HTML code to the script.
#
def dumpScript(datalist, indent_prefix):
	"Shows the indented script in plain text or HTML!"
	indfmt = { 'string' : indent_prefix, 'initlevel'  : 0,
	           'addrsep': ',' , 'joinaddrcmd': 0 }
	outlist = []
	adsep = indfmt['addrsep']
	indent = indfmt['initlevel']

	if action == 'html': outlist.append(html_data['header'])

	for data in datalist[1:]:                         # skip headers at 0
		if not data['id']:
			outlist.append('\n')
			continue                                  # blank line
		if data['id'] == '#' :
			indentstr = indfmt['string']*indent
			if action != 'html':
				outlist.append('%s%s\n'%(
				               indentstr,
				               data['comment']))
			else:
				outlist.append('%s%s\n'%(
				               indentstr,
				               paintHtml('comment',
				                         data['comment'])))
		else:
			if data['id'] == '}': indent = indent - 1
			# only indent++ after open {
			indentstr = indfmt['string']*indent
			if data['id'] == '{': indent = indent + 1

			cmd = composeSedCommand(data)
			addr = composeSedAddress(data)

			# saving full line
			comm = ''
			if data['comment']: comm = ';'+data['comment']
			cmd = '%s%s%s'%(indentstr,addr,cmd)
			outlist.append('%-39s%s\n'%(cmd,comm))

	if action == 'html':
		outlist.append(html_data['footer'])

	for line in outlist: print line,                  # print the result


#-------------------------------------------------------------------------------
#                    doDebug - Here is where the fun begins
#-------------------------------------------------------------------------------
#
### doDebug
#
# This function performs the --debug action.
#
# After the SED script was parsed by the parsed (below), this function
# is called with the script data found. It loops, shouts and screems,
# inserting the nice DEBUG lines between the SED script commands.
#
# After all lines are composed, it call the system's SED to run the
# script, and SED will do it's job, but this time showing you all the
# secrets that the PATTERN SPACE and HOLD SPACE buffers holds.
#
def doDebug(datalist):
	outlist = []
	cmdlineopts = 'f'
	t_count = 0
	hideregisters = 0

	if datalist[0].has_key('topopts'):
		cmdlineopts = datalist[0]['topopts']

	# If we have one or more t commands on the script, we need to save
	# the t command status between debug commands. As they perform
	# s/// commands, the t status of the "last substitution" is lost.
	# So, we save the status doing a nice loop trick before *every*
	# command (necessary overhead). This loops uses the :zzsetNNN and
	# zzclrNNN labels, where NNN is the label count.
	# TIP: t status resets: line read, t call
	if datalist[0]['has_t']: t_count = 1

	for i in range(len(datalist)):
		if i == 0: continue                         # skip headers at 0
		data = datalist[i]
		if not data['id']: continue                 # ignore blank line
		if data['id'] == '#': outlist.append('%s\n'%(data['comment']))
		else:
			cmd = composeSedCommand(data)
			addr = composeSedAddress(data)

			cmdshow = string.replace(cmd, '\n',
			                         newlineshow+color_YLW)
			cmdshow = escapeTextCommandsSpecials(addr+cmdshow)
			showsedcmd = string.replace(showcomm, '\a', cmdshow)

			registers = showpatt + showhold
			if hideregisters: registers = ''

			showall = '%s%s'%(registers,showsedcmd)

			# Add the 't status' trick to commands.
			# Exception: read-next-line commands (n,d,q)
			# Exception: no PATT/HOLD registers to show (no s///)
			if t_count and showall:
				if data['id'] not in 'ndq' and registers:
					tmp = string.replace(save_t, '\a',
					                     '%03d'%t_count)
					showall = string.replace(tmp, '#DEBUG#',
					                         showall)
					t_count = t_count + 1

			# null cmd to restore last addr: /addr/y/!/!/
			if data['lastaddr']:
				showall = showall+debug_prefix+\
					data['lastaddr']+nullcomm+'\n'

			# after jump or block commands don't show
			# registers, because they're not affected.
			# exception: after b or t without target
			# (read next line)
			hideregisters = 0
			if data['id'] in sedcmds['jump'] and data['content']:
				hideregisters = 1
			elif data['id'] in sedcmds['block']:
				hideregisters = 1

			outlist.append("%s#%s\n%s\n"%(showall,'-'*50,addr+cmd))

	outlist.append(showpatt + showhold)           # last line status

	# executing sed script
	cmdextra = inputfiles = ''
	if action_modifiers.count('_stdout-only'):
		#cmdextra = "| egrep -v '^PATT|^HOLD|^COMM|\$$|\\$'"  # sed
		cmdextra = "-l 5000 | egrep -v '^PATT|^HOLD|^COMM'"   # gsed
	for file in textfiles: inputfiles = '%s %s'%(inputfiles,file)
	if dump_debug:
		for line in map(lambda x:re.sub('\n$','',x), outlist):
			print line
		print "\n# Debugged SED script generated by %s-%s (%s)"%(
			myname, myversion, myhome)
	else:
		tmpfile = tempfile.mktemp()
		write_file(tmpfile, outlist)
		os.system("%s -%s %s %s %s"%(
		           sedbin, cmdlineopts, tmpfile, inputfiles, cmdextra))
		os.remove(tmpfile)


################################################################################
#                                                                              #
#                               SED Script Parser                              #
#                           -------------------------                          #
#                      Extract Every Info of Every Command                     #
#                                                                              #
################################################################################
#
### Global view of the parser:
#
# - Load the original sed script to a list, then let the file free
# - Scan the list (line by line)
# - As user can do more than one sed command on the same line, we split
#   "possible valid commands" by ; (brute force method)
# - Validate each splitted command
# - If not valid, join next, and try to validate again (loop here)
# - If hit EOL and still not valid, join next line, validate (loop here)
# - Hit EOF, we've got all info at hand
# - Generate a result list with all sed command found and its data, each
#   command having it's own dictionary: {addr1: '', addr2: '', cmd: ''}
# - ZZ is the list
###


incompletecmd = ''
incompleteaddr = ''
incompletecmdline = ''
addr1 = addr2 = ''
lastaddr = ''
lastsubref = ''
has_t = 0
cmdsep = ';'
linesep = '@#linesep#@'
newlineshow = '%s\\N%s'%(color_RED,color_NO)
newlinemark = r']]\([\)'
blanklines= []
ZZ = []
ZZ.append({})  #for header

linenr = 0
cmddict = {}
for line in sedscript:
	linenr = linenr + 1

	if linenr == 1:                            # 1st line #!/... finder
		m= re.match(patt['topopts'], line)
		if m:                                 # we have options!
			ZZ[0]['topopts'] = m.group(1)     # saved on list header
			del m

	if incompletecmdline:
		line = string.join([incompletecmdline, line], linesep)

	if line and line[-1] == '\n': line = line[:-1]    # s/\n$//
	if not string.strip(line):                        # blank line
		blanklines.append(linenr)
		ZZ.append({'linenr': linenr, 'id': ''})
		continue

	if DEBUG: print ; Debug('line:%d: %s'%(linenr,line))

	# bruteforce: split lines in ; char
	# exceptions: comments and a,c,i text
	if string.lstrip(line)[0] == '#':
		linesplit = [string.lstrip(line)]           # comments
	elif string.lstrip(line)[0] in sedcmds['text']:
		linesplit = [line]                          # a, c, i
	else:
		linesplit = string.split(line, cmdsep)      # split lines at ;

	while linesplit:
		possiblecmd = linesplit.pop(0)
		if not incompletecmdline:
			if incompletecmd:
				possiblecmd = string.join(
				              [incompletecmd, possiblecmd],
				              cmdsep)
			if incompleteaddr:
				possiblecmd = string.join(
				              [incompleteaddr, possiblecmd],
				              cmdsep)
		else:
			incompletecmdline = ''

		if not possiblecmd: continue # ; at EOL or useless seq of ;;;;

		Debug('possiblecmd: '+possiblecmd,2)
		possiblecmd = string.lstrip(possiblecmd) # del space at begin
		cmdid = possiblecmd[0]                   # get 1st char(sed cmd)

		if cmdid == '\\' and len(possiblecmd) == 1:  # to get \;addr;
			incompleteaddr = cmdid
			continue


		###----------- Get addresses routine ---------------
		#
		# To handle ranges, match addresses one by one:
		# - Matched addr at ^   ? Get it and set addr1.
		# - Next char is a comma? It's a range. Get & set addr2.
		# - Addresses are cutted from command, continue.
		#
		# We're not using split cause it fails at /bla[,]bla/ address
		#
		while 1:
			if not possiblecmd[0] in sedcmds['addr']: break # NOaddr

			addr = SedAddress(possiblecmd)            # get data

			if addr.isok:
				if not cmddict.has_key('addr1'):
					cmddict['linenr'] = linenr
					cmddict['addr1'] = addr.full
					cmddict['addr1flag'] = addr.flag
					cmddict['addr1html'] = addr.html
					if addr.pattern: lastaddr = addr.full
					else: cmddict['lastaddr'] = lastaddr
				else:
					cmddict['addr2'] = addr.full
					cmddict['addr2flag'] = addr.flag
					cmddict['addr2html'] = addr.html
					if addr.pattern: lastaddr = addr.full
					else: cmddict['lastaddr'] = lastaddr
				rest = addr.rest
			else:
				incompleteaddr = addr.rest
				break                        # join more cmds

			# it's a range!
			if not cmddict.has_key('addr2') and rest[0] == ',':
				# del comma and blanks
				possiblecmd = string.lstrip(rest[1:])
				continue                     # process again
			else:
				incompleteaddr = ''
				possiblecmd = string.lstrip(rest)
				break                        # we're done!

		if incompleteaddr: continue                   # need more cmds!
		for key in cmdfields[:6]:  # filling not set addr fields
			if not cmddict.has_key(key): cmddict[key] = ''

		###-------------------------------------------------
		### from here, address is no more
		###-------------------------------------------------

		if not incompletecmd:
			if not possiblecmd:
				Error('missing command at line %d!'%linenr)
			cmd = SedCommand(possiblecmd)
			if not cmddict['linenr']:
				cmddict['linenr'] = linenr
		else:
			cutme = len(cmd.modifier+cmd.id)
			cmd.rest = possiblecmd
			cmd.junk = possiblecmd[cutme:]
			cmd.doItAll()

		if cmd.isok:
			for key in cmdfields[6:]:       # filling cmd entry data
				cmddict[key] = getattr(cmd, key)

			# saving last address content
			if cmd.pattern:
				lastaddr = cmd.delimiter+\
				           cmd.pattern  +\
				           cmd.delimiter
			elif cmd.delimiter:
				cmddict['lastaddr'] = lastaddr

			if cmd.id == 's':
				lastsubref = len(ZZ)    # saving s/// position
			if cmd.id == 't':               # related s/// reference
				cmddict['extrainfo'] = lastsubref
				has_t = 1

			ZZ.append(cmddict)              # saving full cmd entry
			Debug('FULL entry: %s'%cmddict,3)
			cmddict = {}                    # reset data holder
			# reset incomplete holders
			incompletecmd = incompletecmdline = ''

			if cmd.id   == '{': linesplit.insert(0,cmd.rest)
			if cmd.rest == '}': linesplit.insert(0,cmd.rest)
			# ^---  3{p;d} (gnu)
			del cmd
		else:
			incompletecmd = cmd.rest       # not ok, will join next
			Debug('INCOMPLETE cmd: %s'%incompletecmd)

	if incompletecmd:
		incompletecmdline = incompletecmd

# populating list header
ZZ[0]['blanklines'] = blanklines
ZZ[0]['fields'] = cmdfields
ZZ[0]['has_t'] = has_t

# Now the ZZ list is full.
# It has every info that sedsed can extract from a SED script.
# From now on, all functions and classes will manage this list.
# If you are curious about it, just uncomment the line below and
# prepare yourself for an ASCII nightmare ;)
#print color_YLW + `ZZ` + color_NO ; sys.exit(0)


################################################################################
#                                                                              #
#                               The SED Emulator!                              #
#                           -------------------------                          #
#                       Not 100% done, but already usable                      #
#                                                                              #
################################################################################
#
# The emulator still don't support complex regexes and '$' as line address.
# Use the --emu command line option to run the emulator.
# If you don't have SED on your system, you can use --emu to have a SED-like
# program!
#
# Example:
#    $ echo 'foo bar' | sedsed --emu 's/.*/SED/'
#    SED
#

class emuSed:
#TODO check for syntax errors
#TODO convert regexes
#TODO organize debug msgs
#TODO make all this script a valid/callable python module
	def __init__(self, datalist, textfile, debug=0):
		self.inlist = ['']
		self.outlist = []
		self.cmdlist = []
		self.labels = {}
		self.blocks = {}
		self.addr1 = self.addr2 = ''
		self.linenr = 0
		self.cmdnr = 0
		self.holdspace = ''
		self.line = ''
		self.cmd = ''

		self.f_debug = debug
		self.f_stdin = 0
		self.rewindScript()

		# getting input data location (stdin or file)
		if textfile == '-': self.f_stdin = 1
		else: self.inlist.extend(read_file(textfile))

		# wipe null commands, save labels and block info
		blockopen = []
		for data in datalist[1:]:                # skip headers at 0
			if not data['id'] or data['id'] == '#': continue
			self.cmdlist.append(data)
			cmdpos = len(self.cmdlist)-1
			if   data['id'] == ':':
				self.labels[data['content']] = cmdpos
			elif data['id'] == '{':
				blockopen.append(cmdpos)
			elif data['id'] == '}':
				self.blocks[blockopen.pop()] = cmdpos
		del blockopen

		self.run()

	def rewindScript(self):
		self.EOS = 0     # end of script
		self.EOF = 0     # end of file
		self.cmdnr = -1
		self.f_delme = 0
		self.f_inrange = 0
		self.f_joinme = 0

	def readNextLine(self):
		self.linenr = self.linenr +1
		#TODO $ matches everyline.
		#TODO GNUsed retains stdout until next only if there is a $ addr
		if self.f_stdin:                 # reading STDIN interactively
			inputline = sys.stdin.readline()
			if not inputline: self.EOF = 1 ; return
			self.inlist.append(inputline[:-1])   # del \n$
		if self.linenr > len(self.inlist)-1:     # no more lines!
			self.EOF = 1 ; return
		next = self.inlist[self.linenr]
		if self.f_joinme: self.line = self.line+'\n'+next
		else            : self.line = next
		Debug('line readed:%d:%s'%(self.linenr,`self.line`), 1)

	def _getAddress(self, fulladdr):
		addr = fulladdr                          # number
		if   addr[0] == '/' : addr = addr[1:-1]  # del //
		elif addr[0] == '\\': addr = addr[2:-1]  # del \xx
		return addr

	def _matchAddress(self, addr):
		ok = 0
		if addr[0] in '0123456789':              # 003 is valid
			if self.linenr == int(addr): ok = 1
		elif addr == '$':                        # last line
			if self.linenr == len(self.inlist)-1: ok = 1
		elif re.search(addr,self.line): ok = 1   # pattern
		if ok: Debug('MATCHed addr:%s'%`addr`,2)
		return ok

	def testAddress(self):
		ok = 0 ; cmd = self.cmd ; PS = self.line

		if not cmd['addr1']:
			ok = 1              # no address
			Debug('NO address!', 3)
		else:
			self.addr1 = self._getAddress(cmd['addr1'])
			Debug('addr1: '+self.addr1, 2)

		if cmd['addr2']:                         # range
			self.addr2 = self._getAddress(cmd['addr2'])
			Debug('addr2: '+self.addr2, 2)
			if self.f_inrange: self.f_inrange = 0

		if not ok:
			if self._matchAddress(self.addr1): ok = 1

			if self.addr2:                       # range
				if ok: self.f_inrange = 1        # start range
				elif self._matchAddress(self.addr2):
					ok = 1 ; self.f_inrange = 0  # end range
				elif self.f_inrange: ok = 1      # in range
				Debug('in range: %d'%self.f_inrange, 3)

		Debug('is hotline: %d'%ok, 3)
		Debug('cmd: %s'%cmd['id'], 1)
		return ok

	def _makeRawString(self,str):
		raw = string.replace(str, '\t', '\\t')
		raw = string.replace(raw, '\n', '\\n')
		return raw +'$'

	def applyCmd(self):
		cmd = self.cmd ; PS = self.line ; HS = self.holdspace
		Debug('cmdnr: %d'%self.cmdnr, 3)

		#TODO ! r w //
		if   cmd['id'] == ':': pass
		elif cmd['id'] == '=': print(self.linenr)
		elif cmd['id'] == 'p': print(PS)
		elif cmd['id'] == 'P': print(re.sub('\n.*','', PS))
		elif cmd['id'] == 'q': self.EOF = 1
		elif cmd['id'] == 'h': HS = PS
		elif cmd['id'] == 'H': HS = HS+'\n'+PS
		elif cmd['id'] == 'g': PS = HS
		elif cmd['id'] == 'G': PS = PS+'\n'+HS
		elif cmd['id'] == 'x': PS, HS = HS, PS
		elif cmd['id'] == 'y':
			trtab = string.maketrans(cmd['pattern'], cmd['replace'])
			PS = string.translate(PS, trtab)
		elif cmd['id'] == 'l': print self._makeRawString(PS)
		elif cmd['id'] == 'd':
			self.f_delme = 1 ; self.EOS = 1   # d) forces next cicle
		elif cmd['id'] == 'D':             # D) del till \n, next cicle
			cutted = re.sub('^.*?\n', '', PS) # del till the 1st \n
			if cutted == PS: cutted = ''      # if no \n, del all
			PS = cutted
			self.rewindScript()               # D forces rewind
			if not PS:                    # no PS, start next cicle
				self.f_delme = 1 ; self.EOS = 1
			print '------',PS
		elif cmd['id'] == 'n':             # n) print patt, read line
			print(PS)
			self.readNextLine(); PS = self.line
		elif cmd['id'] == 'N':             # N) join next, read line
			self.f_joinme = 1
			self.readNextLine(); PS = self.line
		elif cmd['id'] in 'aic':           # aic) spill text
			txt = re.sub(r'\\%s'%linesep, '\n', cmd['content'])
			txt = re.sub('^\n', '', txt)     #  delete first escape
			self.f_delme = 1
			if cmd['id'] == 'a': print(PS)   #  line before
			print(txt)                       #  put text
			if cmd['id'] == 'i': print(PS)   #  line after
		elif cmd['id'] in 'bt':            # jump to...
			if not cmd['content']: self.EOS = 1            #...end
			else: self.cmdnr = self.labels[cmd['content']] #...label
		#TODO s///3 ; s//\1/ ; s//&/
		elif cmd['id'] == 's':
			times = 1
			patt = cmd['pattern']
			repl = cmd['replace']
			#TODO v----- test only, make function
			patt = re.sub(r'\\\(','(',patt)
			patt = re.sub(r'\\\)',')',patt)
			repl = re.sub(r'^\\\n','\n',repl) # NL escaped on repl
			if 'g' in cmd['flag']: times = 0           # global
			if 'i' in cmd['flag']: patt = '(?i)'+patt  # ignore case
			new = re.sub(patt, repl, PS, times)
			if 'p' in cmd['flag'] and new != PS: print new
			if 'w' in cmd['flag']:
				text = [new]   # w) open file truncating anyway
				# write patt only if s/// was ok
				if new == PS: text = ''
				write_file(cmd['content'], text)
			PS = new

		if self.f_debug:
			showreg = 1
			fullcmd = "%s%s"%(composeSedAddress(cmd),
			   string.replace(composeSedCommand(cmd), '\n',
			                  newlineshow+color_YLW))
			print commid+color_YLW+fullcmd+color_NO
			if cmd['id'] in ':bt' and cmd['content']: showreg = 0
			if cmd['id'] in '{}': showreg = 0
			if showreg:
				print pattid+self._makeRawString(PS)
				print holdid+self._makeRawString(HS)

		self.line = PS ; self.holdspace = HS # save registers


	def run(self):
		while not self.EOF:
			self.rewindScript()
			self.readNextLine()
			if self.EOF: break

			if self.linenr == 1 and self.f_debug:   # debug info
				print pattid+self._makeRawString(self.line)
				print holdid+self._makeRawString(self.holdspace)

			while not self.EOS:
				if self.cmdnr == -1:  # 1st position
					self.cmdnr = 0
				self.cmd = self.cmdlist[self.cmdnr]
				if self.testAddress():
					self.applyCmd()
					if self.EOS or self.EOF: break
				elif self.cmd['id'] == '{':
					self.cmdnr = self.blocks[self.cmdnr]

				self.cmdnr = self.cmdnr +1 # next command
				if self.cmdnr > len(self.cmdlist)-1: break

			# default print pattern behaviour
			if not self.f_delme: print self.line


#-------------------------------------------------------------------------------
#          Script Already Parsed, Now It's Time To Make Decisions
#-------------------------------------------------------------------------------
#
# This is the crucial point where the program will perform the action
# that you choose on the command line.
#
# The ZZ list is full of data, and all the following functions know
# how to handle it. Maybe we will indent, maybe debug? We'll see.
#

if   action == 'indent'  : dumpScript(ZZ, indent_prefix)
elif action == 'html'    : dumpScript(ZZ, indent_prefix)
elif action == 'debug'   : doDebug(ZZ)
elif action == 'token'   : dumpKeyValuePair(ZZ)
elif action == 'dumpcute': dumpCute(ZZ)
elif action in ['emu', 'emudebug']:
	DEBUG = EMUDEBUG
	if action == 'emudebug':
		dodebug = 1
	else:
		dodebug = 0
	for textfile in textfiles:
		emuSed(ZZ, textfile, dodebug)


#-------------------------------------------------------------------------------
#                               - THE END -
#-------------------------------------------------------------------------------


#TODO commenter
#TODO ignore l command line break?
#TODO accept \n as addr delimiter
#TODO more comments, reformat some long lines or depth indent
#TODO check if there's a SED command
#TODO check if user script is syntax correct (!popen())
#     ^---- how to close stdout on os.system() ?
# vim:ts=8