summaryrefslogtreecommitdiffstats
path: root/Doc/tools
diff options
context:
space:
mode:
Diffstat (limited to 'Doc/tools')
-rw-r--r--Doc/tools/partparse.py3412
1 files changed, 1699 insertions, 1713 deletions
diff --git a/Doc/tools/partparse.py b/Doc/tools/partparse.py
index db53a01..2f072bb 100644
--- a/Doc/tools/partparse.py
+++ b/Doc/tools/partparse.py
@@ -27,61 +27,61 @@ MODE_MATH = 4
MODE_DMATH = 5
MODE_GOBBLEWHITE = 6
-the_modes = MODE_REGULAR, MODE_VERBATIM, MODE_CS_SCAN, MODE_COMMENT, \
- MODE_MATH, MODE_DMATH, MODE_GOBBLEWHITE
+the_modes = (MODE_REGULAR, MODE_VERBATIM, MODE_CS_SCAN, MODE_COMMENT,
+ MODE_MATH, MODE_DMATH, MODE_GOBBLEWHITE)
# Show the neighbourhood of the scanned buffer
def epsilon(buf, where):
- wmt, wpt = where - 10, where + 10
- if wmt < 0:
- wmt = 0
- if wpt > len(buf):
- wpt = len(buf)
- return ' Context ' + `buf[wmt:where]` + '.' + `buf[where:wpt]` + '.'
+ wmt, wpt = where - 10, where + 10
+ if wmt < 0:
+ wmt = 0
+ if wpt > len(buf):
+ wpt = len(buf)
+ return ' Context ' + `buf[wmt:where]` + '.' + `buf[where:wpt]` + '.'
# Should return the line number. never worked
def lin():
- global lineno
- return ' Line ' + `lineno` + '.'
+ global lineno
+ return ' Line ' + `lineno` + '.'
# Displays the recursion level.
def lv(lvl):
- return ' Level ' + `lvl` + '.'
+ return ' Level ' + `lvl` + '.'
# Combine the three previous functions. Used often.
def lle(lvl, buf, where):
- return lv(lvl) + lin() + epsilon(buf, where)
-
-
+ return lv(lvl) + lin() + epsilon(buf, where)
+
+
# This class is only needed for _symbolic_ representation of the parse mode.
class Mode:
- def __init__(self, arg):
- if arg not in the_modes:
- raise ValueError, 'mode not in the_modes'
- self.mode = arg
-
- def __cmp__(self, other):
- if type(self) != type(other):
- other = mode(other)
- return cmp(self.mode, other.mode)
-
- def __repr__(self):
- if self.mode == MODE_REGULAR:
- return 'MODE_REGULAR'
- elif self.mode == MODE_VERBATIM:
- return 'MODE_VERBATIM'
- elif self.mode == MODE_CS_SCAN:
- return 'MODE_CS_SCAN'
- elif self.mode == MODE_COMMENT:
- return 'MODE_COMMENT'
- elif self.mode == MODE_MATH:
- return 'MODE_MATH'
- elif self.mode == MODE_DMATH:
- return 'MODE_DMATH'
- elif self.mode == MODE_GOBBLEWHITE:
- return 'MODE_GOBBLEWHITE'
- else:
- raise ValueError, 'mode not in the_modes'
+ def __init__(self, arg):
+ if arg not in the_modes:
+ raise ValueError, 'mode not in the_modes'
+ self.mode = arg
+
+ def __cmp__(self, other):
+ if type(self) != type(other):
+ other = mode(other)
+ return cmp(self.mode, other.mode)
+
+ def __repr__(self):
+ if self.mode == MODE_REGULAR:
+ return 'MODE_REGULAR'
+ elif self.mode == MODE_VERBATIM:
+ return 'MODE_VERBATIM'
+ elif self.mode == MODE_CS_SCAN:
+ return 'MODE_CS_SCAN'
+ elif self.mode == MODE_COMMENT:
+ return 'MODE_COMMENT'
+ elif self.mode == MODE_MATH:
+ return 'MODE_MATH'
+ elif self.mode == MODE_DMATH:
+ return 'MODE_DMATH'
+ elif self.mode == MODE_GOBBLEWHITE:
+ return 'MODE_GOBBLEWHITE'
+ else:
+ raise ValueError, 'mode not in the_modes'
# just a wrapper around a class initialisation
mode = Mode
@@ -106,88 +106,88 @@ GOBBLEDWHITE = 8 # Gobbled LWSP, after CSNAME
ENDLINE = 9 # END-OF-LINE, data = '\n'
DENDLINE = 10 # DOUBLE EOL, data='\n', indicates \par
ENV = 11 # LaTeX-environment
- # data =(envname,[ch,ch,ch,.])
+ # data =(envname,[ch,ch,ch,.])
CSLINE = 12 # for texi: next chunk will be one group
- # of args. Will be set all on 1 line
+ # of args. Will be set all on 1 line
IGNORE = 13 # IGNORE this data
ENDENV = 14 # TEMP END OF GROUP INDICATOR
IF = 15 # IF-directive
- # data = (flag,negate,[ch, ch, ch,...])
-the_types = PLAIN, GROUP, CSNAME, COMMENT, DMATH, MATH, OTHER, ACTIVE, \
- GOBBLEDWHITE, ENDLINE, DENDLINE, ENV, CSLINE, IGNORE, ENDENV, IF
+ # data = (flag,negate,[ch, ch, ch,...])
+the_types = (PLAIN, GROUP, CSNAME, COMMENT, DMATH, MATH, OTHER, ACTIVE,
+ GOBBLEDWHITE, ENDLINE, DENDLINE, ENV, CSLINE, IGNORE, ENDENV, IF)
# class, just to display symbolic name
class ChunkType:
- def __init__(self, chunk_type):
- if chunk_type not in the_types:
- raise ValueError, 'chunk_type not in the_types'
- self.chunk_type = chunk_type
-
- def __cmp__(self, other):
- if type(self) != type(other):
- other = chunk_type(other)
- return cmp(self.chunk_type, other.chunk_type)
-
- def __repr__(self):
- if self.chunk_type == PLAIN:
- return 'PLAIN'
- elif self.chunk_type == GROUP:
- return 'GROUP'
- elif self.chunk_type == CSNAME:
- return 'CSNAME'
- elif self.chunk_type == COMMENT:
- return 'COMMENT'
- elif self.chunk_type == DMATH:
- return 'DMATH'
- elif self.chunk_type == MATH:
- return 'MATH'
- elif self.chunk_type == OTHER:
- return 'OTHER'
- elif self.chunk_type == ACTIVE:
- return 'ACTIVE'
- elif self.chunk_type == GOBBLEDWHITE:
- return 'GOBBLEDWHITE'
- elif self.chunk_type == DENDLINE:
- return 'DENDLINE'
- elif self.chunk_type == ENDLINE:
- return 'ENDLINE'
- elif self.chunk_type == ENV:
- return 'ENV'
- elif self.chunk_type == CSLINE:
- return 'CSLINE'
- elif self.chunk_type == IGNORE:
- return 'IGNORE'
- elif self.chunk_type == ENDENV:
- return 'ENDENV'
- elif self.chunk_type == IF:
- return 'IF'
- else:
- raise ValueError, 'chunk_type not in the_types'
+ def __init__(self, chunk_type):
+ if chunk_type not in the_types:
+ raise ValueError, 'chunk_type not in the_types'
+ self.chunk_type = chunk_type
+
+ def __cmp__(self, other):
+ if type(self) != type(other):
+ other = chunk_type(other)
+ return cmp(self.chunk_type, other.chunk_type)
+
+ def __repr__(self):
+ if self.chunk_type == PLAIN:
+ return 'PLAIN'
+ elif self.chunk_type == GROUP:
+ return 'GROUP'
+ elif self.chunk_type == CSNAME:
+ return 'CSNAME'
+ elif self.chunk_type == COMMENT:
+ return 'COMMENT'
+ elif self.chunk_type == DMATH:
+ return 'DMATH'
+ elif self.chunk_type == MATH:
+ return 'MATH'
+ elif self.chunk_type == OTHER:
+ return 'OTHER'
+ elif self.chunk_type == ACTIVE:
+ return 'ACTIVE'
+ elif self.chunk_type == GOBBLEDWHITE:
+ return 'GOBBLEDWHITE'
+ elif self.chunk_type == DENDLINE:
+ return 'DENDLINE'
+ elif self.chunk_type == ENDLINE:
+ return 'ENDLINE'
+ elif self.chunk_type == ENV:
+ return 'ENV'
+ elif self.chunk_type == CSLINE:
+ return 'CSLINE'
+ elif self.chunk_type == IGNORE:
+ return 'IGNORE'
+ elif self.chunk_type == ENDENV:
+ return 'ENDENV'
+ elif self.chunk_type == IF:
+ return 'IF'
+ else:
+ raise ValueError, 'chunk_type not in the_types'
# ...and the wrapper
_all_chunk_types = {}
for t in the_types:
- _all_chunk_types[t] = ChunkType(t)
+ _all_chunk_types[t] = ChunkType(t)
def chunk_type(t):
- return _all_chunk_types[t]
+ return _all_chunk_types[t]
# store a type object of the ChunkType-class-instance...
chunk_type_type = type(chunk_type(0))
# this class contains a part of the parsed buffer
class Chunk:
- def __init__(self, chtype, where, data):
- if type(chtype) != chunk_type_type:
- chtype = chunk_type(chtype)
- self.chtype = chtype
- if type(where) != IntType:
- raise TypeError, '\'where\' is not a number'
- self.where = where
- self.data = data
-
- def __repr__(self):
- return 'chunk' + `self.chtype, self.where, self.data`
+ def __init__(self, chtype, where, data):
+ if type(chtype) != chunk_type_type:
+ chtype = chunk_type(chtype)
+ self.chtype = chtype
+ if type(where) != IntType:
+ raise TypeError, "'where' is not a number"
+ self.where = where
+ self.data = data
+
+ def __repr__(self):
+ return 'chunk' + `self.chtype, self.where, self.data`
# and the wrapper
chunk = Chunk
@@ -216,40 +216,40 @@ CC_COMMENT = 14
CC_INVALID = 15
# and the names
-cc_names = [\
- 'CC_ESCAPE', \
- 'CC_LBRACE', \
- 'CC_RBRACE', \
- 'CC_MATHSHIFT', \
- 'CC_ALIGNMENT', \
- 'CC_ENDLINE', \
- 'CC_PARAMETER', \
- 'CC_SUPERSCRIPT', \
- 'CC_SUBSCRIPT', \
- 'CC_IGNORE', \
- 'CC_WHITE', \
- 'CC_LETTER', \
- 'CC_OTHER', \
- 'CC_ACTIVE', \
- 'CC_COMMENT', \
- 'CC_INVALID', \
+cc_names = [
+ 'CC_ESCAPE',
+ 'CC_LBRACE',
+ 'CC_RBRACE',
+ 'CC_MATHSHIFT',
+ 'CC_ALIGNMENT',
+ 'CC_ENDLINE',
+ 'CC_PARAMETER',
+ 'CC_SUPERSCRIPT',
+ 'CC_SUBSCRIPT',
+ 'CC_IGNORE',
+ 'CC_WHITE',
+ 'CC_LETTER',
+ 'CC_OTHER',
+ 'CC_ACTIVE',
+ 'CC_COMMENT',
+ 'CC_INVALID',
]
# Show a list of catcode-name-symbols
def pcl(codelist):
- result = ''
- for i in codelist:
- result = result + cc_names[i] + ', '
- return '[' + result[:-2] + ']'
+ result = ''
+ for i in codelist:
+ result = result + cc_names[i] + ', '
+ return '[' + result[:-2] + ']'
# the name of the catcode (ACTIVE, OTHER, etc.)
def pc(code):
- return cc_names[code]
-
+ return cc_names[code]
+
# Which catcodes make the parser stop parsing regular plaintext
-regular_stopcodes = [CC_ESCAPE, CC_LBRACE, CC_RBRACE, CC_MATHSHIFT, \
- CC_ALIGNMENT, CC_PARAMETER, CC_SUPERSCRIPT, CC_SUBSCRIPT, \
+regular_stopcodes = [CC_ESCAPE, CC_LBRACE, CC_RBRACE, CC_MATHSHIFT,
+ CC_ALIGNMENT, CC_PARAMETER, CC_SUPERSCRIPT, CC_SUBSCRIPT,
CC_IGNORE, CC_ACTIVE, CC_COMMENT, CC_INVALID, CC_ENDLINE]
# same for scanning a control sequence name
@@ -269,37 +269,37 @@ comment_stopcodes = [CC_ENDLINE]
# gather all characters together, specified by a list of catcodes
def code2string(cc, codelist):
- ##print 'code2string: codelist = ' + pcl(codelist),
- result = ''
- for category in codelist:
- if cc[category]:
- result = result + cc[category]
- ##print 'result = ' + `result`
- return result
+ ##print 'code2string: codelist = ' + pcl(codelist),
+ result = ''
+ for category in codelist:
+ if cc[category]:
+ result = result + cc[category]
+ ##print 'result = ' + `result`
+ return result
# automatically generate all characters of catcode other, being the
# complement set in the ASCII range (128 characters)
def make_other_codes(cc):
- otherchars = range(256) # could be made 256, no problem
- for category in all_but_other_codes:
- if cc[category]:
- for c in cc[category]:
- otherchars[ord(c)] = None
- result = ''
- for i in otherchars:
- if i != None:
- result = result + chr(i)
- return result
+ otherchars = range(256) # could be made 256, no problem
+ for category in all_but_other_codes:
+ if cc[category]:
+ for c in cc[category]:
+ otherchars[ord(c)] = None
+ result = ''
+ for i in otherchars:
+ if i != None:
+ result = result + chr(i)
+ return result
# catcode dump (which characters have which catcodes).
def dump_cc(name, cc):
- ##print '\t' + name
- ##print '=' * (8+len(name))
- if len(cc) != 16:
- raise TypeError, 'cc not good cat class'
+ ##print '\t' + name
+ ##print '=' * (8+len(name))
+ if len(cc) != 16:
+ raise TypeError, 'cc not good cat class'
## for i in range(16):
## print pc(i) + '\t' + `cc[i]`
-
+
# In the beginning,....
epoch_cc = [None] * 16
@@ -316,7 +316,7 @@ initex_cc[CC_COMMENT], initex_cc[CC_INVALID] = '%', '\x7F'
#initex_cc[CC_OTHER] = make_other_codes(initex_cc) I don't need them, anyway
##dump_cc('initex_cc', initex_cc)
-
+
# LPLAIN: LaTeX catcode setting (see lplain.tex)
lplain_cc = initex_cc[:]
lplain_cc[CC_LBRACE], lplain_cc[CC_RBRACE] = '{', '}'
@@ -330,7 +330,7 @@ lplain_cc[CC_ACTIVE] = '~\x0C' # '~' and C-l
lplain_cc[CC_OTHER] = make_other_codes(lplain_cc)
##dump_cc('lplain_cc', lplain_cc)
-
+
# Guido's LaTeX environment catcoded '_' as ``other''
# my own purpose catlist
my_cc = lplain_cc[:]
@@ -344,27 +344,27 @@ dump_cc('my_cc', my_cc)
re_meaning = '\\[]^$'
def un_re(str):
- result = ''
- for i in str:
- if i in re_meaning:
- result = result + '\\'
- result = result + i
- return result
-
+ result = ''
+ for i in str:
+ if i in re_meaning:
+ result = result + '\\'
+ result = result + i
+ return result
+
# NOTE the negate ('^') operator in *some* of the regexps below
def make_rc_regular(cc):
- # problems here if '[]' are included!!
- return regex.compile('[' + code2string(cc, regular_stopcodes) + ']')
+ # problems here if '[]' are included!!
+ return regex.compile('[' + code2string(cc, regular_stopcodes) + ']')
def make_rc_cs_scan(cc):
- return regex.compile('[^' + code2string(cc, csname_scancodes) + ']')
+ return regex.compile('[^' + code2string(cc, csname_scancodes) + ']')
def make_rc_comment(cc):
- return regex.compile('[' + code2string(cc, comment_stopcodes) + ']')
+ return regex.compile('[' + code2string(cc, comment_stopcodes) + ']')
def make_rc_endwhite(cc):
- return regex.compile('[^' + code2string(cc, white_scancodes) + ']')
-
+ return regex.compile('[^' + code2string(cc, white_scancodes) + ']')
+
# regular: normal mode:
@@ -386,213 +386,205 @@ rc_endwhite = make_rc_endwhite(my_cc)
# This has been done in order to better check for environment-mismatches
def parseit(buf, *rest):
- global lineno
-
- if len(rest) == 3:
- parsemode, start, lvl = rest
- elif len(rest) == 2:
- parsemode, start, lvl = rest + (0, )
- elif len(rest) == 1:
- parsemode, start, lvl = rest + (0, 0)
- elif len(rest) == 0:
- parsemode, start, lvl = mode(MODE_REGULAR), 0, 0
- else:
- raise TypeError, 'usage: parseit(buf[, parsemode[, start[, level]]])'
- result = []
- end = len(buf)
- if lvl == 0 and parsemode == mode(MODE_REGULAR):
- lineno = 1
- lvl = lvl + 1
-
- ##print 'parseit(' + epsilon(buf, start) + ', ' + `parsemode` + ', ' + `start` + ', ' + `lvl` + ')'
-
- #
- # some of the more regular modes...
- #
-
- if parsemode in (mode(MODE_REGULAR), mode(MODE_DMATH), mode(MODE_MATH)):
- cstate = []
- newpos = start
- curpmode = parsemode
- while 1:
- where = newpos
- #print '\tnew round: ' + epsilon(buf, where)
- if where == end:
- if lvl > 1 or curpmode != mode(MODE_REGULAR):
- # not the way we started...
- raise EOFError, 'premature end of file.' + lle(lvl, buf, where)
- # the real ending of lvl-1 parse
- return end, result
-
- pos = rc_regular.search(buf, where)
-
- if pos < 0:
- pos = end
-
- if pos != where:
- newpos, c = pos, chunk(PLAIN, where, (where, pos))
- result.append(c)
- continue
-
-
- #
- # ok, pos == where and pos != end
- #
- foundchar = buf[where]
- if foundchar in my_cc[CC_LBRACE]:
- # recursive subgroup parse...
- newpos, data = parseit(buf, curpmode, where+1, lvl)
- result.append(chunk(GROUP, where, data))
-
- elif foundchar in my_cc[CC_RBRACE]:
- if lvl <= 1:
- raise error, 'ENDGROUP while in base level.' + lle(lvl, buf, where)
- if lvl == 1 and mode != mode(MODE_REGULAR):
- raise error, 'endgroup while in math mode. +lin() + epsilon(buf, where)'
- return where + 1, result
-
- elif foundchar in my_cc[CC_ESCAPE]:
- #
- # call the routine that actually deals with
- # this problem. If do_ret is None, than
- # return the value of do_ret
- #
- # Note that handle_cs might call this routine
- # recursively again...
- #
- do_ret, newpos = handlecs(buf, where, \
- curpmode, lvl, result, end)
- if do_ret != None:
- return do_ret
-
- elif foundchar in my_cc[CC_COMMENT]:
- newpos, data = parseit(buf, \
- mode(MODE_COMMENT), where+1, lvl)
- result.append(chunk(COMMENT, where, data))
-
- elif foundchar in my_cc[CC_MATHSHIFT]:
- # note that recursive calls to math-mode
- # scanning are called with recursion-level 0
- # again, in order to check for bad mathend
- #
- if where + 1 != end and \
- buf[where + 1] in \
- my_cc[CC_MATHSHIFT]:
- #
- # double mathshift, e.g. '$$'
- #
- if curpmode == mode(MODE_REGULAR):
- newpos, data = parseit(buf, \
- mode(MODE_DMATH), \
- where+2, 0)
- result.append(chunk(DMATH, \
- where, data))
- elif curpmode == mode(MODE_MATH):
- raise error, 'wrong math delimiiter' + lin() + epsilon(buf, where)
- elif lvl != 1:
- raise error, 'bad mathend.' + \
- lle(lvl, buf, where)
- else:
- return where + 2, result
- else:
- #
- # single math shift, e.g. '$'
- #
- if curpmode == mode(MODE_REGULAR):
- newpos, data = parseit(buf, \
- mode(MODE_MATH), \
- where+1, 0)
- result.append(chunk(MATH, \
- where, data))
- elif curpmode == mode(MODE_DMATH):
- raise error, 'wrong math delimiiter' + lin() + epsilon(buf, where)
- elif lvl != 1:
- raise error, 'bad mathend.' + \
- lv(lvl, buf, where)
- else:
- return where + 1, result
-
- elif foundchar in my_cc[CC_IGNORE]:
- print 'warning: ignored char', `foundchar`
- newpos = where + 1
-
- elif foundchar in my_cc[CC_ACTIVE]:
- result.append(chunk(ACTIVE, where, foundchar))
- newpos = where + 1
-
- elif foundchar in my_cc[CC_INVALID]:
- raise error, 'invalid char ' + `foundchar`
- newpos = where + 1
-
- elif foundchar in my_cc[CC_ENDLINE]:
- #
- # after an end of line, eat the rest of
- # whitespace on the beginning of the next line
- # this is what LaTeX more or less does
- #
- # also, try to indicate double newlines (\par)
- #
- lineno = lineno + 1
- savedwhere = where
- newpos, dummy = parseit(buf, mode(MODE_GOBBLEWHITE), where + 1, lvl)
- if newpos != end and buf[newpos] in \
- my_cc[CC_ENDLINE]:
- result.append(chunk(DENDLINE, \
- savedwhere, foundchar))
- else:
- result.append(chunk(ENDLINE, \
- savedwhere, foundchar))
- else:
- result.append(chunk(OTHER, where, foundchar))
- newpos = where + 1
-
- elif parsemode == mode(MODE_CS_SCAN):
+ global lineno
+
+ if len(rest) == 3:
+ parsemode, start, lvl = rest
+ elif len(rest) == 2:
+ parsemode, start, lvl = rest + (0, )
+ elif len(rest) == 1:
+ parsemode, start, lvl = rest + (0, 0)
+ elif len(rest) == 0:
+ parsemode, start, lvl = mode(MODE_REGULAR), 0, 0
+ else:
+ raise TypeError, 'usage: parseit(buf[, parsemode[, start[, level]]])'
+ result = []
+ end = len(buf)
+ if lvl == 0 and parsemode == mode(MODE_REGULAR):
+ lineno = 1
+ lvl = lvl + 1
+
+ ##print 'parseit(' + epsilon(buf, start) + ', ' + `parsemode` + ', ' + `start` + ', ' + `lvl` + ')'
+
+ #
+ # some of the more regular modes...
+ #
+
+ if parsemode in (mode(MODE_REGULAR), mode(MODE_DMATH), mode(MODE_MATH)):
+ cstate = []
+ newpos = start
+ curpmode = parsemode
+ while 1:
+ where = newpos
+ #print '\tnew round: ' + epsilon(buf, where)
+ if where == end:
+ if lvl > 1 or curpmode != mode(MODE_REGULAR):
+ # not the way we started...
+ raise EOFError, 'premature end of file.' + lle(lvl, buf, where)
+ # the real ending of lvl-1 parse
+ return end, result
+
+ pos = rc_regular.search(buf, where)
+
+ if pos < 0:
+ pos = end
+
+ if pos != where:
+ newpos, c = pos, chunk(PLAIN, where, (where, pos))
+ result.append(c)
+ continue
+
+
+ #
+ # ok, pos == where and pos != end
+ #
+ foundchar = buf[where]
+ if foundchar in my_cc[CC_LBRACE]:
+ # recursive subgroup parse...
+ newpos, data = parseit(buf, curpmode, where+1, lvl)
+ result.append(chunk(GROUP, where, data))
+
+ elif foundchar in my_cc[CC_RBRACE]:
+ if lvl <= 1:
+ raise error, 'ENDGROUP while in base level.' + lle(lvl, buf, where)
+ if lvl == 1 and mode != mode(MODE_REGULAR):
+ raise error, 'endgroup while in math mode. +lin() + epsilon(buf, where)'
+ return where + 1, result
+
+ elif foundchar in my_cc[CC_ESCAPE]:
#
- # scan for a control sequence token. `\ape', `\nut' or `\%'
+ # call the routine that actually deals with
+ # this problem. If do_ret is None, than
+ # return the value of do_ret
#
- if start == end:
- raise EOFError, 'can\'t find end of csname'
- pos = rc_cs_scan.search(buf, start)
- if pos < 0:
- pos = end
- if pos == start:
- # first non-letter right where we started the search
- # ---> the control sequence name consists of one single
- # character. Also: don't eat white space...
- if buf[pos] in my_cc[CC_ENDLINE]:
- lineno = lineno + 1
- pos = pos + 1
- return pos, (start, pos)
+ # Note that handle_cs might call this routine
+ # recursively again...
+ #
+ do_ret, newpos = handlecs(buf, where,
+ curpmode, lvl, result, end)
+ if do_ret != None:
+ return do_ret
+
+ elif foundchar in my_cc[CC_COMMENT]:
+ newpos, data = parseit(buf,
+ mode(MODE_COMMENT), where+1, lvl)
+ result.append(chunk(COMMENT, where, data))
+
+ elif foundchar in my_cc[CC_MATHSHIFT]:
+ # note that recursive calls to math-mode
+ # scanning are called with recursion-level 0
+ # again, in order to check for bad mathend
+ #
+ if where + 1 != end and buf[where + 1] in my_cc[CC_MATHSHIFT]:
+ #
+ # double mathshift, e.g. '$$'
+ #
+ if curpmode == mode(MODE_REGULAR):
+ newpos, data = parseit(buf,
+ mode(MODE_DMATH),
+ where+2, 0)
+ result.append(chunk(DMATH,
+ where, data))
+ elif curpmode == mode(MODE_MATH):
+ raise error, 'wrong math delimiiter' + lin() + epsilon(buf, where)
+ elif lvl != 1:
+ raise error, 'bad mathend.' + lle(lvl, buf, where)
+ else:
+ return where + 2, result
else:
- spos = pos
- if buf[pos] == '\n':
- lineno = lineno + 1
- spos = pos + 1
- pos2, dummy = parseit(buf, \
- mode(MODE_GOBBLEWHITE), spos, lvl)
- return pos2, (start, pos)
-
- elif parsemode == mode(MODE_GOBBLEWHITE):
- if start == end:
- return start, ''
- pos = rc_endwhite.search(buf, start)
- if pos < 0:
- pos = start
- return pos, (start, pos)
+ #
+ # single math shift, e.g. '$'
+ #
+ if curpmode == mode(MODE_REGULAR):
+ newpos, data = parseit(buf,
+ mode(MODE_MATH),
+ where+1, 0)
+ result.append(chunk(MATH,
+ where, data))
+ elif curpmode == mode(MODE_DMATH):
+ raise error, 'wrong math delimiiter' + lin() + epsilon(buf, where)
+ elif lvl != 1:
+ raise error, 'bad mathend.' + lv(lvl, buf, where)
+ else:
+ return where + 1, result
+
+ elif foundchar in my_cc[CC_IGNORE]:
+ print 'warning: ignored char', `foundchar`
+ newpos = where + 1
+
+ elif foundchar in my_cc[CC_ACTIVE]:
+ result.append(chunk(ACTIVE, where, foundchar))
+ newpos = where + 1
+
+ elif foundchar in my_cc[CC_INVALID]:
+ raise error, 'invalid char ' + `foundchar`
+ newpos = where + 1
+
+ elif foundchar in my_cc[CC_ENDLINE]:
+ #
+ # after an end of line, eat the rest of
+ # whitespace on the beginning of the next line
+ # this is what LaTeX more or less does
+ #
+ # also, try to indicate double newlines (\par)
+ #
+ lineno = lineno + 1
+ savedwhere = where
+ newpos, dummy = parseit(buf, mode(MODE_GOBBLEWHITE), where + 1, lvl)
+ if newpos != end and buf[newpos] in my_cc[CC_ENDLINE]:
+ result.append(chunk(DENDLINE, savedwhere, foundchar))
+ else:
+ result.append(chunk(ENDLINE, savedwhere, foundchar))
+ else:
+ result.append(chunk(OTHER, where, foundchar))
+ newpos = where + 1
- elif parsemode == mode(MODE_COMMENT):
- pos = rc_comment.search(buf, start)
+ elif parsemode == mode(MODE_CS_SCAN):
+ #
+ # scan for a control sequence token. `\ape', `\nut' or `\%'
+ #
+ if start == end:
+ raise EOFError, 'can\'t find end of csname'
+ pos = rc_cs_scan.search(buf, start)
+ if pos < 0:
+ pos = end
+ if pos == start:
+ # first non-letter right where we started the search
+ # ---> the control sequence name consists of one single
+ # character. Also: don't eat white space...
+ if buf[pos] in my_cc[CC_ENDLINE]:
lineno = lineno + 1
- if pos < 0:
- print 'no newline perhaps?'
- raise EOFError, 'can\'t find end of comment'
- pos = pos + 1
- pos2, dummy = parseit(buf, mode(MODE_GOBBLEWHITE), pos, lvl)
- return pos2, (start, pos)
+ pos = pos + 1
+ return pos, (start, pos)
+ else:
+ spos = pos
+ if buf[pos] == '\n':
+ lineno = lineno + 1
+ spos = pos + 1
+ pos2, dummy = parseit(buf, mode(MODE_GOBBLEWHITE), spos, lvl)
+ return pos2, (start, pos)
+ elif parsemode == mode(MODE_GOBBLEWHITE):
+ if start == end:
+ return start, ''
+ pos = rc_endwhite.search(buf, start)
+ if pos < 0:
+ pos = start
+ return pos, (start, pos)
+
+ elif parsemode == mode(MODE_COMMENT):
+ pos = rc_comment.search(buf, start)
+ lineno = lineno + 1
+ if pos < 0:
+ print 'no newline perhaps?'
+ raise EOFError, 'can\'t find end of comment'
+ pos = pos + 1
+ pos2, dummy = parseit(buf, mode(MODE_GOBBLEWHITE), pos, lvl)
+ return pos2, (start, pos)
- else:
- raise error, 'Unknown mode (' + `parsemode` + ')'
+
+ else:
+ raise error, 'Unknown mode (' + `parsemode` + ')'
#moreresult = cswitch(buf[x1:x2], buf, newpos, parsemode, lvl)
@@ -613,182 +605,182 @@ re_endverb = regex.compile(un_re(endverbstr))
# return with the data in return_data
#
def handlecs(buf, where, curpmode, lvl, result, end):
- global lineno
-
- # get the control sequence name...
- newpos, data = parseit(buf, mode(MODE_CS_SCAN), where+1, lvl)
- saveddata = data
-
- if s(buf, data) in ('begin', 'end'):
- # skip the expected '{' and get the LaTeX-envname '}'
- newpos, data = parseit(buf, mode(MODE_REGULAR), newpos+1, lvl)
- if len(data) != 1:
- raise error, 'expected 1 chunk of data.' + \
- lle(lvl, buf, where)
-
- # yucky, we've got an environment
- envname = s(buf, data[0].data)
- ##print 'FOUND ' + s(buf, saveddata) + '. Name ' + `envname` + '.' + lv(lvl)
- if s(buf, saveddata) == 'begin' and envname == 'verbatim':
- # verbatim deserves special treatment
- pos = re_endverb.search(buf, newpos)
- if pos < 0:
- raise error, `endverbstr` + ' not found.' + lle(lvl, buf, where)
- result.append(chunk(ENV, where, (envname, [chunk(PLAIN, newpos, (newpos, pos))])))
- newpos = pos + len(endverbstr)
-
- elif s(buf, saveddata) == 'begin':
- # start parsing recursively... If that parse returns
- # from an '\end{...}', then should the last item of
- # the returned data be a string containing the ended
- # environment
- newpos, data = parseit(buf, curpmode, newpos, lvl)
- if not data or type(data[-1]) is not StringType:
- raise error, 'missing \'end\'' + lle(lvl, buf, where) + epsilon(buf, newpos)
- retenv = data[-1]
- del data[-1]
- if retenv != envname:
- #[`retenv`, `envname`]
- raise error, 'environments do not match.' + \
- lle(lvl, buf, where) + \
- epsilon(buf, newpos)
- result.append(chunk(ENV, where, (retenv, data)))
- else:
- # 'end'... append the environment name, as just
- # pointed out, and order parsit to return...
- result.append(envname)
- ##print 'POINT of return: ' + epsilon(buf, newpos)
- # the tuple will be returned by parseit
- return (newpos, result), newpos
-
- # end of \begin ... \end handling
-
- elif s(buf, data)[0:2] == 'if':
- # another scary monster: the 'if' directive
- flag = s(buf, data)[2:]
-
- # recursively call parseit, just like environment above..
- # the last item of data should contain the if-termination
- # e.g., 'else' of 'fi'
- newpos, data = parseit(buf, curpmode, newpos, lvl)
- if not data or data[-1] not in ('else', 'fi'):
- raise error, 'wrong if... termination' + \
- lle(lvl, buf, where) + epsilon(buf, newpos)
-
- ifterm = data[-1]
- del data[-1]
- # 0 means dont_negate flag
- result.append(chunk(IF, where, (flag, 0, data)))
- if ifterm == 'else':
- # do the whole thing again, there is only one way
- # to end this one, by 'fi'
- newpos, data = parseit(buf, curpmode, newpos, lvl)
- if not data or data[-1] not in ('fi', ):
- raise error, 'wrong if...else... termination' \
- + lle(lvl, buf, where) \
- + epsilon(buf, newpos)
-
- ifterm = data[-1]
- del data[-1]
- result.append(chunk(IF, where, (flag, 1, data)))
- #done implicitely: return None, newpos
-
- elif s(buf, data) in ('else', 'fi'):
- result.append(s(buf, data))
- # order calling party to return tuple
- return (newpos, result), newpos
-
- # end of \if, \else, ... \fi handling
-
- elif s(buf, saveddata) == 'verb':
- x2 = saveddata[1]
- result.append(chunk(CSNAME, where, data))
- if x2 == end:
- raise error, 'premature end of command.' + lle(lvl, buf, where)
- delimchar = buf[x2]
- ##print 'VERB: delimchar ' + `delimchar`
- pos = regex.compile(un_re(delimchar)).search(buf, x2 + 1)
- if pos < 0:
- raise error, 'end of \'verb\' argument (' + \
- `delimchar` + ') not found.' + \
- lle(lvl, buf, where)
- result.append(chunk(GROUP, x2, [chunk(PLAIN, x2+1, (x2+1, pos))]))
- newpos = pos + 1
+ global lineno
+
+ # get the control sequence name...
+ newpos, data = parseit(buf, mode(MODE_CS_SCAN), where+1, lvl)
+ saveddata = data
+
+ if s(buf, data) in ('begin', 'end'):
+ # skip the expected '{' and get the LaTeX-envname '}'
+ newpos, data = parseit(buf, mode(MODE_REGULAR), newpos+1, lvl)
+ if len(data) != 1:
+ raise error, 'expected 1 chunk of data.' + \
+ lle(lvl, buf, where)
+
+ # yucky, we've got an environment
+ envname = s(buf, data[0].data)
+ ##print 'FOUND ' + s(buf, saveddata) + '. Name ' + `envname` + '.' + lv(lvl)
+ if s(buf, saveddata) == 'begin' and envname == 'verbatim':
+ # verbatim deserves special treatment
+ pos = re_endverb.search(buf, newpos)
+ if pos < 0:
+ raise error, `endverbstr` + ' not found.' + lle(lvl, buf, where)
+ result.append(chunk(ENV, where, (envname, [chunk(PLAIN, newpos, (newpos, pos))])))
+ newpos = pos + len(endverbstr)
+
+ elif s(buf, saveddata) == 'begin':
+ # start parsing recursively... If that parse returns
+ # from an '\end{...}', then should the last item of
+ # the returned data be a string containing the ended
+ # environment
+ newpos, data = parseit(buf, curpmode, newpos, lvl)
+ if not data or type(data[-1]) is not StringType:
+ raise error, 'missing \'end\'' + lle(lvl, buf, where) + epsilon(buf, newpos)
+ retenv = data[-1]
+ del data[-1]
+ if retenv != envname:
+ #[`retenv`, `envname`]
+ raise error, 'environments do not match.' + \
+ lle(lvl, buf, where) + \
+ epsilon(buf, newpos)
+ result.append(chunk(ENV, where, (retenv, data)))
else:
- result.append(chunk(CSNAME, where, data))
- return None, newpos
+ # 'end'... append the environment name, as just
+ # pointed out, and order parsit to return...
+ result.append(envname)
+ ##print 'POINT of return: ' + epsilon(buf, newpos)
+ # the tuple will be returned by parseit
+ return (newpos, result), newpos
+
+ # end of \begin ... \end handling
+
+ elif s(buf, data)[0:2] == 'if':
+ # another scary monster: the 'if' directive
+ flag = s(buf, data)[2:]
+
+ # recursively call parseit, just like environment above..
+ # the last item of data should contain the if-termination
+ # e.g., 'else' of 'fi'
+ newpos, data = parseit(buf, curpmode, newpos, lvl)
+ if not data or data[-1] not in ('else', 'fi'):
+ raise error, 'wrong if... termination' + \
+ lle(lvl, buf, where) + epsilon(buf, newpos)
+
+ ifterm = data[-1]
+ del data[-1]
+ # 0 means dont_negate flag
+ result.append(chunk(IF, where, (flag, 0, data)))
+ if ifterm == 'else':
+ # do the whole thing again, there is only one way
+ # to end this one, by 'fi'
+ newpos, data = parseit(buf, curpmode, newpos, lvl)
+ if not data or data[-1] not in ('fi', ):
+ raise error, 'wrong if...else... termination' \
+ + lle(lvl, buf, where) \
+ + epsilon(buf, newpos)
+
+ ifterm = data[-1]
+ del data[-1]
+ result.append(chunk(IF, where, (flag, 1, data)))
+ #done implicitely: return None, newpos
+
+ elif s(buf, data) in ('else', 'fi'):
+ result.append(s(buf, data))
+ # order calling party to return tuple
+ return (newpos, result), newpos
+
+ # end of \if, \else, ... \fi handling
+
+ elif s(buf, saveddata) == 'verb':
+ x2 = saveddata[1]
+ result.append(chunk(CSNAME, where, data))
+ if x2 == end:
+ raise error, 'premature end of command.' + lle(lvl, buf, where)
+ delimchar = buf[x2]
+ ##print 'VERB: delimchar ' + `delimchar`
+ pos = regex.compile(un_re(delimchar)).search(buf, x2 + 1)
+ if pos < 0:
+ raise error, 'end of \'verb\' argument (' + \
+ `delimchar` + ') not found.' + \
+ lle(lvl, buf, where)
+ result.append(chunk(GROUP, x2, [chunk(PLAIN, x2+1, (x2+1, pos))]))
+ newpos = pos + 1
+ else:
+ result.append(chunk(CSNAME, where, data))
+ return None, newpos
# this is just a function to get the string value if the possible data-tuple
def s(buf, data):
- if type(data) is StringType:
- return data
- if len(data) != 2 or not (type(data[0]) is type(data[1]) is IntType):
- raise TypeError, 'expected tuple of 2 integers'
- x1, x2 = data
- return buf[x1:x2]
+ if type(data) is StringType:
+ return data
+ if len(data) != 2 or not (type(data[0]) is type(data[1]) is IntType):
+ raise TypeError, 'expected tuple of 2 integers'
+ x1, x2 = data
+ return buf[x1:x2]
##length, data1, i = getnextarg(length, buf, pp, i + 1)
# make a deep-copy of some chunks
def crcopy(r):
- return map(chunkcopy, r)
+ return map(chunkcopy, r)
# copy a chunk, would better be a method of class Chunk...
def chunkcopy(ch):
- if ch.chtype == chunk_type(GROUP):
- return chunk(GROUP, ch.where, map(chunkcopy, ch.data))
- else:
- return chunk(ch.chtype, ch.where, ch.data)
+ if ch.chtype == chunk_type(GROUP):
+ return chunk(GROUP, ch.where, map(chunkcopy, ch.data))
+ else:
+ return chunk(ch.chtype, ch.where, ch.data)
# get next argument for TeX-macro, flatten a group (insert between)
# or return Command Sequence token, or give back one character
def getnextarg(length, buf, pp, item):
- ##wobj = Wobj()
- ##dumpit(buf, wobj.write, pp[item:min(length, item + 5)])
- ##print 'GETNEXTARG, (len, item) =', `length, item` + ' ---> ' + wobj.data + ' <---'
-
- while item < length and pp[item].chtype == chunk_type(ENDLINE):
- del pp[item]
- length = length - 1
- if item >= length:
- raise error, 'no next arg.' + epsilon(buf, pp[-1].where)
- if pp[item].chtype == chunk_type(GROUP):
- newpp = pp[item].data
- del pp[item]
- length = length - 1
- changeit(buf, newpp)
- length = length + len(newpp)
- pp[item:item] = newpp
- item = item + len(newpp)
- if len(newpp) < 10:
- wobj = Wobj()
- dumpit(buf, wobj.write, newpp)
- ##print 'GETNEXTARG: inserted ' + `wobj.data`
- return length, item
- elif pp[item].chtype == chunk_type(PLAIN):
- #grab one char
- print 'WARNING: grabbing one char'
- if len(s(buf, pp[item].data)) > 1:
- pp.insert(item, chunk(PLAIN, pp[item].where, s(buf, pp[item].data)[:1]))
- item, length = item+1, length+1
- pp[item].data = s(buf, pp[item].data)[1:]
- else:
- item = item+1
- return length, item
+ ##wobj = Wobj()
+ ##dumpit(buf, wobj.write, pp[item:min(length, item + 5)])
+ ##print 'GETNEXTARG, (len, item) =', `length, item` + ' ---> ' + wobj.data + ' <---'
+
+ while item < length and pp[item].chtype == chunk_type(ENDLINE):
+ del pp[item]
+ length = length - 1
+ if item >= length:
+ raise error, 'no next arg.' + epsilon(buf, pp[-1].where)
+ if pp[item].chtype == chunk_type(GROUP):
+ newpp = pp[item].data
+ del pp[item]
+ length = length - 1
+ changeit(buf, newpp)
+ length = length + len(newpp)
+ pp[item:item] = newpp
+ item = item + len(newpp)
+ if len(newpp) < 10:
+ wobj = Wobj()
+ dumpit(buf, wobj.write, newpp)
+ ##print 'GETNEXTARG: inserted ' + `wobj.data`
+ return length, item
+ elif pp[item].chtype == chunk_type(PLAIN):
+ #grab one char
+ print 'WARNING: grabbing one char'
+ if len(s(buf, pp[item].data)) > 1:
+ pp.insert(item, chunk(PLAIN, pp[item].where, s(buf, pp[item].data)[:1]))
+ item, length = item+1, length+1
+ pp[item].data = s(buf, pp[item].data)[1:]
else:
- ch = pp[item]
- try:
- str = `s(buf, ch.data)`
- except TypeError:
- str = `ch.data`
- if len(str) > 400:
- str = str[:400] + '...'
- print 'GETNEXTARG:', ch.chtype, 'not handled, data ' + str
- return length, item
+ item = item+1
+ return length, item
+ else:
+ ch = pp[item]
+ try:
+ str = `s(buf, ch.data)`
+ except TypeError:
+ str = `ch.data`
+ if len(str) > 400:
+ str = str[:400] + '...'
+ print 'GETNEXTARG:', ch.chtype, 'not handled, data ' + str
+ return length, item
# this one is needed to find the end of LaTeX's optional argument, like
@@ -798,52 +790,52 @@ re_endopt = regex.compile(']')
# get a LaTeX-optional argument, you know, the square braces '[' and ']'
def getoptarg(length, buf, pp, item):
- wobj = Wobj()
- dumpit(buf, wobj.write, pp[item:min(length, item + 5)])
- ##print 'GETOPTARG, (len, item) =', `length, item` + ' ---> ' + wobj.data + ' <---'
+ wobj = Wobj()
+ dumpit(buf, wobj.write, pp[item:min(length, item + 5)])
+ ##print 'GETOPTARG, (len, item) =', `length, item` + ' ---> ' + wobj.data + ' <---'
+
+ if item >= length or \
+ pp[item].chtype != chunk_type(PLAIN) or \
+ s(buf, pp[item].data)[0] != '[':
+ return length, item
+
+ pp[item].data = s(buf, pp[item].data)[1:]
+ if len(pp[item].data) == 0:
+ del pp[item]
+ length = length-1
+
+ while 1:
+ if item == length:
+ raise error, 'No end of optional arg found'
+ if pp[item].chtype == chunk_type(PLAIN):
+ text = s(buf, pp[item].data)
+ pos = re_endopt.search(text)
+ if pos >= 0:
+ pp[item].data = text[:pos]
+ if pos == 0:
+ del pp[item]
+ length = length-1
+ else:
+ item=item+1
+ text = text[pos+1:]
- if item >= length or \
- pp[item].chtype != chunk_type(PLAIN) or \
- s(buf, pp[item].data)[0] != '[':
- return length, item
+ while text and text[0] in ' \t':
+ text = text[1:]
- pp[item].data = s(buf, pp[item].data)[1:]
- if len(pp[item].data) == 0:
- del pp[item]
- length = length-1
+ if text:
+ pp.insert(item, chunk(PLAIN, 0, text))
+ length = length + 1
+ return length, item
- while 1:
- if item == length:
- raise error, 'No end of optional arg found'
- if pp[item].chtype == chunk_type(PLAIN):
- text = s(buf, pp[item].data)
- pos = re_endopt.search(text)
- if pos >= 0:
- pp[item].data = text[:pos]
- if pos == 0:
- del pp[item]
- length = length-1
- else:
- item=item+1
- text = text[pos+1:]
-
- while text and text[0] in ' \t':
- text = text[1:]
-
- if text:
- pp.insert(item, chunk(PLAIN, 0, text))
- length = length + 1
- return length, item
-
- item = item+1
+ item = item+1
# Wobj just add write-requests to the ``data'' attribute
class Wobj:
- data = ''
+ data = ''
- def write(self, data):
- self.data = self.data + data
+ def write(self, data):
+ self.data = self.data + data
# ignore these commands
ignoredcommands = ('bcode', 'ecode')
@@ -855,7 +847,7 @@ themselves = ('{', '}', '.', '@', ' ', '\n') + wordsselves
inargsselves = (',', '[', ']', '(', ')')
# this is how *I* would show the difference between emph and strong
# code 1 means: fold to uppercase
-markcmds = {'code': ('', ''), 'var': 1, 'emph': ('_', '_'), \
+markcmds = {'code': ('', ''), 'var': 1, 'emph': ('_', '_'),
'strong': ('*', '*')}
# recognise patter {\FONTCHANGE-CMD TEXT} to \MAPPED-FC-CMD{TEXT}
@@ -868,95 +860,95 @@ for_texi = ('emph', 'var', 'strong', 'code', 'kbd', 'key', 'dfn', 'samp',
# try to remove macros and return flat text
def flattext(buf, pp):
- pp = crcopy(pp)
- ##print '---> FLATTEXT ' + `pp`
- wobj = Wobj()
-
- i, length = 0, len(pp)
- while 1:
- if len(pp) != length:
- raise 'FATAL', 'inconsistent length'
- if i >= length:
- break
- ch = pp[i]
- i = i+1
- if ch.chtype == chunk_type(PLAIN):
- pass
- elif ch.chtype == chunk_type(CSNAME):
- if s(buf, ch.data) in themselves or hist.inargs and s(buf, ch.data) in inargsselves:
- ch.chtype = chunk_type(PLAIN)
- elif s(buf, ch.data) == 'e':
- ch.chtype = chunk_type(PLAIN)
- ch.data = '\\'
- elif len(s(buf, ch.data)) == 1 \
- and s(buf, ch.data) in onlylatexspecial:
- ch.chtype = chunk_type(PLAIN)
- # if it is followed by an empty group,
- # remove that group, it was needed for
- # a true space
- if i < length \
- and pp[i].chtype==chunk_type(GROUP) \
- and len(pp[i].data) == 0:
- del pp[i]
- length = length-1
-
- elif s(buf, ch.data) in markcmds.keys():
- length, newi = getnextarg(length, buf, pp, i)
- str = flattext(buf, pp[i:newi])
- del pp[i:newi]
- length = length - (newi - i)
- ch.chtype = chunk_type(PLAIN)
- markcmd = s(buf, ch.data)
- x = markcmds[markcmd]
- if type(x) == TupleType:
- pre, after = x
- str = pre+str+after
- elif x == 1:
- str = string.upper(str)
- else:
- raise 'FATAL', 'corrupt markcmds'
- ch.data = str
- else:
- if s(buf, ch.data) not in ignoredcommands:
- print 'WARNING: deleting command ' + `s(buf, ch.data)`
- print 'PP' + `pp[i-1]`
- del pp[i-1]
- i, length = i-1, length-1
- elif ch.chtype == chunk_type(GROUP):
- length, newi = getnextarg(length, buf, pp, i-1)
- i = i-1
+ pp = crcopy(pp)
+ ##print '---> FLATTEXT ' + `pp`
+ wobj = Wobj()
+
+ i, length = 0, len(pp)
+ while 1:
+ if len(pp) != length:
+ raise 'FATAL', 'inconsistent length'
+ if i >= length:
+ break
+ ch = pp[i]
+ i = i+1
+ if ch.chtype == chunk_type(PLAIN):
+ pass
+ elif ch.chtype == chunk_type(CSNAME):
+ if s(buf, ch.data) in themselves or hist.inargs and s(buf, ch.data) in inargsselves:
+ ch.chtype = chunk_type(PLAIN)
+ elif s(buf, ch.data) == 'e':
+ ch.chtype = chunk_type(PLAIN)
+ ch.data = '\\'
+ elif len(s(buf, ch.data)) == 1 \
+ and s(buf, ch.data) in onlylatexspecial:
+ ch.chtype = chunk_type(PLAIN)
+ # if it is followed by an empty group,
+ # remove that group, it was needed for
+ # a true space
+ if i < length \
+ and pp[i].chtype==chunk_type(GROUP) \
+ and len(pp[i].data) == 0:
+ del pp[i]
+ length = length-1
+
+ elif s(buf, ch.data) in markcmds.keys():
+ length, newi = getnextarg(length, buf, pp, i)
+ str = flattext(buf, pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi - i)
+ ch.chtype = chunk_type(PLAIN)
+ markcmd = s(buf, ch.data)
+ x = markcmds[markcmd]
+ if type(x) == TupleType:
+ pre, after = x
+ str = pre+str+after
+ elif x == 1:
+ str = string.upper(str)
+ else:
+ raise 'FATAL', 'corrupt markcmds'
+ ch.data = str
+ else:
+ if s(buf, ch.data) not in ignoredcommands:
+ print 'WARNING: deleting command ' + `s(buf, ch.data)`
+ print 'PP' + `pp[i-1]`
+ del pp[i-1]
+ i, length = i-1, length-1
+ elif ch.chtype == chunk_type(GROUP):
+ length, newi = getnextarg(length, buf, pp, i-1)
+ i = i-1
## str = flattext(buf, crcopy(pp[i-1:newi]))
## del pp[i:newi]
## length = length - (newi - i)
## ch.chtype = chunk_type(PLAIN)
## ch.data = str
- else:
- pass
-
- dumpit(buf, wobj.write, pp)
- ##print 'FLATTEXT: RETURNING ' + `wobj.data`
- return wobj.data
+ else:
+ pass
+
+ dumpit(buf, wobj.write, pp)
+ ##print 'FLATTEXT: RETURNING ' + `wobj.data`
+ return wobj.data
# try to generate node names (a bit shorter than the chapter title)
# note that the \nodename command (see elsewhere) overules these efforts
def invent_node_names(text):
- words = string.split(text)
-
- ##print 'WORDS ' + `words`
-
- if len(words) == 2 \
- and string.lower(words[0]) == 'built-in' \
- and string.lower(words[1]) not in ('modules', 'functions'):
- return words[1]
- if len(words) == 3 and string.lower(words[1]) == 'module':
- return words[2]
- if len(words) == 3 and string.lower(words[1]) == 'object':
- return string.join(words[0:2])
- if len(words) > 4 and string.lower(string.join(words[-4:])) == \
- 'methods and data attributes':
- return string.join(words[:2])
- return text
-
+ words = string.split(text)
+
+ ##print 'WORDS ' + `words`
+
+ if len(words) == 2 \
+ and string.lower(words[0]) == 'built-in' \
+ and string.lower(words[1]) not in ('modules', 'functions'):
+ return words[1]
+ if len(words) == 3 and string.lower(words[1]) == 'module':
+ return words[2]
+ if len(words) == 3 and string.lower(words[1]) == 'object':
+ return string.join(words[0:2])
+ if len(words) > 4 and string.lower(string.join(words[-4:])) == \
+ 'methods and data attributes':
+ return string.join(words[:2])
+ return text
+
re_commas_etc = regex.compile('[,`\'@{}]')
re_whitespace = regex.compile('[ \t]*')
@@ -969,27 +961,27 @@ re_whitespace = regex.compile('[ \t]*')
# Sometimes this is too much, maybe consider DENDLINE's as stop
def next_command_p(length, buf, pp, i, cmdname):
- while 1:
- if i >= len(pp):
- break
- ch = pp[i]
- i = i+1
- if ch.chtype == chunk_type(ENDLINE):
- continue
- if ch.chtype == chunk_type(DENDLINE):
- continue
- if ch.chtype == chunk_type(PLAIN):
- if re_whitespace.search(s(buf, ch.data)) == 0 and \
- re_whitespace.match(s(buf, ch.data)) == len(s(buf, ch.data)):
- continue
- return -1
- if ch.chtype == chunk_type(CSNAME):
- if s(buf, ch.data) == cmdname:
- return i # _after_ the command
- return -1
- return -1
-
-
+ while 1:
+ if i >= len(pp):
+ break
+ ch = pp[i]
+ i = i+1
+ if ch.chtype == chunk_type(ENDLINE):
+ continue
+ if ch.chtype == chunk_type(DENDLINE):
+ continue
+ if ch.chtype == chunk_type(PLAIN):
+ if re_whitespace.search(s(buf, ch.data)) == 0 and \
+ re_whitespace.match(s(buf, ch.data)) == len(s(buf, ch.data)):
+ continue
+ return -1
+ if ch.chtype == chunk_type(CSNAME):
+ if s(buf, ch.data) == cmdname:
+ return i # _after_ the command
+ return -1
+ return -1
+
+
# things that are special to LaTeX, but not to texi..
onlylatexspecial = '_~^$#&%'
@@ -999,17 +991,17 @@ hist = Struct()
out = Struct()
def startchange():
- global hist, out
+ global hist, out
- hist.inenv = []
- hist.nodenames = []
- hist.cindex = []
- hist.inargs = 0
- hist.enumeratenesting, hist.itemizenesting = 0, 0
+ hist.inenv = []
+ hist.nodenames = []
+ hist.cindex = []
+ hist.inargs = 0
+ hist.enumeratenesting, hist.itemizenesting = 0, 0
+
+ out.doublenodes = []
+ out.doublecindeces = []
- out.doublenodes = []
- out.doublecindeces = []
-
spacech = [chunk(PLAIN, 0, ' ')]
commach = [chunk(PLAIN, 0, ', ')]
@@ -1051,174 +1043,173 @@ enumeratesymbols = ['1', 'A', 'a']
## or \funcline{NAME}{ARGS}
##
def do_funcdesc(length, buf, pp, i):
- startpoint = i-1
- ch = pp[startpoint]
- wh = ch.where
- length, newi = getnextarg(length, buf, pp, i)
- funcname = chunk(GROUP, wh, pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
- save = hist.inargs
- hist.inargs = 1
- length, newi = getnextarg(length, buf, pp, i)
- hist.inargs = save
- del save
- the_args = [chunk(PLAIN, wh, '()'[0])] + \
- pp[i:newi] + \
- [chunk(PLAIN, wh, '()'[1])]
- del pp[i:newi]
- length = length - (newi-i)
-
- idxsi = hist.indexsubitem # words
- command = ''
- cat_class = ''
- if idxsi and idxsi[-1] in ('method', 'protocol'):
- command = 'defmethod'
- cat_class = string.join(idxsi[:-1])
- elif len(idxsi) == 2 and idxsi[1] == 'function':
- command = 'deffn'
- cat_class = string.join(idxsi)
- elif len(idxsi) == 3 and idxsi[:2] == ['in', 'module']:
- command = 'deffn'
- cat_class = 'function of ' + string.join(idxsi[1:])
-
- if not command:
- raise error, 'don\'t know what to do with indexsubitem ' + `idxsi`
-
- ch.chtype = chunk_type(CSLINE)
- ch.data = command
-
- cslinearg = [chunk(GROUP, wh, [chunk(PLAIN, wh, cat_class)])]
- cslinearg.append(chunk(PLAIN, wh, ' '))
- cslinearg.append(funcname)
- cslinearg.append(chunk(PLAIN, wh, ' '))
- l = len(cslinearg)
- cslinearg[l:l] = the_args
+ startpoint = i-1
+ ch = pp[startpoint]
+ wh = ch.where
+ length, newi = getnextarg(length, buf, pp, i)
+ funcname = chunk(GROUP, wh, pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+ save = hist.inargs
+ hist.inargs = 1
+ length, newi = getnextarg(length, buf, pp, i)
+ hist.inargs = save
+ del save
+ the_args = [chunk(PLAIN, wh, '()'[0])] + pp[i:newi] + \
+ [chunk(PLAIN, wh, '()'[1])]
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ idxsi = hist.indexsubitem # words
+ command = ''
+ cat_class = ''
+ if idxsi and idxsi[-1] in ('method', 'protocol'):
+ command = 'defmethod'
+ cat_class = string.join(idxsi[:-1])
+ elif len(idxsi) == 2 and idxsi[1] == 'function':
+ command = 'deffn'
+ cat_class = string.join(idxsi)
+ elif len(idxsi) == 3 and idxsi[:2] == ['in', 'module']:
+ command = 'deffn'
+ cat_class = 'function of ' + string.join(idxsi[1:])
+
+ if not command:
+ raise error, 'don\'t know what to do with indexsubitem ' + `idxsi`
+
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = command
+
+ cslinearg = [chunk(GROUP, wh, [chunk(PLAIN, wh, cat_class)])]
+ cslinearg.append(chunk(PLAIN, wh, ' '))
+ cslinearg.append(funcname)
+ cslinearg.append(chunk(PLAIN, wh, ' '))
+ l = len(cslinearg)
+ cslinearg[l:l] = the_args
+
+ pp.insert(i, chunk(GROUP, wh, cslinearg))
+ i, length = i+1, length+1
+ hist.command = command
+ return length, i
- pp.insert(i, chunk(GROUP, wh, cslinearg))
- i, length = i+1, length+1
- hist.command = command
- return length, i
-
## this routine will be called on \begin{excdesc}{NAME}
## or \excline{NAME}
##
def do_excdesc(length, buf, pp, i):
- startpoint = i-1
- ch = pp[startpoint]
- wh = ch.where
- length, newi = getnextarg(length, buf, pp, i)
- excname = chunk(GROUP, wh, pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
-
- idxsi = hist.indexsubitem # words
- command = ''
- cat_class = ''
- class_class = ''
- if len(idxsi) == 2 and idxsi[1] == 'exception':
- command = 'defvr'
- cat_class = string.join(idxsi)
- elif len(idxsi) == 3 and idxsi[:2] == ['in', 'module']:
- command = 'defcv'
- cat_class = 'exception'
- class_class = string.join(idxsi[1:])
- elif len(idxsi) == 4 and idxsi[:3] == ['exception', 'in', 'module']:
- command = 'defcv'
- cat_class = 'exception'
- class_class = string.join(idxsi[2:])
-
-
- if not command:
- raise error, 'don\'t know what to do with indexsubitem ' + `idxsi`
-
- ch.chtype = chunk_type(CSLINE)
- ch.data = command
-
- cslinearg = [chunk(GROUP, wh, [chunk(PLAIN, wh, cat_class)])]
+ startpoint = i-1
+ ch = pp[startpoint]
+ wh = ch.where
+ length, newi = getnextarg(length, buf, pp, i)
+ excname = chunk(GROUP, wh, pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ idxsi = hist.indexsubitem # words
+ command = ''
+ cat_class = ''
+ class_class = ''
+ if len(idxsi) == 2 and idxsi[1] == 'exception':
+ command = 'defvr'
+ cat_class = string.join(idxsi)
+ elif len(idxsi) == 3 and idxsi[:2] == ['in', 'module']:
+ command = 'defcv'
+ cat_class = 'exception'
+ class_class = string.join(idxsi[1:])
+ elif len(idxsi) == 4 and idxsi[:3] == ['exception', 'in', 'module']:
+ command = 'defcv'
+ cat_class = 'exception'
+ class_class = string.join(idxsi[2:])
+
+
+ if not command:
+ raise error, 'don\'t know what to do with indexsubitem ' + `idxsi`
+
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = command
+
+ cslinearg = [chunk(GROUP, wh, [chunk(PLAIN, wh, cat_class)])]
+ cslinearg.append(chunk(PLAIN, wh, ' '))
+ if class_class:
+ cslinearg.append(chunk(GROUP, wh, [chunk(PLAIN, wh, class_class)]))
cslinearg.append(chunk(PLAIN, wh, ' '))
- if class_class:
- cslinearg.append(chunk(GROUP, wh, [chunk(PLAIN, wh, class_class)]))
- cslinearg.append(chunk(PLAIN, wh, ' '))
- cslinearg.append(excname)
+ cslinearg.append(excname)
- pp.insert(i, chunk(GROUP, wh, cslinearg))
- i, length = i+1, length+1
- hist.command = command
- return length, i
+ pp.insert(i, chunk(GROUP, wh, cslinearg))
+ i, length = i+1, length+1
+ hist.command = command
+ return length, i
## same for datadesc or dataline...
def do_datadesc(length, buf, pp, i):
- startpoint = i-1
- ch = pp[startpoint]
- wh = ch.where
- length, newi = getnextarg(length, buf, pp, i)
- dataname = chunk(GROUP, wh, pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
-
- idxsi = hist.indexsubitem # words
- command = ''
- cat_class = ''
- class_class = ''
- if idxsi[-1] in ('attribute', 'option'):
- command = 'defcv'
- cat_class = idxsi[-1]
- class_class = string.join(idxsi[:-1])
- elif len(idxsi) == 3 and idxsi[:2] == ['in', 'module']:
- command = 'defcv'
- cat_class = 'data'
- class_class = string.join(idxsi[1:])
- elif len(idxsi) == 4 and idxsi[:3] == ['data', 'in', 'module']:
- command = 'defcv'
- cat_class = 'data'
- class_class = string.join(idxsi[2:])
-
-
- if not command:
- raise error, 'don\'t know what to do with indexsubitem ' + `idxsi`
-
- ch.chtype = chunk_type(CSLINE)
- ch.data = command
-
- cslinearg = [chunk(GROUP, wh, [chunk(PLAIN, wh, cat_class)])]
+ startpoint = i-1
+ ch = pp[startpoint]
+ wh = ch.where
+ length, newi = getnextarg(length, buf, pp, i)
+ dataname = chunk(GROUP, wh, pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ idxsi = hist.indexsubitem # words
+ command = ''
+ cat_class = ''
+ class_class = ''
+ if idxsi[-1] in ('attribute', 'option'):
+ command = 'defcv'
+ cat_class = idxsi[-1]
+ class_class = string.join(idxsi[:-1])
+ elif len(idxsi) == 3 and idxsi[:2] == ['in', 'module']:
+ command = 'defcv'
+ cat_class = 'data'
+ class_class = string.join(idxsi[1:])
+ elif len(idxsi) == 4 and idxsi[:3] == ['data', 'in', 'module']:
+ command = 'defcv'
+ cat_class = 'data'
+ class_class = string.join(idxsi[2:])
+
+
+ if not command:
+ raise error, 'don\'t know what to do with indexsubitem ' + `idxsi`
+
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = command
+
+ cslinearg = [chunk(GROUP, wh, [chunk(PLAIN, wh, cat_class)])]
+ cslinearg.append(chunk(PLAIN, wh, ' '))
+ if class_class:
+ cslinearg.append(chunk(GROUP, wh, [chunk(PLAIN, wh, class_class)]))
cslinearg.append(chunk(PLAIN, wh, ' '))
- if class_class:
- cslinearg.append(chunk(GROUP, wh, [chunk(PLAIN, wh, class_class)]))
- cslinearg.append(chunk(PLAIN, wh, ' '))
- cslinearg.append(dataname)
+ cslinearg.append(dataname)
+
+ pp.insert(i, chunk(GROUP, wh, cslinearg))
+ i, length = i+1, length+1
+ hist.command = command
+ return length, i
- pp.insert(i, chunk(GROUP, wh, cslinearg))
- i, length = i+1, length+1
- hist.command = command
- return length, i
-
# regular indices: those that are not set in tt font by default....
regindices = ('cindex', )
# remove illegal characters from node names
def rm_commas_etc(text):
- result = ''
- changed = 0
- while 1:
- pos = re_commas_etc.search(text)
- if pos >= 0:
- changed = 1
- result = result + text[:pos]
- text = text[pos+1:]
- else:
- result = result + text
- break
- if changed:
- print 'Warning: nodename changhed to ' + `result`
+ result = ''
+ changed = 0
+ while 1:
+ pos = re_commas_etc.search(text)
+ if pos >= 0:
+ changed = 1
+ result = result + text[:pos]
+ text = text[pos+1:]
+ else:
+ result = result + text
+ break
+ if changed:
+ print 'Warning: nodename changhed to ' + `result`
+
+ return result
- return result
-
# boolean flags
flags = {'texi': 1}
-
+
##
## changeit: the actual routine, that changes the contents of the parsed
@@ -1226,932 +1217,927 @@ flags = {'texi': 1}
##
def changeit(buf, pp):
- global onlylatexspecial, hist, out
+ global onlylatexspecial, hist, out
+
+ i, length = 0, len(pp)
+ while 1:
+ # sanity check: length should always equal len(pp)
+ if len(pp) != length:
+ raise 'FATAL', 'inconsistent length. thought ' + `length` + ', but should really be ' + `len(pp)`
+ if i >= length:
+ break
+ ch = pp[i]
+ i = i + 1
+
+ if type(ch) is StringType:
+ #normally, only chunks are present in pp,
+ # but in some cases, some extra info
+ # has been inserted, e.g., the \end{...} clauses
+ raise 'FATAL', 'got string, probably too many ' + `end`
- i, length = 0, len(pp)
- while 1:
- # sanity check: length should always equal len(pp)
- if len(pp) != length:
- raise 'FATAL', 'inconsistent length. thought ' + `length` + ', but should really be ' + `len(pp)`
- if i >= length:
- break
- ch = pp[i]
- i = i + 1
+ if ch.chtype == chunk_type(GROUP):
+ # check for {\em ...} constructs
+ if ch.data and \
+ ch.data[0].chtype == chunk_type(CSNAME) and \
+ s(buf, ch.data[0].data) in fontchanges.keys():
+ k = s(buf, ch.data[0].data)
+ del ch.data[0]
+ pp.insert(i-1, chunk(CSNAME, ch.where, fontchanges[k]))
+ length, i = length+1, i+1
+
+ # recursively parse the contents of the group
+ changeit(buf, ch.data)
+
+ elif ch.chtype == chunk_type(IF):
+ # \if...
+ flag, negate, data = ch.data
+ ##print 'IF: flag, negate = ' + `flag, negate`
+ if flag not in flags.keys():
+ raise error, 'unknown flag ' + `flag`
+
+ value = flags[flag]
+ if negate:
+ value = (not value)
+ del pp[i-1]
+ length, i = length-1, i-1
+ if value:
+ pp[i:i] = data
+ length = length + len(data)
+
+
+ elif ch.chtype == chunk_type(ENV):
+ # \begin{...} ....
+ envname, data = ch.data
+
+ #push this environment name on stack
+ hist.inenv.insert(0, envname)
+
+ #append an endenv chunk after grouped data
+ data.append(chunk(ENDENV, ch.where, envname))
+ ##[`data`]
+
+ #delete this object
+ del pp[i-1]
+ i, length = i-1, length-1
+
+ #insert found data
+ pp[i:i] = data
+ length = length + len(data)
+
+ if envname == 'verbatim':
+ pp[i:i] = [chunk(CSLINE, ch.where, 'example'),
+ chunk(GROUP, ch.where, [])]
+ length, i = length+2, i+2
+
+ elif envname == 'itemize':
+ if hist.itemizenesting > len(itemizesymbols):
+ raise error, 'too deep itemize nesting'
+ ingroupch = [chunk(CSNAME, ch.where,
+ itemizesymbols[hist.itemizenesting])]
+ hist.itemizenesting = hist.itemizenesting + 1
+ pp[i:i] = [chunk(CSLINE, ch.where, 'itemize'),
+ chunk(GROUP, ch.where, ingroupch)]
+ length, i = length+2, i+2
+
+ elif envname == 'enumerate':
+ if hist.enumeratenesting > len(enumeratesymbols):
+ raise error, 'too deep enumerate nesting'
+ ingroupch = [chunk(PLAIN, ch.where,
+ enumeratesymbols[hist.enumeratenesting])]
+ hist.enumeratenesting = hist.enumeratenesting + 1
+ pp[i:i] = [chunk(CSLINE, ch.where, 'enumerate'),
+ chunk(GROUP, ch.where, ingroupch)]
+ length, i = length+2, i+2
+
+ elif envname == 'description':
+ ingroupch = [chunk(CSNAME, ch.where, 'b')]
+ pp[i:i] = [chunk(CSLINE, ch.where, 'table'),
+ chunk(GROUP, ch.where, ingroupch)]
+ length, i = length+2, i+2
+
+ elif (envname == 'tableiii') or (envname == 'tableii'):
+ if (envname == 'tableii'):
+ ltable = 2
+ else:
+ ltable = 3
+ wh = ch.where
+ newcode = []
+
+ #delete tabular format description
+ # e.g., {|l|c|l|}
+ length, newi = getnextarg(length, buf, pp, i)
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ newcode.append(chunk(CSLINE, wh, 'table'))
+ ingroupch = [chunk(CSNAME, wh, 'asis')]
+ newcode.append(chunk(GROUP, wh, ingroupch))
+ newcode.append(chunk(CSLINE, wh, 'item'))
+
+ #get the name of macro for @item
+ # e.g., {code}
+ length, newi = getnextarg(length, buf, pp, i)
+
+ if newi-i != 1:
+ raise error, 'Sorry, expected 1 chunk argument'
+ if pp[i].chtype != chunk_type(PLAIN):
+ raise error, 'Sorry, expected plain text argument'
+ hist.itemargmacro = s(buf, pp[i].data)
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ itembody = []
+ for count in range(ltable):
+ length, newi = getnextarg(length, buf, pp, i)
+ emphgroup = [
+ chunk(CSNAME, wh, 'emph'),
+ chunk(GROUP, 0, pp[i:newi])]
+ del pp[i:newi]
+ length = length - (newi-i)
+ if count == 0:
+ itemarg = emphgroup
+ elif count == ltable-1:
+ itembody = itembody + \
+ [chunk(PLAIN, wh, ' --- ')] + emphgroup
+ else:
+ itembody = emphgroup
+ newcode.append(chunk(GROUP, wh, itemarg))
+ newcode = newcode + itembody + [chunk(DENDLINE, wh, '\n')]
+ pp[i:i] = newcode
+ l = len(newcode)
+ length, i = length+l, i+l
+ del newcode, l
+
+ if length != len(pp):
+ raise 'STILL, SOMETHING wrong', `i`
+
+
+ elif envname == 'funcdesc':
+ pp.insert(i, chunk(PLAIN, ch.where, ''))
+ i, length = i+1, length+1
+ length, i = do_funcdesc(length, buf, pp, i)
+
+ elif envname == 'excdesc':
+ pp.insert(i, chunk(PLAIN, ch.where, ''))
+ i, length = i+1, length+1
+ length, i = do_excdesc(length, buf, pp, i)
+
+ elif envname == 'datadesc':
+ pp.insert(i, chunk(PLAIN, ch.where, ''))
+ i, length = i+1, length+1
+ length, i = do_datadesc(length, buf, pp, i)
+
+ else:
+ print 'WARNING: don\'t know what to do with env ' + `envname`
+
+ elif ch.chtype == chunk_type(ENDENV):
+ envname = ch.data
+ if envname != hist.inenv[0]:
+ raise error, '\'end\' does not match. Name ' + `envname` + ', expected ' + `hist.inenv[0]`
+ del hist.inenv[0]
+ del pp[i-1]
+ i, length = i-1, length-1
+
+ if envname == 'verbatim':
+ pp[i:i] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, 'example')])]
+ i, length = i+2, length+2
+ elif envname == 'itemize':
+ hist.itemizenesting = hist.itemizenesting - 1
+ pp[i:i] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, 'itemize')])]
+ i, length = i+2, length+2
+ elif envname == 'enumerate':
+ hist.enumeratenesting = hist.enumeratenesting-1
+ pp[i:i] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, 'enumerate')])]
+ i, length = i+2, length+2
+ elif envname == 'description':
+ pp[i:i] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, 'table')])]
+ i, length = i+2, length+2
+ elif (envname == 'tableiii') or (envname == 'tableii'):
+ pp[i:i] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, 'table')])]
+ i, length = i+2, length + 2
+ pp.insert(i, chunk(DENDLINE, ch.where, '\n'))
+ i, length = i+1, length+1
+
+ elif envname in ('funcdesc', 'excdesc', 'datadesc'):
+ pp[i:i] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, hist.command)])]
+ i, length = i+2, length+2
+ else:
+ print 'WARNING: ending env ' + `envname` + 'has no actions'
+
+ elif ch.chtype == chunk_type(CSNAME):
+ # control name transformations
+ if s(buf, ch.data) == 'optional':
+ pp[i-1].chtype = chunk_type (PLAIN)
+ pp[i-1].data = '['
+ if (i < length) and \
+ (pp[i].chtype == chunk_type(GROUP)):
+ cp=pp[i].data
+ pp[i:i+1]=cp + [
+ chunk(PLAIN, ch.where, ']')]
+ length = length+len(cp)
+ elif s(buf, ch.data) in ignoredcommands:
+ del pp[i-1]
+ i, length = i-1, length-1
+ elif s(buf, ch.data) == '@' and \
+ i != length and \
+ pp[i].chtype == chunk_type(PLAIN) and \
+ s(buf, pp[i].data)[0] == '.':
+ # \@. --> \. --> @.
+ ch.data = '.'
+ del pp[i]
+ length = length-1
+ elif s(buf, ch.data) == '\\':
+ # \\ --> \* --> @*
+ ch.data = '*'
+ elif len(s(buf, ch.data)) == 1 and \
+ s(buf, ch.data) in onlylatexspecial:
+ ch.chtype = chunk_type(PLAIN)
+ # check if such a command is followed by
+ # an empty group: e.g., `\%{}'. If so, remove
+ # this empty group too
+ if i < length and \
+ pp[i].chtype == chunk_type(GROUP) \
+ and len(pp[i].data) == 0:
+ del pp[i]
+ length = length-1
+
+ elif hist.inargs and s(buf, ch.data) in inargsselves:
+ # This is the special processing of the
+ # arguments of the \begin{funcdesc}... or
+ # \funcline... arguments
+ # \, --> , \[ --> [, \] --> ]
+ ch.chtype = chunk_type(PLAIN)
+
+ elif s(buf, ch.data) == 'renewcommand':
+ # \renewcommand{\indexsubitem}....
+ i, length = i-1, length-1
+ del pp[i]
+ length, newi = getnextarg(length, buf, pp, i)
+ if newi-i == 1 \
+ and i < length \
+ and pp[i].chtype == chunk_type(CSNAME) \
+ and s(buf, pp[i].data) == 'indexsubitem':
+ del pp[i:newi]
+ length = length - (newi-i)
+ length, newi = getnextarg(length, buf, pp, i)
+ text = flattext(buf, pp[i:newi])
+ if text[:1] != '(' or text[-1:] != ')':
+ raise error, 'expected indexsubitme enclosed in braces'
+ words = string.split(text[1:-1])
+ hist.indexsubitem = words
+ del text, words
+ else:
+ print 'WARNING: renewcommand with unsupported arg removed'
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ elif s(buf, ch.data) == 'item':
+ ch.chtype = chunk_type(CSLINE)
+ length, newi = getoptarg(length, buf, pp, i)
+ ingroupch = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ i, length = i+1, length+1
+
+ elif s(buf, ch.data) == 'ttindex':
+ idxsi = hist.indexsubitem
+
+ cat_class = ''
+ if len(idxsi) >= 2 and idxsi[1] in \
+ ('method', 'function', 'protocol'):
+ command = 'findex'
+ elif len(idxsi) >= 2 and idxsi[1] in \
+ ('exception', 'object'):
+ command = 'vindex'
+ else:
+ print 'WARNING: can\'t categorize ' + `idxsi` + ' for \'ttindex\' command'
+ command = 'cindex'
- if type(ch) is StringType:
- #normally, only chunks are present in pp,
- # but in some cases, some extra info
- # has been inserted, e.g., the \end{...} clauses
- raise 'FATAL', 'got string, probably too many ' + `end`
-
- if ch.chtype == chunk_type(GROUP):
- # check for {\em ...} constructs
- if ch.data and \
- ch.data[0].chtype == chunk_type(CSNAME) and \
- s(buf, ch.data[0].data) in fontchanges.keys():
- k = s(buf, ch.data[0].data)
- del ch.data[0]
- pp.insert(i-1, chunk(CSNAME, ch.where, fontchanges[k]))
- length, i = length+1, i+1
-
- # recursively parse the contents of the group
- changeit(buf, ch.data)
-
- elif ch.chtype == chunk_type(IF):
- # \if...
- flag, negate, data = ch.data
- ##print 'IF: flag, negate = ' + `flag, negate`
- if flag not in flags.keys():
- raise error, 'unknown flag ' + `flag`
-
- value = flags[flag]
- if negate:
- value = (not value)
- del pp[i-1]
- length, i = length-1, i-1
- if value:
- pp[i:i] = data
- length = length + len(data)
-
-
- elif ch.chtype == chunk_type(ENV):
- # \begin{...} ....
- envname, data = ch.data
-
- #push this environment name on stack
- hist.inenv.insert(0, envname)
-
- #append an endenv chunk after grouped data
- data.append(chunk(ENDENV, ch.where, envname))
- ##[`data`]
-
- #delete this object
- del pp[i-1]
- i, length = i-1, length-1
-
- #insert found data
- pp[i:i] = data
- length = length + len(data)
-
- if envname == 'verbatim':
- pp[i:i] = [chunk(CSLINE, ch.where, 'example'), \
- chunk(GROUP, ch.where, [])]
- length, i = length+2, i+2
-
- elif envname == 'itemize':
- if hist.itemizenesting > len(itemizesymbols):
- raise error, 'too deep itemize nesting'
- ingroupch = [chunk(CSNAME, ch.where,\
- itemizesymbols[hist.itemizenesting])]
- hist.itemizenesting = hist.itemizenesting + 1
- pp[i:i] = [chunk(CSLINE, ch.where, 'itemize'),\
- chunk(GROUP, ch.where, ingroupch)]
- length, i = length+2, i+2
-
- elif envname == 'enumerate':
- if hist.enumeratenesting > len(enumeratesymbols):
- raise error, 'too deep enumerate nesting'
- ingroupch = [chunk(PLAIN, ch.where,\
- enumeratesymbols[hist.enumeratenesting])]
- hist.enumeratenesting = hist.enumeratenesting + 1
- pp[i:i] = [chunk(CSLINE, ch.where, 'enumerate'),\
- chunk(GROUP, ch.where, ingroupch)]
- length, i = length+2, i+2
-
- elif envname == 'description':
- ingroupch = [chunk(CSNAME, ch.where, 'b')]
- pp[i:i] = [chunk(CSLINE, ch.where, 'table'), \
- chunk(GROUP, ch.where, ingroupch)]
- length, i = length+2, i+2
-
- elif (envname == 'tableiii') or \
- (envname == 'tableii'):
- if (envname == 'tableii'):
- ltable = 2
- else:
- ltable = 3
- wh = ch.where
- newcode = []
-
- #delete tabular format description
- # e.g., {|l|c|l|}
- length, newi = getnextarg(length, buf, pp, i)
- del pp[i:newi]
- length = length - (newi-i)
-
- newcode.append(chunk(CSLINE, wh, 'table'))
- ingroupch = [chunk(CSNAME, wh, 'asis')]
- newcode.append(chunk(GROUP, wh, ingroupch))
- newcode.append(chunk(CSLINE, wh, 'item'))
-
- #get the name of macro for @item
- # e.g., {code}
- length, newi = getnextarg(length, buf, pp, i)
-
- if newi-i != 1:
- raise error, 'Sorry, expected 1 chunk argument'
- if pp[i].chtype != chunk_type(PLAIN):
- raise error, 'Sorry, expected plain text argument'
- hist.itemargmacro = s(buf, pp[i].data)
- del pp[i:newi]
- length = length - (newi-i)
-
- itembody = []
- for count in range(ltable):
- length, newi = getnextarg(length, buf, pp, i)
- emphgroup = [\
- chunk(CSNAME, wh, 'emph'), \
- chunk(GROUP, 0, pp[i:newi])]
- del pp[i:newi]
- length = length - (newi-i)
- if count == 0:
- itemarg = emphgroup
- elif count == ltable-1:
- itembody = itembody + \
- [chunk(PLAIN, wh, ' --- ')] + \
- emphgroup
- else:
- itembody = emphgroup
- newcode.append(chunk(GROUP, wh, itemarg))
- newcode = newcode + itembody + [chunk(DENDLINE, wh, '\n')]
- pp[i:i] = newcode
- l = len(newcode)
- length, i = length+l, i+l
- del newcode, l
-
- if length != len(pp):
- raise 'STILL, SOMETHING wrong', `i`
-
-
- elif envname == 'funcdesc':
- pp.insert(i, chunk(PLAIN, ch.where, ''))
- i, length = i+1, length+1
- length, i = do_funcdesc(length, buf, pp, i)
-
- elif envname == 'excdesc':
- pp.insert(i, chunk(PLAIN, ch.where, ''))
- i, length = i+1, length+1
- length, i = do_excdesc(length, buf, pp, i)
-
- elif envname == 'datadesc':
- pp.insert(i, chunk(PLAIN, ch.where, ''))
- i, length = i+1, length+1
- length, i = do_datadesc(length, buf, pp, i)
-
- else:
- print 'WARNING: don\'t know what to do with env ' + `envname`
-
- elif ch.chtype == chunk_type(ENDENV):
- envname = ch.data
- if envname != hist.inenv[0]:
- raise error, '\'end\' does not match. Name ' + `envname` + ', expected ' + `hist.inenv[0]`
- del hist.inenv[0]
- del pp[i-1]
- i, length = i-1, length-1
-
- if envname == 'verbatim':
- pp[i:i] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, 'example')])]
- i, length = i+2, length+2
- elif envname == 'itemize':
- hist.itemizenesting = hist.itemizenesting - 1
- pp[i:i] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, 'itemize')])]
- i, length = i+2, length+2
- elif envname == 'enumerate':
- hist.enumeratenesting = hist.enumeratenesting-1
- pp[i:i] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, 'enumerate')])]
- i, length = i+2, length+2
- elif envname == 'description':
- pp[i:i] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, 'table')])]
- i, length = i+2, length+2
- elif (envname == 'tableiii') or (envname == 'tableii'):
- pp[i:i] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, 'table')])]
- i, length = i+2, length + 2
- pp.insert(i, chunk(DENDLINE, ch.where, '\n'))
- i, length = i+1, length+1
-
- elif envname in ('funcdesc', 'excdesc', 'datadesc'):
- pp[i:i] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, hist.command)])]
- i, length = i+2, length+2
- else:
- print 'WARNING: ending env ' + `envname` + 'has no actions'
-
- elif ch.chtype == chunk_type(CSNAME):
- # control name transformations
- if s(buf, ch.data) == 'optional':
- pp[i-1].chtype = chunk_type (PLAIN)
- pp[i-1].data = '['
- if (i < length) and \
- (pp[i].chtype == chunk_type(GROUP)):
- cp=pp[i].data
- pp[i:i+1]=cp + [\
- chunk(PLAIN, ch.where, ']')]
- length = length+len(cp)
- elif s(buf, ch.data) in ignoredcommands:
- del pp[i-1]
- i, length = i-1, length-1
- elif s(buf, ch.data) == '@' and \
- i != length and \
- pp[i].chtype == chunk_type(PLAIN) and \
- s(buf, pp[i].data)[0] == '.':
- # \@. --> \. --> @.
- ch.data = '.'
- del pp[i]
- length = length-1
- elif s(buf, ch.data) == '\\':
- # \\ --> \* --> @*
- ch.data = '*'
- elif len(s(buf, ch.data)) == 1 and \
- s(buf, ch.data) in onlylatexspecial:
- ch.chtype = chunk_type(PLAIN)
- # check if such a command is followed by
- # an empty group: e.g., `\%{}'. If so, remove
- # this empty group too
- if i < length and \
- pp[i].chtype == chunk_type(GROUP) \
- and len(pp[i].data) == 0:
- del pp[i]
- length = length-1
-
- elif hist.inargs and s(buf, ch.data) in inargsselves:
- # This is the special processing of the
- # arguments of the \begin{funcdesc}... or
- # \funcline... arguments
- # \, --> , \[ --> [, \] --> ]
- ch.chtype = chunk_type(PLAIN)
-
- elif s(buf, ch.data) == 'renewcommand':
- # \renewcommand{\indexsubitem}....
- i, length = i-1, length-1
- del pp[i]
- length, newi = getnextarg(length, buf, pp, i)
- if newi-i == 1 \
- and i < length \
- and pp[i].chtype == chunk_type(CSNAME) \
- and s(buf, pp[i].data) == 'indexsubitem':
- del pp[i:newi]
- length = length - (newi-i)
- length, newi = getnextarg(length, buf, pp, i)
- text = flattext(buf, pp[i:newi])
- if text[:1] != '(' or text[-1:] != ')':
- raise error, 'expected indexsubitme enclosed in braces'
- words = string.split(text[1:-1])
- hist.indexsubitem = words
- del text, words
- else:
- print 'WARNING: renewcommand with unsupported arg removed'
- del pp[i:newi]
- length = length - (newi-i)
-
- elif s(buf, ch.data) == 'item':
- ch.chtype = chunk_type(CSLINE)
- length, newi = getoptarg(length, buf, pp, i)
- ingroupch = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- i, length = i+1, length+1
-
- elif s(buf, ch.data) == 'ttindex':
- idxsi = hist.indexsubitem
-
- cat_class = ''
- if len(idxsi) >= 2 and idxsi[1] in \
- ('method', 'function', 'protocol'):
- command = 'findex'
- elif len(idxsi) >= 2 and idxsi[1] in \
- ('exception', 'object'):
- command = 'vindex'
- else:
- print 'WARNING: can\'t categorize ' + `idxsi` + ' for \'ttindex\' command'
- command = 'cindex'
-
- if not cat_class:
- cat_class = '('+string.join(idxsi)+')'
-
- ch.chtype = chunk_type(CSLINE)
- ch.data = command
-
- length, newi = getnextarg(length, buf, pp, i)
- arg = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
-
- cat_arg = [chunk(PLAIN, ch.where, cat_class)]
-
- # determine what should be set in roman, and
- # what in tt-font
- if command in regindices:
-
- arg = [chunk(CSNAME, ch.where, 't'), \
- chunk(GROUP, ch.where, arg)]
- else:
- cat_arg = [chunk(CSNAME, ch.where, 'r'), \
- chunk(GROUP, ch.where, cat_arg)]
-
- ingroupch = arg + \
- [chunk(PLAIN, ch.where, ' ')] + \
- cat_arg
-
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- length, i = length+1, i+1
-
-
- elif s(buf, ch.data) == 'ldots':
- # \ldots --> \dots{} --> @dots{}
- ch.data = 'dots'
- if i == length \
- or pp[i].chtype != chunk_type(GROUP) \
- or pp[i].data != []:
- pp.insert(i, chunk(GROUP, ch.where, []))
- i, length = i+1, length+1
- elif s(buf, ch.data) in wordsselves:
- # \UNIX --> UNIX
- ch.chtype = chunk_type(PLAIN)
- if i != length \
- and pp[i].chtype == chunk_type(GROUP) \
- and pp[i].data == []:
- del pp[i]
- length = length-1
- elif s(buf, ch.data) in for_texi:
- pass
-
- elif s(buf, ch.data) == 'e':
- # "\e" --> "\"
- ch.data = '\\'
- ch.chtype = chunk_type(PLAIN)
- elif (s(buf, ch.data) == 'lineiii') or\
- (s(buf, ch.data) == 'lineii'):
- # This is the most tricky one
- # \lineiii{a1}{a2}[{a3}] -->
- # @item @<cts. of itemargmacro>{a1}
- # a2 [ -- a3]
- #
- ##print 'LINEIIIIII!!!!!!!'
+ if not cat_class:
+ cat_class = '('+string.join(idxsi)+')'
+
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = command
+
+ length, newi = getnextarg(length, buf, pp, i)
+ arg = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ cat_arg = [chunk(PLAIN, ch.where, cat_class)]
+
+ # determine what should be set in roman, and
+ # what in tt-font
+ if command in regindices:
+
+ arg = [chunk(CSNAME, ch.where, 't'),
+ chunk(GROUP, ch.where, arg)]
+ else:
+ cat_arg = [chunk(CSNAME, ch.where, 'r'),
+ chunk(GROUP, ch.where, cat_arg)]
+
+ ingroupch = arg + \
+ [chunk(PLAIN, ch.where, ' ')] + \
+ cat_arg
+
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ length, i = length+1, i+1
+
+
+ elif s(buf, ch.data) == 'ldots':
+ # \ldots --> \dots{} --> @dots{}
+ ch.data = 'dots'
+ if i == length \
+ or pp[i].chtype != chunk_type(GROUP) \
+ or pp[i].data != []:
+ pp.insert(i, chunk(GROUP, ch.where, []))
+ i, length = i+1, length+1
+ elif s(buf, ch.data) in wordsselves:
+ # \UNIX --> UNIX
+ ch.chtype = chunk_type(PLAIN)
+ if i != length \
+ and pp[i].chtype == chunk_type(GROUP) \
+ and pp[i].data == []:
+ del pp[i]
+ length = length-1
+ elif s(buf, ch.data) in for_texi:
+ pass
+
+ elif s(buf, ch.data) == 'e':
+ # "\e" --> "\"
+ ch.data = '\\'
+ ch.chtype = chunk_type(PLAIN)
+ elif (s(buf, ch.data) == 'lineiii') or\
+ (s(buf, ch.data) == 'lineii'):
+ # This is the most tricky one
+ # \lineiii{a1}{a2}[{a3}] -->
+ # @item @<cts. of itemargmacro>{a1}
+ # a2 [ -- a3]
+ #
+ ##print 'LINEIIIIII!!!!!!!'
## wobj = Wobj()
## dumpit(buf, wobj.write, pp[i-1:i+5])
## print '--->' + wobj.data + '<----'
- if not hist.inenv:
- raise error, \
- 'no environment for lineiii'
- if (hist.inenv[0] != 'tableiii') and\
- (hist.inenv[0] != 'tableii'):
- raise error, \
- 'wrong command (' + \
- s(buf, ch.data)+ \
- ') in wrong environment (' \
- + `hist.inenv[0]` + ')'
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'item'
- length, newi = getnextarg(length, buf, pp, i)
- ingroupch = [chunk(CSNAME, 0, \
- hist.itemargmacro), \
- chunk(GROUP, 0, pp[i:newi])]
- del pp[i:newi]
- length = length - (newi-i)
+ if not hist.inenv:
+ raise error, 'no environment for lineiii'
+ if (hist.inenv[0] != 'tableiii') and \
+ (hist.inenv[0] != 'tableii'):
+ raise error, \
+ 'wrong command (' + \
+ s(buf, ch.data)+ \
+ ') in wrong environment (' \
+ + `hist.inenv[0]` + ')'
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'item'
+ length, newi = getnextarg(length, buf, pp, i)
+ ingroupch = [chunk(CSNAME, 0,
+ hist.itemargmacro),
+ chunk(GROUP, 0, pp[i:newi])]
+ del pp[i:newi]
+ length = length - (newi-i)
## print 'ITEM ARG: --->',
## wobj = Wobj()
## dumpit(buf, wobj.write, ingroupch)
## print wobj.data, '<---'
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- grouppos = i
- i, length = i+1, length+1
- length, i = getnextarg(length, buf, pp, i)
- length, newi = getnextarg(length, buf, pp, i)
- if newi > i:
- # we have a 3rd arg
- pp.insert(i, chunk(PLAIN, ch.where, ' --- '))
- i = newi + 1
- length = length + 1
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ grouppos = i
+ i, length = i+1, length+1
+ length, i = getnextarg(length, buf, pp, i)
+ length, newi = getnextarg(length, buf, pp, i)
+ if newi > i:
+ # we have a 3rd arg
+ pp.insert(i, chunk(PLAIN, ch.where, ' --- '))
+ i = newi + 1
+ length = length + 1
## pp[grouppos].data = pp[grouppos].data \
## + [chunk(PLAIN, ch.where, ' ')] \
## + pp[i:newi]
## del pp[i:newi]
## length = length - (newi-i)
- if length != len(pp):
- raise 'IN LINEIII IS THE ERR', `i`
-
- elif s(buf, ch.data) in ('chapter', 'section', 'subsection', 'subsubsection'):
- #\xxxsection{A} ---->
- # @node A, , ,
- # @xxxsection A
- ## also: remove commas and quotes
- ch.chtype = chunk_type(CSLINE)
- length, newi = getnextarg(length, buf, pp, i)
- afternodenamecmd = next_command_p(length, buf, pp, newi, 'nodename')
- if afternodenamecmd < 0:
- cp1 = crcopy(pp[i:newi])
- pp[i:newi] = [\
- chunk(GROUP, ch.where, \
- pp[i:newi])]
- length, newi = length - (newi-i) + 1, \
- i+1
- text = flattext(buf, cp1)
- text = invent_node_names(text)
- else:
- length, endarg = getnextarg(length, buf, pp, afternodenamecmd)
- cp1 = crcopy(pp[afternodenamecmd:endarg])
- del pp[newi:endarg]
- length = length - (endarg-newi)
-
- pp[i:newi] = [\
- chunk(GROUP, ch.where, \
- pp[i:newi])]
- length, newi = length - (newi-i) + 1, \
- i + 1
- text = flattext(buf, cp1)
- if text[-1] == '.':
- text = text[:-1]
+ if length != len(pp):
+ raise 'IN LINEIII IS THE ERR', `i`
+
+ elif s(buf, ch.data) in ('chapter', 'section', 'subsection', 'subsubsection'):
+ #\xxxsection{A} ---->
+ # @node A, , ,
+ # @xxxsection A
+ ## also: remove commas and quotes
+ ch.chtype = chunk_type(CSLINE)
+ length, newi = getnextarg(length, buf, pp, i)
+ afternodenamecmd = next_command_p(length, buf, pp, newi, 'nodename')
+ if afternodenamecmd < 0:
+ cp1 = crcopy(pp[i:newi])
+ pp[i:newi] = [
+ chunk(GROUP, ch.where,
+ pp[i:newi])]
+ length, newi = length - (newi-i) + 1, i+1
+ text = flattext(buf, cp1)
+ text = invent_node_names(text)
+ else:
+ length, endarg = getnextarg(length, buf, pp, afternodenamecmd)
+ cp1 = crcopy(pp[afternodenamecmd:endarg])
+ del pp[newi:endarg]
+ length = length - (endarg-newi)
+
+ pp[i:newi] = [
+ chunk(GROUP, ch.where,
+ pp[i:newi])]
+ length, newi = length - (newi-i) + 1, i + 1
+ text = flattext(buf, cp1)
+ if text[-1] == '.':
+ text = text[:-1]
## print 'FLATTEXT:', `text`
- if text in hist.nodenames:
- print 'WARNING: node name ' + `text` + ' already used'
- out.doublenodes.append(text)
- else:
- hist.nodenames.append(text)
- text = rm_commas_etc(text)
- pp[i-1:i-1] = [\
- chunk(CSLINE, ch.where, 'node'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, text+', , ,')\
- ])]
- i, length = newi+2, length+2
-
- elif s(buf,ch.data) == 'funcline':
- # fold it to a very short environment
- pp[i-1:i-1] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, hist.command)])]
- i, length = i+2, length+2
- length, i = do_funcdesc(length, buf, pp, i)
-
- elif s(buf,ch.data) == 'dataline':
- pp[i-1:i-1] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, hist.command)])]
- i, length = i+2, length+2
- length, i = do_datadesc(length, buf, pp, i)
-
- elif s(buf,ch.data) == 'excline':
- pp[i-1:i-1] = [\
- chunk(CSLINE, ch.where, 'end'), \
- chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, hist.command)])]
- i, length = i+2, length+2
- length, i = do_excdesc(length, buf, pp, i)
-
-
- elif s(buf, ch.data) == 'index':
- #\index{A} --->
- # @cindex A
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'cindex'
- length, newi = getnextarg(length, buf, pp, i)
-
- ingroupch = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- length, i = length+1, i+1
-
- elif s(buf, ch.data) == 'bifuncindex':
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'findex'
- length, newi = getnextarg(length, buf, pp, i)
- ingroupch = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
-
- ingroupch.append(chunk(PLAIN, ch.where, ' '))
- ingroupch.append(chunk(CSNAME, ch.where, 'r'))
- ingroupch.append(chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, \
- '(built-in function)')]))
-
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- length, i = length+1, i+1
-
-
- elif s(buf, ch.data) == 'obindex':
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'findex'
- length, newi = getnextarg(length, buf, pp, i)
- ingroupch = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
-
- ingroupch.append(chunk(PLAIN, ch.where, ' '))
- ingroupch.append(chunk(CSNAME, ch.where, 'r'))
- ingroupch.append(chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, \
- '(object)')]))
-
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- length, i = length+1, i+1
-
-
- elif s(buf, ch.data) == 'opindex':
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'findex'
- length, newi = getnextarg(length, buf, pp, i)
- ingroupch = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
-
- ingroupch.append(chunk(PLAIN, ch.where, ' '))
- ingroupch.append(chunk(CSNAME, ch.where, 'r'))
- ingroupch.append(chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, \
- '(operator)')]))
-
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- length, i = length+1, i+1
-
-
- elif s(buf, ch.data) == 'bimodindex':
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'pindex'
- length, newi = getnextarg(length, buf, pp, i)
- ingroupch = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
-
- ingroupch.append(chunk(PLAIN, ch.where, ' '))
- ingroupch.append(chunk(CSNAME, ch.where, 'r'))
- ingroupch.append(chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, \
- '(built-in)')]))
-
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- length, i = length+1, i+1
-
- elif s(buf, ch.data) == 'sectcode':
- ch.data = 'code'
-
-
- elif s(buf, ch.data) == 'stmodindex':
- ch.chtype = chunk_type(CSLINE)
- # use the program index as module index
- ch.data = 'pindex'
- length, newi = getnextarg(length, buf, pp, i)
- ingroupch = pp[i:newi]
- del pp[i:newi]
- length = length - (newi-i)
-
- ingroupch.append(chunk(PLAIN, ch.where, ' '))
- ingroupch.append(chunk(CSNAME, ch.where, 'r'))
- ingroupch.append(chunk(GROUP, ch.where, [\
- chunk(PLAIN, ch.where, \
- '(standard)')]))
-
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- length, i = length+1, i+1
-
-
- elif s(buf, ch.data) == 'stindex':
- # XXX must actually go to newindex st
- wh = ch.where
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'cindex'
- length, newi = getnextarg(length, buf, pp, i)
- ingroupch = [chunk(CSNAME, wh, 'code'), \
- chunk(GROUP, wh, pp[i:newi])]
-
- del pp[i:newi]
- length = length - (newi-i)
-
- t = ingroupch[:]
- t.append(chunk(PLAIN, wh, ' statement'))
-
- pp.insert(i, chunk(GROUP, wh, t))
- i, length = i+1, length+1
-
- pp.insert(i, chunk(CSLINE, wh, 'cindex'))
- i, length = i+1, length+1
-
- t = ingroupch[:]
- t.insert(0, chunk(PLAIN, wh, 'statement, '))
-
- pp.insert(i, chunk(GROUP, wh, t))
- i, length = i+1, length+1
-
-
- elif s(buf, ch.data) == 'indexii':
- #\indexii{A}{B} --->
- # @cindex A B
- # @cindex B, A
- length, newi = getnextarg(length, buf, pp, i)
- cp11 = pp[i:newi]
- cp21 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
- length, newi = getnextarg(length, buf, pp, i)
- cp12 = pp[i:newi]
- cp22 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
-
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'cindex'
- pp.insert(i, chunk(GROUP, ch.where, cp11 + [\
- chunk(PLAIN, ch.where, ' ')] + cp12))
- i, length = i+1, length+1
- pp[i:i] = [chunk(CSLINE, ch.where, 'cindex'), \
- chunk(GROUP, ch.where, cp22 + [\
- chunk(PLAIN, ch.where, ', ')]+ cp21)]
- i, length = i+2, length+2
-
- elif s(buf, ch.data) == 'indexiii':
- length, newi = getnextarg(length, buf, pp, i)
- cp11 = pp[i:newi]
- cp21 = crcopy(pp[i:newi])
- cp31 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
- length, newi = getnextarg(length, buf, pp, i)
- cp12 = pp[i:newi]
- cp22 = crcopy(pp[i:newi])
- cp32 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
- length, newi = getnextarg(length, buf, pp, i)
- cp13 = pp[i:newi]
- cp23 = crcopy(pp[i:newi])
- cp33 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
-
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'cindex'
- pp.insert(i, chunk(GROUP, ch.where, cp11 + [\
- chunk(PLAIN, ch.where, ' ')] + cp12 \
- + [chunk(PLAIN, ch.where, ' ')] \
- + cp13))
- i, length = i+1, length+1
- pp[i:i] = [chunk(CSLINE, ch.where, 'cindex'), \
- chunk(GROUP, ch.where, cp22 + [\
- chunk(PLAIN, ch.where, ' ')]+ cp23\
- + [chunk(PLAIN, ch.where, ', ')] +\
- cp21)]
- i, length = i+2, length+2
- pp[i:i] = [chunk(CSLINE, ch.where, 'cindex'), \
- chunk(GROUP, ch.where, cp33 + [\
- chunk(PLAIN, ch.where, ', ')]+ cp31\
- + [chunk(PLAIN, ch.where, ' ')] +\
- cp32)]
- i, length = i+2, length+2
-
-
- elif s(buf, ch.data) == 'indexiv':
- length, newi = getnextarg(length, buf, pp, i)
- cp11 = pp[i:newi]
- cp21 = crcopy(pp[i:newi])
- cp31 = crcopy(pp[i:newi])
- cp41 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
- length, newi = getnextarg(length, buf, pp, i)
- cp12 = pp[i:newi]
- cp22 = crcopy(pp[i:newi])
- cp32 = crcopy(pp[i:newi])
- cp42 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
- length, newi = getnextarg(length, buf, pp, i)
- cp13 = pp[i:newi]
- cp23 = crcopy(pp[i:newi])
- cp33 = crcopy(pp[i:newi])
- cp43 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
- length, newi = getnextarg(length, buf, pp, i)
- cp14 = pp[i:newi]
- cp24 = crcopy(pp[i:newi])
- cp34 = crcopy(pp[i:newi])
- cp44 = crcopy(pp[i:newi])
- del pp[i:newi]
- length = length - (newi-i)
-
- ch.chtype = chunk_type(CSLINE)
- ch.data = 'cindex'
- ingroupch = cp11 + \
- spacech + cp12 + \
- spacech + cp13 + \
- spacech + cp14
- pp.insert(i, chunk(GROUP, ch.where, ingroupch))
- i, length = i+1, length+1
- ingroupch = cp22 + \
- spacech + cp23 + \
- spacech + cp24 + \
- commach + cp21
- pp[i:i] = cindexch + [\
- chunk(GROUP, ch.where, ingroupch)]
- i, length = i+2, length+2
- ingroupch = cp33 + \
- spacech + cp34 + \
- commach + cp31 + \
- spacech + cp32
- pp[i:i] = cindexch + [\
- chunk(GROUP, ch.where, ingroupch)]
- i, length = i+2, length+2
- ingroupch = cp44 + \
- commach + cp41 + \
- spacech + cp42 + \
- spacech + cp43
- pp[i:i] = cindexch + [\
- chunk(GROUP, ch.where, ingroupch)]
- i, length = i+2, length+2
-
-
-
- else:
- print 'don\'t know what to do with keyword ' + `s(buf, ch.data)`
-
-
-
+ if text in hist.nodenames:
+ print 'WARNING: node name ' + `text` + ' already used'
+ out.doublenodes.append(text)
+ else:
+ hist.nodenames.append(text)
+ text = rm_commas_etc(text)
+ pp[i-1:i-1] = [
+ chunk(CSLINE, ch.where, 'node'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, text+', , ,')
+ ])]
+ i, length = newi+2, length+2
+
+ elif s(buf,ch.data) == 'funcline':
+ # fold it to a very short environment
+ pp[i-1:i-1] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, hist.command)])]
+ i, length = i+2, length+2
+ length, i = do_funcdesc(length, buf, pp, i)
+
+ elif s(buf,ch.data) == 'dataline':
+ pp[i-1:i-1] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, hist.command)])]
+ i, length = i+2, length+2
+ length, i = do_datadesc(length, buf, pp, i)
+
+ elif s(buf,ch.data) == 'excline':
+ pp[i-1:i-1] = [
+ chunk(CSLINE, ch.where, 'end'),
+ chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where, hist.command)])]
+ i, length = i+2, length+2
+ length, i = do_excdesc(length, buf, pp, i)
+
+
+ elif s(buf, ch.data) == 'index':
+ #\index{A} --->
+ # @cindex A
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'cindex'
+ length, newi = getnextarg(length, buf, pp, i)
+
+ ingroupch = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ length, i = length+1, i+1
+
+ elif s(buf, ch.data) == 'bifuncindex':
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'findex'
+ length, newi = getnextarg(length, buf, pp, i)
+ ingroupch = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ingroupch.append(chunk(PLAIN, ch.where, ' '))
+ ingroupch.append(chunk(CSNAME, ch.where, 'r'))
+ ingroupch.append(chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where,
+ '(built-in function)')]))
+
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ length, i = length+1, i+1
+
+
+ elif s(buf, ch.data) == 'obindex':
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'findex'
+ length, newi = getnextarg(length, buf, pp, i)
+ ingroupch = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ingroupch.append(chunk(PLAIN, ch.where, ' '))
+ ingroupch.append(chunk(CSNAME, ch.where, 'r'))
+ ingroupch.append(chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where,
+ '(object)')]))
+
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ length, i = length+1, i+1
+
+
+ elif s(buf, ch.data) == 'opindex':
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'findex'
+ length, newi = getnextarg(length, buf, pp, i)
+ ingroupch = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ingroupch.append(chunk(PLAIN, ch.where, ' '))
+ ingroupch.append(chunk(CSNAME, ch.where, 'r'))
+ ingroupch.append(chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where,
+ '(operator)')]))
+
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ length, i = length+1, i+1
+
+
+ elif s(buf, ch.data) == 'bimodindex':
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'pindex'
+ length, newi = getnextarg(length, buf, pp, i)
+ ingroupch = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ingroupch.append(chunk(PLAIN, ch.where, ' '))
+ ingroupch.append(chunk(CSNAME, ch.where, 'r'))
+ ingroupch.append(chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where,
+ '(built-in)')]))
+
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ length, i = length+1, i+1
+
+ elif s(buf, ch.data) == 'sectcode':
+ ch.data = 'code'
+
+
+ elif s(buf, ch.data) == 'stmodindex':
+ ch.chtype = chunk_type(CSLINE)
+ # use the program index as module index
+ ch.data = 'pindex'
+ length, newi = getnextarg(length, buf, pp, i)
+ ingroupch = pp[i:newi]
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ingroupch.append(chunk(PLAIN, ch.where, ' '))
+ ingroupch.append(chunk(CSNAME, ch.where, 'r'))
+ ingroupch.append(chunk(GROUP, ch.where, [
+ chunk(PLAIN, ch.where,
+ '(standard)')]))
+
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ length, i = length+1, i+1
+
+
+ elif s(buf, ch.data) == 'stindex':
+ # XXX must actually go to newindex st
+ wh = ch.where
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'cindex'
+ length, newi = getnextarg(length, buf, pp, i)
+ ingroupch = [chunk(CSNAME, wh, 'code'),
+ chunk(GROUP, wh, pp[i:newi])]
+
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ t = ingroupch[:]
+ t.append(chunk(PLAIN, wh, ' statement'))
+
+ pp.insert(i, chunk(GROUP, wh, t))
+ i, length = i+1, length+1
+
+ pp.insert(i, chunk(CSLINE, wh, 'cindex'))
+ i, length = i+1, length+1
+
+ t = ingroupch[:]
+ t.insert(0, chunk(PLAIN, wh, 'statement, '))
+
+ pp.insert(i, chunk(GROUP, wh, t))
+ i, length = i+1, length+1
+
+
+ elif s(buf, ch.data) == 'indexii':
+ #\indexii{A}{B} --->
+ # @cindex A B
+ # @cindex B, A
+ length, newi = getnextarg(length, buf, pp, i)
+ cp11 = pp[i:newi]
+ cp21 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+ length, newi = getnextarg(length, buf, pp, i)
+ cp12 = pp[i:newi]
+ cp22 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'cindex'
+ pp.insert(i, chunk(GROUP, ch.where, cp11 + [
+ chunk(PLAIN, ch.where, ' ')] + cp12))
+ i, length = i+1, length+1
+ pp[i:i] = [chunk(CSLINE, ch.where, 'cindex'),
+ chunk(GROUP, ch.where, cp22 + [
+ chunk(PLAIN, ch.where, ', ')]+ cp21)]
+ i, length = i+2, length+2
+
+ elif s(buf, ch.data) == 'indexiii':
+ length, newi = getnextarg(length, buf, pp, i)
+ cp11 = pp[i:newi]
+ cp21 = crcopy(pp[i:newi])
+ cp31 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+ length, newi = getnextarg(length, buf, pp, i)
+ cp12 = pp[i:newi]
+ cp22 = crcopy(pp[i:newi])
+ cp32 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+ length, newi = getnextarg(length, buf, pp, i)
+ cp13 = pp[i:newi]
+ cp23 = crcopy(pp[i:newi])
+ cp33 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'cindex'
+ pp.insert(i, chunk(GROUP, ch.where, cp11 + [
+ chunk(PLAIN, ch.where, ' ')] + cp12
+ + [chunk(PLAIN, ch.where, ' ')]
+ + cp13))
+ i, length = i+1, length+1
+ pp[i:i] = [chunk(CSLINE, ch.where, 'cindex'),
+ chunk(GROUP, ch.where, cp22 + [
+ chunk(PLAIN, ch.where, ' ')]+ cp23
+ + [chunk(PLAIN, ch.where, ', ')] +
+ cp21)]
+ i, length = i+2, length+2
+ pp[i:i] = [chunk(CSLINE, ch.where, 'cindex'),
+ chunk(GROUP, ch.where, cp33 + [
+ chunk(PLAIN, ch.where, ', ')]+ cp31
+ + [chunk(PLAIN, ch.where, ' ')] +
+ cp32)]
+ i, length = i+2, length+2
+
+
+ elif s(buf, ch.data) == 'indexiv':
+ length, newi = getnextarg(length, buf, pp, i)
+ cp11 = pp[i:newi]
+ cp21 = crcopy(pp[i:newi])
+ cp31 = crcopy(pp[i:newi])
+ cp41 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+ length, newi = getnextarg(length, buf, pp, i)
+ cp12 = pp[i:newi]
+ cp22 = crcopy(pp[i:newi])
+ cp32 = crcopy(pp[i:newi])
+ cp42 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+ length, newi = getnextarg(length, buf, pp, i)
+ cp13 = pp[i:newi]
+ cp23 = crcopy(pp[i:newi])
+ cp33 = crcopy(pp[i:newi])
+ cp43 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+ length, newi = getnextarg(length, buf, pp, i)
+ cp14 = pp[i:newi]
+ cp24 = crcopy(pp[i:newi])
+ cp34 = crcopy(pp[i:newi])
+ cp44 = crcopy(pp[i:newi])
+ del pp[i:newi]
+ length = length - (newi-i)
+
+ ch.chtype = chunk_type(CSLINE)
+ ch.data = 'cindex'
+ ingroupch = cp11 + \
+ spacech + cp12 + \
+ spacech + cp13 + \
+ spacech + cp14
+ pp.insert(i, chunk(GROUP, ch.where, ingroupch))
+ i, length = i+1, length+1
+ ingroupch = cp22 + \
+ spacech + cp23 + \
+ spacech + cp24 + \
+ commach + cp21
+ pp[i:i] = cindexch + [
+ chunk(GROUP, ch.where, ingroupch)]
+ i, length = i+2, length+2
+ ingroupch = cp33 + \
+ spacech + cp34 + \
+ commach + cp31 + \
+ spacech + cp32
+ pp[i:i] = cindexch + [
+ chunk(GROUP, ch.where, ingroupch)]
+ i, length = i+2, length+2
+ ingroupch = cp44 + \
+ commach + cp41 + \
+ spacech + cp42 + \
+ spacech + cp43
+ pp[i:i] = cindexch + [
+ chunk(GROUP, ch.where, ingroupch)]
+ i, length = i+2, length+2
+
+
+
+ else:
+ print 'don\'t know what to do with keyword ' + `s(buf, ch.data)`
+
+
+
re_atsign = regex.compile('[@{}]')
re_newline = regex.compile('\n')
def dumpit(buf, wm, pp):
- global out
-
- i, length = 0, len(pp)
+ global out
- addspace = 0
-
- while 1:
- if len(pp) != length:
- raise 'FATAL', 'inconsistent length'
- if i == length:
- break
- ch = pp[i]
- i = i + 1
+ i, length = 0, len(pp)
- if addspace:
- dospace = 1
- addspace = 0
- else:
- dospace = 0
-
- if ch.chtype == chunk_type(CSNAME):
- wm('@' + s(buf, ch.data))
- if s(buf, ch.data) == 'node' and \
- pp[i].chtype == chunk_type(PLAIN) and \
- s(buf, pp[i].data) in out.doublenodes:
- ##XXX doesnt work yet??
- wm(' ZZZ-' + zfill(`i`, 4))
- if s(buf, ch.data)[0] in string.letters:
- addspace = 1
- elif ch.chtype == chunk_type(PLAIN):
- if dospace and s(buf, ch.data) not in (' ', '\t'):
- wm(' ')
- text = s(buf, ch.data)
- while 1:
- pos = re_atsign.search(text)
- if pos < 0:
- break
- wm(text[:pos] + '@' + text[pos])
- text = text[pos+1:]
- wm(text)
- elif ch.chtype == chunk_type(GROUP):
- wm('{')
- dumpit(buf, wm, ch.data)
- wm('}')
- elif ch.chtype == chunk_type(DENDLINE):
- wm('\n\n')
- while i != length and pp[i].chtype in \
- (chunk_type(DENDLINE), chunk_type(ENDLINE)):
- i = i + 1
- elif ch.chtype == chunk_type(OTHER):
- wm(s(buf, ch.data))
- elif ch.chtype == chunk_type(ACTIVE):
- wm(s(buf, ch.data))
- elif ch.chtype == chunk_type(ENDLINE):
- wm('\n')
- elif ch.chtype == chunk_type(CSLINE):
- if i >= 2 and pp[i-2].chtype not in \
- (chunk_type(ENDLINE), chunk_type(DENDLINE)) \
- and (pp[i-2].chtype != chunk_type(PLAIN) \
- or s(buf, pp[i-2].data)[-1] != '\n'):
-
- wm('\n')
- wm('@' + s(buf, ch.data))
- if i == length:
- raise error, 'CSLINE expected another chunk'
- if pp[i].chtype != chunk_type(GROUP):
- raise error, 'CSLINE expected GROUP'
- if type(pp[i].data) != ListType:
- raise error, 'GROUP chould contain []-data'
-
- wobj = Wobj()
- dumpit(buf, wobj.write, pp[i].data)
- i = i + 1
- text = wobj.data
- del wobj
- if text:
- wm(' ')
- while 1:
- pos = re_newline.search(text)
- if pos < 0:
- break
- print 'WARNING: found newline in csline arg'
- wm(text[:pos] + ' ')
- text = text[pos+1:]
- wm(text)
- if i >= length or \
- pp[i].chtype not in (chunk_type(CSLINE), \
- chunk_type(ENDLINE), chunk_type(DENDLINE)) \
- and (pp[i].chtype != chunk_type(PLAIN) \
- or s(buf, pp[i].data)[0] != '\n'):
- wm('\n')
-
- elif ch.chtype == chunk_type(COMMENT):
+ addspace = 0
+
+ while 1:
+ if len(pp) != length:
+ raise 'FATAL', 'inconsistent length'
+ if i == length:
+ break
+ ch = pp[i]
+ i = i + 1
+
+ if addspace:
+ dospace = 1
+ addspace = 0
+ else:
+ dospace = 0
+
+ if ch.chtype == chunk_type(CSNAME):
+ wm('@' + s(buf, ch.data))
+ if s(buf, ch.data) == 'node' and \
+ pp[i].chtype == chunk_type(PLAIN) and \
+ s(buf, pp[i].data) in out.doublenodes:
+ ##XXX doesnt work yet??
+ wm(' ZZZ-' + zfill(`i`, 4))
+ if s(buf, ch.data)[0] in string.letters:
+ addspace = 1
+ elif ch.chtype == chunk_type(PLAIN):
+ if dospace and s(buf, ch.data) not in (' ', '\t'):
+ wm(' ')
+ text = s(buf, ch.data)
+ while 1:
+ pos = re_atsign.search(text)
+ if pos < 0:
+ break
+ wm(text[:pos] + '@' + text[pos])
+ text = text[pos+1:]
+ wm(text)
+ elif ch.chtype == chunk_type(GROUP):
+ wm('{')
+ dumpit(buf, wm, ch.data)
+ wm('}')
+ elif ch.chtype == chunk_type(DENDLINE):
+ wm('\n\n')
+ while i != length and pp[i].chtype in \
+ (chunk_type(DENDLINE), chunk_type(ENDLINE)):
+ i = i + 1
+ elif ch.chtype == chunk_type(OTHER):
+ wm(s(buf, ch.data))
+ elif ch.chtype == chunk_type(ACTIVE):
+ wm(s(buf, ch.data))
+ elif ch.chtype == chunk_type(ENDLINE):
+ wm('\n')
+ elif ch.chtype == chunk_type(CSLINE):
+ if i >= 2 and pp[i-2].chtype not in \
+ (chunk_type(ENDLINE), chunk_type(DENDLINE)) \
+ and (pp[i-2].chtype != chunk_type(PLAIN)
+ or s(buf, pp[i-2].data)[-1] != '\n'):
+
+ wm('\n')
+ wm('@' + s(buf, ch.data))
+ if i == length:
+ raise error, 'CSLINE expected another chunk'
+ if pp[i].chtype != chunk_type(GROUP):
+ raise error, 'CSLINE expected GROUP'
+ if type(pp[i].data) != ListType:
+ raise error, 'GROUP chould contain []-data'
+
+ wobj = Wobj()
+ dumpit(buf, wobj.write, pp[i].data)
+ i = i + 1
+ text = wobj.data
+ del wobj
+ if text:
+ wm(' ')
+ while 1:
+ pos = re_newline.search(text)
+ if pos < 0:
+ break
+ print 'WARNING: found newline in csline arg'
+ wm(text[:pos] + ' ')
+ text = text[pos+1:]
+ wm(text)
+ if i >= length or \
+ pp[i].chtype not in (chunk_type(CSLINE),
+ chunk_type(ENDLINE), chunk_type(DENDLINE)) \
+ and (pp[i].chtype != chunk_type(PLAIN)
+ or s(buf, pp[i].data)[0] != '\n'):
+ wm('\n')
+
+ elif ch.chtype == chunk_type(COMMENT):
## print 'COMMENT: previous chunk =', pp[i-2]
## if pp[i-2].chtype == chunk_type(PLAIN):
## print 'PLAINTEXT =', `s(buf, pp[i-2].data)`
- if s(buf, ch.data) and \
- regex.match('^[ \t]*$', s(buf, ch.data)) < 0:
- if i >= 2 and pp[i-2].chtype not in \
- (chunk_type(ENDLINE), chunk_type(DENDLINE)) \
- and not (pp[i-2].chtype == chunk_type(PLAIN) \
- and regex.match('\\(.\\|\n\\)*[ \t]*\n$', s(buf, pp[i-2].data)) >= 0):
- print 'ADDING NEWLINE'
- wm('\n')
- wm('@c ' + s(buf, ch.data))
- elif ch.chtype == chunk_type(IGNORE):
- pass
- else:
- try:
- str = `s(buf, ch.data)`
- except TypeError:
- str = `ch.data`
- if len(str) > 400:
- str = str[:400] + '...'
- print 'warning:', ch.chtype, 'not handled, data ' + str
+ if s(buf, ch.data) and \
+ regex.match('^[ \t]*$', s(buf, ch.data)) < 0:
+ if i >= 2 and pp[i-2].chtype not in \
+ (chunk_type(ENDLINE), chunk_type(DENDLINE)) \
+ and not (pp[i-2].chtype == chunk_type(PLAIN)
+ and regex.match('\\(.\\|\n\\)*[ \t]*\n$', s(buf, pp[i-2].data)) >= 0):
+ print 'ADDING NEWLINE'
+ wm('\n')
+ wm('@c ' + s(buf, ch.data))
+ elif ch.chtype == chunk_type(IGNORE):
+ pass
+ else:
+ try:
+ str = `s(buf, ch.data)`
+ except TypeError:
+ str = `ch.data`
+ if len(str) > 400:
+ str = str[:400] + '...'
+ print 'warning:', ch.chtype, 'not handled, data ' + str
def main():
- outfile = None
- headerfile = 'texipre.dat'
- trailerfile = 'texipost.dat'
-
- try:
- opts, args = getopt.getopt(sys.argv[1:], 'o:h:t:')
- except getopt.error:
- args = []
-
- if not args:
- print 'usage: partparse [-o outfile] [-h headerfile]',
- print '[-t trailerfile] file ...'
- sys.exit(2)
-
- for opt, arg in opts:
- if opt == '-o': outfile = arg
- if opt == '-h': headerfile = arg
- if opt == '-t': trailerfile = arg
-
- if not outfile:
- root, ext = os.path.splitext(args[0])
- outfile = root + '.texi'
-
- if outfile in args:
- print 'will not overwrite input file', outfile
- sys.exit(2)
-
- outf = open(outfile, 'w')
- outf.write(open(headerfile, 'r').read())
-
- for file in args:
- if len(args) > 1: print '='*20, file, '='*20
- buf = open(file, 'r').read()
- w, pp = parseit(buf)
- startchange()
- changeit(buf, pp)
- dumpit(buf, outf.write, pp)
-
- outf.write(open(trailerfile, 'r').read())
-
- outf.close()
+ outfile = None
+ headerfile = 'texipre.dat'
+ trailerfile = 'texipost.dat'
+
+ try:
+ opts, args = getopt.getopt(sys.argv[1:], 'o:h:t:')
+ except getopt.error:
+ args = []
+
+ if not args:
+ print 'usage: partparse [-o outfile] [-h headerfile]',
+ print '[-t trailerfile] file ...'
+ sys.exit(2)
+
+ for opt, arg in opts:
+ if opt == '-o': outfile = arg
+ if opt == '-h': headerfile = arg
+ if opt == '-t': trailerfile = arg
+
+ if not outfile:
+ root, ext = os.path.splitext(args[0])
+ outfile = root + '.texi'
+
+ if outfile in args:
+ print 'will not overwrite input file', outfile
+ sys.exit(2)
+
+ outf = open(outfile, 'w')
+ outf.write(open(headerfile, 'r').read())
+
+ for file in args:
+ if len(args) > 1: print '='*20, file, '='*20
+ buf = open(file, 'r').read()
+ w, pp = parseit(buf)
+ startchange()
+ changeit(buf, pp)
+ dumpit(buf, outf.write, pp)
+
+ outf.write(open(trailerfile, 'r').read())
+
+ outf.close()
if __name__ == "__main__":
main()