From 10ff0e06801af15050848c701f606ac5de3ebc06 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 1 Nov 2008 17:35:50 +0000
Subject: Moved from private repository.

---
 COPYING                  |  340 ++++
 Makefile.in              |   75 +
 aapl/COPYING             |  502 ++++++
 aapl/README              |    6 +
 aapl/astring.h           |  808 +++++++++
 aapl/avlbasic.h          |   65 +
 aapl/avlcommon.h         | 1630 ++++++++++++++++++
 aapl/avlibasic.h         |   67 +
 aapl/avlikeyless.h       |   64 +
 aapl/avlimap.h           |   77 +
 aapl/avlimel.h           |   79 +
 aapl/avlimelkey.h        |   76 +
 aapl/avliset.h           |   75 +
 aapl/avlitree.h          |   78 +
 aapl/avlkeyless.h        |   58 +
 aapl/avlmap.h            |   74 +
 aapl/avlmel.h            |   74 +
 aapl/avlmelkey.h         |   71 +
 aapl/avlset.h            |   70 +
 aapl/avltree.h           |   73 +
 aapl/bstcommon.h         |  814 +++++++++
 aapl/bstmap.h            |  113 ++
 aapl/bstset.h            |   86 +
 aapl/bsttable.h          |   84 +
 aapl/bubblesort.h        |   94 ++
 aapl/compare.h           |  273 +++
 aapl/dlcommon.h          |  790 +++++++++
 aapl/dlist.h             |   64 +
 aapl/dlistmel.h          |   71 +
 aapl/dlistval.h          |   71 +
 aapl/insertsort.h        |   94 ++
 aapl/mergesort.h         |  140 ++
 aapl/quicksort.h         |  185 ++
 aapl/resize.h            |  344 ++++
 aapl/sbstmap.h           |  121 ++
 aapl/sbstset.h           |   94 ++
 aapl/sbsttable.h         |   93 +
 aapl/svector.h           | 1350 +++++++++++++++
 aapl/table.h             |  252 +++
 aapl/vector.h            | 1189 +++++++++++++
 colm.vim                 |   89 +
 colm/Makefile.in         |  123 ++
 colm/bytecode.cpp        | 4092 ++++++++++++++++++++++++++++++++++++++++++++
 colm/bytecode.h          |  615 +++++++
 colm/closure.cpp         |  450 +++++
 colm/colm.h              |   92 +
 colm/compile.cpp         | 2492 +++++++++++++++++++++++++++
 colm/dotgen.cpp          |  369 ++++
 colm/dotgen.h            |   51 +
 colm/fsmap.cpp           |  854 ++++++++++
 colm/fsmattach.cpp       |  425 +++++
 colm/fsmbase.cpp         |  602 +++++++
 colm/fsmcodegen.cpp      | 1089 ++++++++++++
 colm/fsmcodegen.h        |  214 +++
 colm/fsmexec.cpp         |  209 +++
 colm/fsmgraph.cpp        | 1399 +++++++++++++++
 colm/fsmgraph.h          | 1392 +++++++++++++++
 colm/fsmmin.cpp          |  732 ++++++++
 colm/fsmrun.cpp          |  890 ++++++++++
 colm/fsmrun.h            |  132 ++
 colm/fsmstate.cpp        |  467 +++++
 colm/input.cpp           |  144 ++
 colm/input.h             |  145 ++
 colm/list.cpp            |  105 ++
 colm/lmparse.kh          |  106 ++
 colm/lmparse.kl          | 2013 ++++++++++++++++++++++
 colm/lmscan.h            |  131 ++
 colm/lmscan.rl           |  545 ++++++
 colm/main.cpp            |  357 ++++
 colm/map.cpp             |  806 +++++++++
 colm/parsedata.cpp       | 1830 ++++++++++++++++++++
 colm/parsedata.h         |  904 ++++++++++
 colm/parsetree.cpp       | 2172 ++++++++++++++++++++++++
 colm/parsetree.h         | 1605 ++++++++++++++++++
 colm/pdabuild.cpp        | 1698 +++++++++++++++++++
 colm/pdacodegen.cpp      |  536 ++++++
 colm/pdacodegen.h        |  105 ++
 colm/pdagraph.cpp        |  518 ++++++
 colm/pdagraph.h          |  504 ++++++
 colm/pdarun.cpp          |  646 +++++++
 colm/pdarun.h            |  511 ++++++
 colm/redbuild.cpp        |  645 +++++++
 colm/redbuild.h          |  161 ++
 colm/redfsm.cpp          | 1112 ++++++++++++
 colm/redfsm.h            |  531 ++++++
 colm/string.cpp          |  177 ++
 colm/tree.cpp            |  160 ++
 common/Makefile.in       |   67 +
 common/buffer.h          |   55 +
 common/common.cpp        |  257 +++
 common/common.h          |  283 ++++
 common/config.h.in       |   50 +
 common/pcheck.h          |   48 +
 configure                | 4222 ++++++++++++++++++++++++++++++++++++++++++++++
 configure.in             |   79 +
 test/Makefile            |   46 +
 test/backtrack1.lm       |   24 +
 test/backtrack2.lm       |   24 +
 test/backtrack3.lm       |   27 +
 test/btscan.in           |    2 +
 test/btscan.lm           |   34 +
 test/constructex.in      |    3 +
 test/constructex.lm      |   37 +
 test/counting1.in        |    1 +
 test/counting1.lm        |   91 +
 test/counting2.lm        |   82 +
 test/counting3.lm        |   92 +
 test/counting4.lm        |   89 +
 test/cxx/Makefile        |   34 +
 test/cxx/cxx.lm          | 2163 ++++++++++++++++++++++++
 test/cxx/input01.cpp     |   17 +
 test/cxx/input02.cpp     |   16 +
 test/cxx/input03.cpp     |   19 +
 test/cxx/input04.cpp     |   17 +
 test/cxx/input05.cpp     |    8 +
 test/cxx/input06.cpp     |    7 +
 test/cxx/input07.cpp     |   18 +
 test/cxx/input08.cpp     |   13 +
 test/cxx/input09.cpp     |    7 +
 test/cxx/input10.cpp     |   11 +
 test/cxx/input11.cpp     |    2 +
 test/cxx/input12.cpp     |    8 +
 test/cxx/input13.cpp     |   14 +
 test/cxx/preproc         |    4 +
 test/diff/Makefile       |   34 +
 test/diff/diff.lm        |   84 +
 test/diff/input1.diff    |   86 +
 test/dns/Makefile        |   20 +
 test/dns/dns.lm          |  488 ++++++
 test/dns/dumpdns         |   11 +
 test/dns/extract.c       |   48 +
 test/heredoc.in          |    3 +
 test/heredoc.lm          |   45 +
 test/html/Makefile       |   34 +
 test/html/html-lextag.lm |  324 ++++
 test/html/html.lm        |  307 ++++
 test/html/input01.html   |    8 +
 test/http/Makefile       |   34 +
 test/http/http.lm        |   68 +
 test/http/input1         |    2 +
 test/http/input2         |   13 +
 test/http/input3         |    8 +
 test/http/xinetd.conf    |   10 +
 test/island.in           |   19 +
 test/island.lm           |   57 +
 test/liftattrs.in        |    3 +
 test/liftattrs.lm        |   74 +
 test/mailbox.in          |   29 +
 test/mailbox.lm          |   44 +
 test/matchex.in          |    3 +
 test/matchex.lm          |   34 +
 test/maxlen.lm           |   44 +
 test/nestedcomm.in       |    1 +
 test/nestedcomm.lm       |   41 +
 test/python/Makefile     |   18 +
 test/python/input1.py    |   18 +
 test/python/input2.py    |   20 +
 test/python/input3.py    |    1 +
 test/python/input4.py    |   10 +
 test/python/python.lm    |  726 ++++++++
 test/ragelambig.in       |    1 +
 test/ragelambig1.lm      |   65 +
 test/ragelambig2.lm      |   65 +
 test/ragelambig3.lm      |   64 +
 test/ragelambig4.lm      |   69 +
 test/rediv.in            |    1 +
 test/rediv.lm            |   92 +
 test/ruby/Makefile       |   34 +
 test/ruby/ruby.lm        |  627 +++++++
 test/rubyhere.in         |    8 +
 test/rubyhere.lm         |   89 +
 test/string.in           |    2 +
 test/string.lm           |   54 +
 test/superid.in          |    1 +
 test/superid.lm          |   59 +
 test/tags.in             |    1 +
 test/tags.lm             |   82 +
 test/til.in              |   14 +
 test/til.lm              |  124 ++
 test/travs1.in           |    1 +
 test/travs1.lm           |  144 ++
 test/travs2.in           |    1 +
 test/travs2.lm           |   93 +
 test/xml/Makefile        |   34 +
 test/xml/xml.in          | 3962 +++++++++++++++++++++++++++++++++++++++++++
 test/xml/xml.lm          |  167 ++
 version.mk               |    2 +
 187 files changed, 62225 insertions(+)
 create mode 100644 COPYING
 create mode 100644 Makefile.in
 create mode 100644 aapl/COPYING
 create mode 100644 aapl/README
 create mode 100644 aapl/astring.h
 create mode 100644 aapl/avlbasic.h
 create mode 100644 aapl/avlcommon.h
 create mode 100644 aapl/avlibasic.h
 create mode 100644 aapl/avlikeyless.h
 create mode 100644 aapl/avlimap.h
 create mode 100644 aapl/avlimel.h
 create mode 100644 aapl/avlimelkey.h
 create mode 100644 aapl/avliset.h
 create mode 100644 aapl/avlitree.h
 create mode 100644 aapl/avlkeyless.h
 create mode 100644 aapl/avlmap.h
 create mode 100644 aapl/avlmel.h
 create mode 100644 aapl/avlmelkey.h
 create mode 100644 aapl/avlset.h
 create mode 100644 aapl/avltree.h
 create mode 100644 aapl/bstcommon.h
 create mode 100644 aapl/bstmap.h
 create mode 100644 aapl/bstset.h
 create mode 100644 aapl/bsttable.h
 create mode 100644 aapl/bubblesort.h
 create mode 100644 aapl/compare.h
 create mode 100644 aapl/dlcommon.h
 create mode 100644 aapl/dlist.h
 create mode 100644 aapl/dlistmel.h
 create mode 100644 aapl/dlistval.h
 create mode 100644 aapl/insertsort.h
 create mode 100644 aapl/mergesort.h
 create mode 100644 aapl/quicksort.h
 create mode 100644 aapl/resize.h
 create mode 100644 aapl/sbstmap.h
 create mode 100644 aapl/sbstset.h
 create mode 100644 aapl/sbsttable.h
 create mode 100644 aapl/svector.h
 create mode 100644 aapl/table.h
 create mode 100644 aapl/vector.h
 create mode 100644 colm.vim
 create mode 100644 colm/Makefile.in
 create mode 100644 colm/bytecode.cpp
 create mode 100644 colm/bytecode.h
 create mode 100644 colm/closure.cpp
 create mode 100644 colm/colm.h
 create mode 100644 colm/compile.cpp
 create mode 100644 colm/dotgen.cpp
 create mode 100644 colm/dotgen.h
 create mode 100644 colm/fsmap.cpp
 create mode 100644 colm/fsmattach.cpp
 create mode 100644 colm/fsmbase.cpp
 create mode 100644 colm/fsmcodegen.cpp
 create mode 100644 colm/fsmcodegen.h
 create mode 100644 colm/fsmexec.cpp
 create mode 100644 colm/fsmgraph.cpp
 create mode 100644 colm/fsmgraph.h
 create mode 100644 colm/fsmmin.cpp
 create mode 100644 colm/fsmrun.cpp
 create mode 100644 colm/fsmrun.h
 create mode 100644 colm/fsmstate.cpp
 create mode 100644 colm/input.cpp
 create mode 100644 colm/input.h
 create mode 100644 colm/list.cpp
 create mode 100644 colm/lmparse.kh
 create mode 100644 colm/lmparse.kl
 create mode 100644 colm/lmscan.h
 create mode 100644 colm/lmscan.rl
 create mode 100644 colm/main.cpp
 create mode 100644 colm/map.cpp
 create mode 100644 colm/parsedata.cpp
 create mode 100644 colm/parsedata.h
 create mode 100644 colm/parsetree.cpp
 create mode 100644 colm/parsetree.h
 create mode 100644 colm/pdabuild.cpp
 create mode 100644 colm/pdacodegen.cpp
 create mode 100644 colm/pdacodegen.h
 create mode 100644 colm/pdagraph.cpp
 create mode 100644 colm/pdagraph.h
 create mode 100644 colm/pdarun.cpp
 create mode 100644 colm/pdarun.h
 create mode 100644 colm/redbuild.cpp
 create mode 100644 colm/redbuild.h
 create mode 100644 colm/redfsm.cpp
 create mode 100644 colm/redfsm.h
 create mode 100644 colm/string.cpp
 create mode 100644 colm/tree.cpp
 create mode 100644 common/Makefile.in
 create mode 100644 common/buffer.h
 create mode 100644 common/common.cpp
 create mode 100644 common/common.h
 create mode 100644 common/config.h.in
 create mode 100644 common/pcheck.h
 create mode 100755 configure
 create mode 100644 configure.in
 create mode 100644 test/Makefile
 create mode 100644 test/backtrack1.lm
 create mode 100644 test/backtrack2.lm
 create mode 100644 test/backtrack3.lm
 create mode 100644 test/btscan.in
 create mode 100644 test/btscan.lm
 create mode 100644 test/constructex.in
 create mode 100644 test/constructex.lm
 create mode 100644 test/counting1.in
 create mode 100644 test/counting1.lm
 create mode 100644 test/counting2.lm
 create mode 100644 test/counting3.lm
 create mode 100644 test/counting4.lm
 create mode 100644 test/cxx/Makefile
 create mode 100644 test/cxx/cxx.lm
 create mode 100644 test/cxx/input01.cpp
 create mode 100644 test/cxx/input02.cpp
 create mode 100644 test/cxx/input03.cpp
 create mode 100644 test/cxx/input04.cpp
 create mode 100644 test/cxx/input05.cpp
 create mode 100644 test/cxx/input06.cpp
 create mode 100644 test/cxx/input07.cpp
 create mode 100644 test/cxx/input08.cpp
 create mode 100644 test/cxx/input09.cpp
 create mode 100644 test/cxx/input10.cpp
 create mode 100644 test/cxx/input11.cpp
 create mode 100644 test/cxx/input12.cpp
 create mode 100644 test/cxx/input13.cpp
 create mode 100755 test/cxx/preproc
 create mode 100644 test/diff/Makefile
 create mode 100644 test/diff/diff.lm
 create mode 100644 test/diff/input1.diff
 create mode 100644 test/dns/Makefile
 create mode 100644 test/dns/dns.lm
 create mode 100644 test/dns/dumpdns
 create mode 100644 test/dns/extract.c
 create mode 100644 test/heredoc.in
 create mode 100644 test/heredoc.lm
 create mode 100644 test/html/Makefile
 create mode 100644 test/html/html-lextag.lm
 create mode 100644 test/html/html.lm
 create mode 100644 test/html/input01.html
 create mode 100644 test/http/Makefile
 create mode 100644 test/http/http.lm
 create mode 100644 test/http/input1
 create mode 100644 test/http/input2
 create mode 100644 test/http/input3
 create mode 100644 test/http/xinetd.conf
 create mode 100644 test/island.in
 create mode 100644 test/island.lm
 create mode 100644 test/liftattrs.in
 create mode 100644 test/liftattrs.lm
 create mode 100644 test/mailbox.in
 create mode 100644 test/mailbox.lm
 create mode 100644 test/matchex.in
 create mode 100644 test/matchex.lm
 create mode 100644 test/maxlen.lm
 create mode 100644 test/nestedcomm.in
 create mode 100644 test/nestedcomm.lm
 create mode 100644 test/python/Makefile
 create mode 100644 test/python/input1.py
 create mode 100644 test/python/input2.py
 create mode 100644 test/python/input3.py
 create mode 100644 test/python/input4.py
 create mode 100644 test/python/python.lm
 create mode 100644 test/ragelambig.in
 create mode 100644 test/ragelambig1.lm
 create mode 100644 test/ragelambig2.lm
 create mode 100644 test/ragelambig3.lm
 create mode 100644 test/ragelambig4.lm
 create mode 100644 test/rediv.in
 create mode 100644 test/rediv.lm
 create mode 100644 test/ruby/Makefile
 create mode 100644 test/ruby/ruby.lm
 create mode 100644 test/rubyhere.in
 create mode 100644 test/rubyhere.lm
 create mode 100644 test/string.in
 create mode 100644 test/string.lm
 create mode 100644 test/superid.in
 create mode 100644 test/superid.lm
 create mode 100644 test/tags.in
 create mode 100644 test/tags.lm
 create mode 100644 test/til.in
 create mode 100644 test/til.lm
 create mode 100644 test/travs1.in
 create mode 100644 test/travs1.lm
 create mode 100644 test/travs2.in
 create mode 100644 test/travs2.lm
 create mode 100644 test/xml/Makefile
 create mode 100644 test/xml/xml.in
 create mode 100644 test/xml/xml.lm
 create mode 100644 version.mk

diff --git a/COPYING b/COPYING
new file mode 100644
index 00000000..ec0507be
--- /dev/null
+++ b/COPYING
@@ -0,0 +1,340 @@
+                    GNU GENERAL PUBLIC LICENSE
+                       Version 2, June 1991
+
+ Copyright (C) 1989, 1991 Free Software Foundation, Inc.
+     59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+ Everyone is permitted to copy and distribute verbatim copies
+ of this license document, but changing it is not allowed.
+
+                            Preamble
+
+  The licenses for most software are designed to take away your
+freedom to share and change it.  By contrast, the GNU General Public
+License is intended to guarantee your freedom to share and change free
+software--to make sure the software is free for all its users.  This
+General Public License applies to most of the Free Software
+Foundation's software and to any other program whose authors commit to
+using it.  (Some other Free Software Foundation software is covered by
+the GNU Library General Public License instead.)  You can apply it to
+your programs, too.
+
+  When we speak of free software, we are referring to freedom, not
+price.  Our General Public Licenses are designed to make sure that you
+have the freedom to distribute copies of free software (and charge for
+this service if you wish), that you receive source code or can get it
+if you want it, that you can change the software or use pieces of it
+in new free programs; and that you know you can do these things.
+
+  To protect your rights, we need to make restrictions that forbid
+anyone to deny you these rights or to ask you to surrender the rights.
+These restrictions translate to certain responsibilities for you if you
+distribute copies of the software, or if you modify it.
+
+  For example, if you distribute copies of such a program, whether
+gratis or for a fee, you must give the recipients all the rights that
+you have.  You must make sure that they, too, receive or can get the
+source code.  And you must show them these terms so they know their
+rights.
+
+  We protect your rights with two steps: (1) copyright the software, and
+(2) offer you this license which gives you legal permission to copy,
+distribute and/or modify the software.
+
+  Also, for each author's protection and ours, we want to make certain
+that everyone understands that there is no warranty for this free
+software.  If the software is modified by someone else and passed on, we
+want its recipients to know that what they have is not the original, so
+that any problems introduced by others will not reflect on the original
+authors' reputations.
+
+  Finally, any free program is threatened constantly by software
+patents.  We wish to avoid the danger that redistributors of a free
+program will individually obtain patent licenses, in effect making the
+program proprietary.  To prevent this, we have made it clear that any
+patent must be licensed for everyone's free use or not licensed at all.
+
+  The precise terms and conditions for copying, distribution and
+modification follow.
+
+                    GNU GENERAL PUBLIC LICENSE
+   TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION
+
+  0. This License applies to any program or other work which contains
+a notice placed by the copyright holder saying it may be distributed
+under the terms of this General Public License.  The "Program", below,
+refers to any such program or work, and a "work based on the Program"
+means either the Program or any derivative work under copyright law:
+that is to say, a work containing the Program or a portion of it,
+either verbatim or with modifications and/or translated into another
+language.  (Hereinafter, translation is included without limitation in
+the term "modification".)  Each licensee is addressed as "you".
+
+Activities other than copying, distribution and modification are not
+covered by this License; they are outside its scope.  The act of
+running the Program is not restricted, and the output from the Program
+is covered only if its contents constitute a work based on the
+Program (independent of having been made by running the Program).
+Whether that is true depends on what the Program does.
+
+  1. You may copy and distribute verbatim copies of the Program's
+source code as you receive it, in any medium, provided that you
+conspicuously and appropriately publish on each copy an appropriate
+copyright notice and disclaimer of warranty; keep intact all the
+notices that refer to this License and to the absence of any warranty;
+and give any other recipients of the Program a copy of this License
+along with the Program.
+
+You may charge a fee for the physical act of transferring a copy, and
+you may at your option offer warranty protection in exchange for a fee.
+
+  2. You may modify your copy or copies of the Program or any portion
+of it, thus forming a work based on the Program, and copy and
+distribute such modifications or work under the terms of Section 1
+above, provided that you also meet all of these conditions:
+
+    a) You must cause the modified files to carry prominent notices
+    stating that you changed the files and the date of any change.
+
+    b) You must cause any work that you distribute or publish, that in
+    whole or in part contains or is derived from the Program or any
+    part thereof, to be licensed as a whole at no charge to all third
+    parties under the terms of this License.
+
+    c) If the modified program normally reads commands interactively
+    when run, you must cause it, when started running for such
+    interactive use in the most ordinary way, to print or display an
+    announcement including an appropriate copyright notice and a
+    notice that there is no warranty (or else, saying that you provide
+    a warranty) and that users may redistribute the program under
+    these conditions, and telling the user how to view a copy of this
+    License.  (Exception: if the Program itself is interactive but
+    does not normally print such an announcement, your work based on
+    the Program is not required to print an announcement.)
+
+These requirements apply to the modified work as a whole.  If
+identifiable sections of that work are not derived from the Program,
+and can be reasonably considered independent and separate works in
+themselves, then this License, and its terms, do not apply to those
+sections when you distribute them as separate works.  But when you
+distribute the same sections as part of a whole which is a work based
+on the Program, the distribution of the whole must be on the terms of
+this License, whose permissions for other licensees extend to the
+entire whole, and thus to each and every part regardless of who wrote it.
+
+Thus, it is not the intent of this section to claim rights or contest
+your rights to work written entirely by you; rather, the intent is to
+exercise the right to control the distribution of derivative or
+collective works based on the Program.
+
+In addition, mere aggregation of another work not based on the Program
+with the Program (or with a work based on the Program) on a volume of
+a storage or distribution medium does not bring the other work under
+the scope of this License.
+
+  3. You may copy and distribute the Program (or a work based on it,
+under Section 2) in object code or executable form under the terms of
+Sections 1 and 2 above provided that you also do one of the following:
+
+    a) Accompany it with the complete corresponding machine-readable
+    source code, which must be distributed under the terms of Sections
+    1 and 2 above on a medium customarily used for software interchange; or,
+
+    b) Accompany it with a written offer, valid for at least three
+    years, to give any third party, for a charge no more than your
+    cost of physically performing source distribution, a complete
+    machine-readable copy of the corresponding source code, to be
+    distributed under the terms of Sections 1 and 2 above on a medium
+    customarily used for software interchange; or,
+
+    c) Accompany it with the information you received as to the offer
+    to distribute corresponding source code.  (This alternative is
+    allowed only for noncommercial distribution and only if you
+    received the program in object code or executable form with such
+    an offer, in accord with Subsection b above.)
+
+The source code for a work means the preferred form of the work for
+making modifications to it.  For an executable work, complete source
+code means all the source code for all modules it contains, plus any
+associated interface definition files, plus the scripts used to
+control compilation and installation of the executable.  However, as a
+special exception, the source code distributed need not include
+anything that is normally distributed (in either source or binary
+form) with the major components (compiler, kernel, and so on) of the
+operating system on which the executable runs, unless that component
+itself accompanies the executable.
+
+If distribution of executable or object code is made by offering
+access to copy from a designated place, then offering equivalent
+access to copy the source code from the same place counts as
+distribution of the source code, even though third parties are not
+compelled to copy the source along with the object code.
+
+  4. You may not copy, modify, sublicense, or distribute the Program
+except as expressly provided under this License.  Any attempt
+otherwise to copy, modify, sublicense or distribute the Program is
+void, and will automatically terminate your rights under this License.
+However, parties who have received copies, or rights, from you under
+this License will not have their licenses terminated so long as such
+parties remain in full compliance.
+
+  5. You are not required to accept this License, since you have not
+signed it.  However, nothing else grants you permission to modify or
+distribute the Program or its derivative works.  These actions are
+prohibited by law if you do not accept this License.  Therefore, by
+modifying or distributing the Program (or any work based on the
+Program), you indicate your acceptance of this License to do so, and
+all its terms and conditions for copying, distributing or modifying
+the Program or works based on it.
+
+  6. Each time you redistribute the Program (or any work based on the
+Program), the recipient automatically receives a license from the
+original licensor to copy, distribute or modify the Program subject to
+these terms and conditions.  You may not impose any further
+restrictions on the recipients' exercise of the rights granted herein.
+You are not responsible for enforcing compliance by third parties to
+this License.
+
+  7. If, as a consequence of a court judgment or allegation of patent
+infringement or for any other reason (not limited to patent issues),
+conditions are imposed on you (whether by court order, agreement or
+otherwise) that contradict the conditions of this License, they do not
+excuse you from the conditions of this License.  If you cannot
+distribute so as to satisfy simultaneously your obligations under this
+License and any other pertinent obligations, then as a consequence you
+may not distribute the Program at all.  For example, if a patent
+license would not permit royalty-free redistribution of the Program by
+all those who receive copies directly or indirectly through you, then
+the only way you could satisfy both it and this License would be to
+refrain entirely from distribution of the Program.
+
+If any portion of this section is held invalid or unenforceable under
+any particular circumstance, the balance of the section is intended to
+apply and the section as a whole is intended to apply in other
+circumstances.
+
+It is not the purpose of this section to induce you to infringe any
+patents or other property right claims or to contest validity of any
+such claims; this section has the sole purpose of protecting the
+integrity of the free software distribution system, which is
+implemented by public license practices.  Many people have made
+generous contributions to the wide range of software distributed
+through that system in reliance on consistent application of that
+system; it is up to the author/donor to decide if he or she is willing
+to distribute software through any other system and a licensee cannot
+impose that choice.
+
+This section is intended to make thoroughly clear what is believed to
+be a consequence of the rest of this License.
+
+  8. If the distribution and/or use of the Program is restricted in
+certain countries either by patents or by copyrighted interfaces, the
+original copyright holder who places the Program under this License
+may add an explicit geographical distribution limitation excluding
+those countries, so that distribution is permitted only in or among
+countries not thus excluded.  In such case, this License incorporates
+the limitation as if written in the body of this License.
+
+  9. The Free Software Foundation may publish revised and/or new versions
+of the General Public License from time to time.  Such new versions will
+be similar in spirit to the present version, but may differ in detail to
+address new problems or concerns.
+
+Each version is given a distinguishing version number.  If the Program
+specifies a version number of this License which applies to it and "any
+later version", you have the option of following the terms and conditions
+either of that version or of any later version published by the Free
+Software Foundation.  If the Program does not specify a version number of
+this License, you may choose any version ever published by the Free Software
+Foundation.
+
+  10. If you wish to incorporate parts of the Program into other free
+programs whose distribution conditions are different, write to the author
+to ask for permission.  For software which is copyrighted by the Free
+Software Foundation, write to the Free Software Foundation; we sometimes
+make exceptions for this.  Our decision will be guided by the two goals
+of preserving the free status of all derivatives of our free software and
+of promoting the sharing and reuse of software generally.
+
+                            NO WARRANTY
+
+  11. BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY
+FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW.  EXCEPT WHEN
+OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES
+PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED
+OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.  THE ENTIRE RISK AS
+TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU.  SHOULD THE
+PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING,
+REPAIR OR CORRECTION.
+
+  12. IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING
+WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR
+REDISTRIBUTE THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES,
+INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING
+OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED
+TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY
+YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER
+PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE
+POSSIBILITY OF SUCH DAMAGES.
+
+                     END OF TERMS AND CONDITIONS
+
+            How to Apply These Terms to Your New Programs
+
+  If you develop a new program, and you want it to be of the greatest
+possible use to the public, the best way to achieve this is to make it
+free software which everyone can redistribute and change under these terms.
+
+  To do so, attach the following notices to the program.  It is safest
+to attach them to the start of each source file to most effectively
+convey the exclusion of warranty; and each file should have at least
+the "copyright" line and a pointer to where the full notice is found.
+
+    <one line to give the program's name and a brief idea of what it does.>
+    Copyright (C) <year>  <name of author>
+
+    This program is free software; you can redistribute it and/or modify
+    it under the terms of the GNU General Public License as published by
+    the Free Software Foundation; either version 2 of the License, or
+    (at your option) any later version.
+
+    This program is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+    GNU General Public License for more details.
+
+    You should have received a copy of the GNU General Public License
+    along with this program; if not, write to the Free Software
+    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+
+
+Also add information on how to contact you by electronic and paper mail.
+
+If the program is interactive, make it output a short notice like this
+when it starts in an interactive mode:
+
+    Gnomovision version 69, Copyright (C) year name of author
+    Gnomovision comes with ABSOLUTELY NO WARRANTY; for details type `show w'.
+    This is free software, and you are welcome to redistribute it
+    under certain conditions; type `show c' for details.
+
+The hypothetical commands `show w' and `show c' should show the appropriate
+parts of the General Public License.  Of course, the commands you use may
+be called something other than `show w' and `show c'; they could even be
+mouse-clicks or menu items--whatever suits your program.
+
+You should also get your employer (if you work as a programmer) or your
+school, if any, to sign a "copyright disclaimer" for the program, if
+necessary.  Here is a sample; alter the names:
+
+  Yoyodyne, Inc., hereby disclaims all copyright interest in the program
+  `Gnomovision' (which makes passes at compilers) written by James Hacker.
+
+  <signature of Ty Coon>, 1 April 1989
+  Ty Coon, President of Vice
+
+This General Public License does not permit incorporating your program into
+proprietary programs.  If your program is a subroutine library, you may
+consider it more useful to permit linking proprietary applications with the
+library.  If this is what you want to do, use the GNU Library General
+Public License instead of this License.
diff --git a/Makefile.in b/Makefile.in
new file mode 100644
index 00000000..26e4b879
--- /dev/null
+++ b/Makefile.in
@@ -0,0 +1,75 @@
+#
+#   Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Colm.
+#
+#   Colm is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Colm is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Colm; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+BUILD_SUBDIRS = common colm
+ALL_SUBDIRS = $(BUILD_SUBDIRS) test
+
+#*************************************
+
+# Programs
+CXX = @CXX@
+
+# Get the version info.
+include version.mk
+
+# build targets
+all: $(BUILD_SUBDIRS)
+
+.PHONY: $(BUILD_SUBDIRS)
+
+$(BUILD_SUBDIRS):
+	@cd $@ && $(MAKE)
+
+# clean targets.
+
+CLEAN_SUBDIRS = $(ALL_SUBDIRS:%=%-clean)
+
+.PHONY: $(CLEAN_SUBDIRS)
+
+$(CLEAN_SUBDIRS):
+	@cd $(@:%-clean=%) && $(MAKE) clean
+
+clean: $(CLEAN_SUBDIRS)
+	rm -f tags
+
+# distclean targets: run distclean in each subdirectory, then drop configure output here.
+
+DISTCLEAN_SUBDIRS = $(ALL_SUBDIRS:%=%-distclean)
+
+.PHONY: $(DISTCLEAN_SUBDIRS)
+
+$(DISTCLEAN_SUBDIRS):
+	@cd $(@:%-distclean=%) && $(MAKE) distclean
+
+distclean: $(DISTCLEAN_SUBDIRS)
+	rm -f Makefile config.cache config.status config.log
+
+#install targets
+
+INSTALL_SUBDIRS = $(BUILD_SUBDIRS:%=%-install)
+
+.PHONY: $(INSTALL_SUBDIRS)
+
+$(INSTALL_SUBDIRS):
+	@cd $(@:%-install=%) && $(MAKE) install
+
+install: $(INSTALL_SUBDIRS)
+
diff --git a/aapl/COPYING b/aapl/COPYING
new file mode 100644
index 00000000..c6ed510b
--- /dev/null
+++ b/aapl/COPYING
@@ -0,0 +1,502 @@
+                  GNU LESSER GENERAL PUBLIC LICENSE
+                       Version 2.1, February 1999
+
+ Copyright (C) 1991, 1999 Free Software Foundation, Inc.
+     59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+ Everyone is permitted to copy and distribute verbatim copies
+ of this license document, but changing it is not allowed.
+
+[This is the first released version of the Lesser GPL.  It also counts
+ as the successor of the GNU Library Public License, version 2, hence
+ the version number 2.1.]
+
+                            Preamble
+
+  The licenses for most software are designed to take away your
+freedom to share and change it.  By contrast, the GNU General Public
+Licenses are intended to guarantee your freedom to share and change
+free software--to make sure the software is free for all its users.
+
+  This license, the Lesser General Public License, applies to some
+specially designated software packages--typically libraries--of the
+Free Software Foundation and other authors who decide to use it.  You
+can use it too, but we suggest you first think carefully about whether
+this license or the ordinary General Public License is the better
+strategy to use in any particular case, based on the explanations below.
+
+  When we speak of free software, we are referring to freedom of use,
+not price.  Our General Public Licenses are designed to make sure that
+you have the freedom to distribute copies of free software (and charge
+for this service if you wish); that you receive source code or can get
+it if you want it; that you can change the software and use pieces of
+it in new free programs; and that you are informed that you can do
+these things.
+
+  To protect your rights, we need to make restrictions that forbid
+distributors to deny you these rights or to ask you to surrender these
+rights.  These restrictions translate to certain responsibilities for
+you if you distribute copies of the library or if you modify it.
+
+  For example, if you distribute copies of the library, whether gratis
+or for a fee, you must give the recipients all the rights that we gave
+you.  You must make sure that they, too, receive or can get the source
+code.  If you link other code with the library, you must provide
+complete object files to the recipients, so that they can relink them
+with the library after making changes to the library and recompiling
+it.  And you must show them these terms so they know their rights.
+
+  We protect your rights with a two-step method: (1) we copyright the
+library, and (2) we offer you this license, which gives you legal
+permission to copy, distribute and/or modify the library.
+
+  To protect each distributor, we want to make it very clear that
+there is no warranty for the free library.  Also, if the library is
+modified by someone else and passed on, the recipients should know
+that what they have is not the original version, so that the original
+author's reputation will not be affected by problems that might be
+introduced by others.
+
+  Finally, software patents pose a constant threat to the existence of
+any free program.  We wish to make sure that a company cannot
+effectively restrict the users of a free program by obtaining a
+restrictive license from a patent holder.  Therefore, we insist that
+any patent license obtained for a version of the library must be
+consistent with the full freedom of use specified in this license.
+
+  Most GNU software, including some libraries, is covered by the
+ordinary GNU General Public License.  This license, the GNU Lesser
+General Public License, applies to certain designated libraries, and
+is quite different from the ordinary General Public License.  We use
+this license for certain libraries in order to permit linking those
+libraries into non-free programs.
+
+  When a program is linked with a library, whether statically or using
+a shared library, the combination of the two is legally speaking a
+combined work, a derivative of the original library.  The ordinary
+General Public License therefore permits such linking only if the
+entire combination fits its criteria of freedom.  The Lesser General
+Public License permits more lax criteria for linking other code with
+the library.
+
+  We call this license the "Lesser" General Public License because it
+does Less to protect the user's freedom than the ordinary General
+Public License.  It also provides other free software developers Less
+of an advantage over competing non-free programs.  These disadvantages
+are the reason we use the ordinary General Public License for many
+libraries.  However, the Lesser license provides advantages in certain
+special circumstances.
+
+  For example, on rare occasions, there may be a special need to
+encourage the widest possible use of a certain library, so that it becomes
+a de-facto standard.  To achieve this, non-free programs must be
+allowed to use the library.  A more frequent case is that a free
+library does the same job as widely used non-free libraries.  In this
+case, there is little to gain by limiting the free library to free
+software only, so we use the Lesser General Public License.
+
+  In other cases, permission to use a particular library in non-free
+programs enables a greater number of people to use a large body of
+free software.  For example, permission to use the GNU C Library in
+non-free programs enables many more people to use the whole GNU
+operating system, as well as its variant, the GNU/Linux operating
+system.
+
+  Although the Lesser General Public License is Less protective of the
+users' freedom, it does ensure that the user of a program that is
+linked with the Library has the freedom and the wherewithal to run
+that program using a modified version of the Library.
+
+  The precise terms and conditions for copying, distribution and
+modification follow.  Pay close attention to the difference between a
+"work based on the library" and a "work that uses the library".  The
+former contains code derived from the library, whereas the latter must
+be combined with the library in order to run.
+
+                  GNU LESSER GENERAL PUBLIC LICENSE
+   TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION
+
+  0. This License Agreement applies to any software library or other
+program which contains a notice placed by the copyright holder or
+other authorized party saying it may be distributed under the terms of
+this Lesser General Public License (also called "this License").
+Each licensee is addressed as "you".
+
+  A "library" means a collection of software functions and/or data
+prepared so as to be conveniently linked with application programs
+(which use some of those functions and data) to form executables.
+
+  The "Library", below, refers to any such software library or work
+which has been distributed under these terms.  A "work based on the
+Library" means either the Library or any derivative work under
+copyright law: that is to say, a work containing the Library or a
+portion of it, either verbatim or with modifications and/or translated
+straightforwardly into another language.  (Hereinafter, translation is
+included without limitation in the term "modification".)
+
+  "Source code" for a work means the preferred form of the work for
+making modifications to it.  For a library, complete source code means
+all the source code for all modules it contains, plus any associated
+interface definition files, plus the scripts used to control compilation
+and installation of the library.
+
+  Activities other than copying, distribution and modification are not
+covered by this License; they are outside its scope.  The act of
+running a program using the Library is not restricted, and output from
+such a program is covered only if its contents constitute a work based
+on the Library (independent of the use of the Library in a tool for
+writing it).  Whether that is true depends on what the Library does
+and what the program that uses the Library does.
+  
+  1. You may copy and distribute verbatim copies of the Library's
+complete source code as you receive it, in any medium, provided that
+you conspicuously and appropriately publish on each copy an
+appropriate copyright notice and disclaimer of warranty; keep intact
+all the notices that refer to this License and to the absence of any
+warranty; and distribute a copy of this License along with the
+Library.
+
+  You may charge a fee for the physical act of transferring a copy,
+and you may at your option offer warranty protection in exchange for a
+fee.
+
+  2. You may modify your copy or copies of the Library or any portion
+of it, thus forming a work based on the Library, and copy and
+distribute such modifications or work under the terms of Section 1
+above, provided that you also meet all of these conditions:
+
+    a) The modified work must itself be a software library.
+
+    b) You must cause the files modified to carry prominent notices
+    stating that you changed the files and the date of any change.
+
+    c) You must cause the whole of the work to be licensed at no
+    charge to all third parties under the terms of this License.
+
+    d) If a facility in the modified Library refers to a function or a
+    table of data to be supplied by an application program that uses
+    the facility, other than as an argument passed when the facility
+    is invoked, then you must make a good faith effort to ensure that,
+    in the event an application does not supply such function or
+    table, the facility still operates, and performs whatever part of
+    its purpose remains meaningful.
+
+    (For example, a function in a library to compute square roots has
+    a purpose that is entirely well-defined independent of the
+    application.  Therefore, Subsection 2d requires that any
+    application-supplied function or table used by this function must
+    be optional: if the application does not supply it, the square
+    root function must still compute square roots.)
+
+These requirements apply to the modified work as a whole.  If
+identifiable sections of that work are not derived from the Library,
+and can be reasonably considered independent and separate works in
+themselves, then this License, and its terms, do not apply to those
+sections when you distribute them as separate works.  But when you
+distribute the same sections as part of a whole which is a work based
+on the Library, the distribution of the whole must be on the terms of
+this License, whose permissions for other licensees extend to the
+entire whole, and thus to each and every part regardless of who wrote
+it.
+
+Thus, it is not the intent of this section to claim rights or contest
+your rights to work written entirely by you; rather, the intent is to
+exercise the right to control the distribution of derivative or
+collective works based on the Library.
+
+In addition, mere aggregation of another work not based on the Library
+with the Library (or with a work based on the Library) on a volume of
+a storage or distribution medium does not bring the other work under
+the scope of this License.
+
+  3. You may opt to apply the terms of the ordinary GNU General Public
+License instead of this License to a given copy of the Library.  To do
+this, you must alter all the notices that refer to this License, so
+that they refer to the ordinary GNU General Public License, version 2,
+instead of to this License.  (If a newer version than version 2 of the
+ordinary GNU General Public License has appeared, then you can specify
+that version instead if you wish.)  Do not make any other change in
+these notices.
+
+  Once this change is made in a given copy, it is irreversible for
+that copy, so the ordinary GNU General Public License applies to all
+subsequent copies and derivative works made from that copy.
+
+  This option is useful when you wish to copy part of the code of
+the Library into a program that is not a library.
+
+  4. You may copy and distribute the Library (or a portion or
+derivative of it, under Section 2) in object code or executable form
+under the terms of Sections 1 and 2 above provided that you accompany
+it with the complete corresponding machine-readable source code, which
+must be distributed under the terms of Sections 1 and 2 above on a
+medium customarily used for software interchange.
+
+  If distribution of object code is made by offering access to copy
+from a designated place, then offering equivalent access to copy the
+source code from the same place satisfies the requirement to
+distribute the source code, even though third parties are not
+compelled to copy the source along with the object code.
+
+  5. A program that contains no derivative of any portion of the
+Library, but is designed to work with the Library by being compiled or
+linked with it, is called a "work that uses the Library".  Such a
+work, in isolation, is not a derivative work of the Library, and
+therefore falls outside the scope of this License.
+
+  However, linking a "work that uses the Library" with the Library
+creates an executable that is a derivative of the Library (because it
+contains portions of the Library), rather than a "work that uses the
+library".  The executable is therefore covered by this License.
+Section 6 states terms for distribution of such executables.
+
+  When a "work that uses the Library" uses material from a header file
+that is part of the Library, the object code for the work may be a
+derivative work of the Library even though the source code is not.
+Whether this is true is especially significant if the work can be
+linked without the Library, or if the work is itself a library.  The
+threshold for this to be true is not precisely defined by law.
+
+  If such an object file uses only numerical parameters, data
+structure layouts and accessors, and small macros and small inline
+functions (ten lines or less in length), then the use of the object
+file is unrestricted, regardless of whether it is legally a derivative
+work.  (Executables containing this object code plus portions of the
+Library will still fall under Section 6.)
+
+  Otherwise, if the work is a derivative of the Library, you may
+distribute the object code for the work under the terms of Section 6.
+Any executables containing that work also fall under Section 6,
+whether or not they are linked directly with the Library itself.
+
+  6. As an exception to the Sections above, you may also combine or
+link a "work that uses the Library" with the Library to produce a
+work containing portions of the Library, and distribute that work
+under terms of your choice, provided that the terms permit
+modification of the work for the customer's own use and reverse
+engineering for debugging such modifications.
+
+  You must give prominent notice with each copy of the work that the
+Library is used in it and that the Library and its use are covered by
+this License.  You must supply a copy of this License.  If the work
+during execution displays copyright notices, you must include the
+copyright notice for the Library among them, as well as a reference
+directing the user to the copy of this License.  Also, you must do one
+of these things:
+
+    a) Accompany the work with the complete corresponding
+    machine-readable source code for the Library including whatever
+    changes were used in the work (which must be distributed under
+    Sections 1 and 2 above); and, if the work is an executable linked
+    with the Library, with the complete machine-readable "work that
+    uses the Library", as object code and/or source code, so that the
+    user can modify the Library and then relink to produce a modified
+    executable containing the modified Library.  (It is understood
+    that the user who changes the contents of definitions files in the
+    Library will not necessarily be able to recompile the application
+    to use the modified definitions.)
+
+    b) Use a suitable shared library mechanism for linking with the
+    Library.  A suitable mechanism is one that (1) uses at run time a
+    copy of the library already present on the user's computer system,
+    rather than copying library functions into the executable, and (2)
+    will operate properly with a modified version of the library, if
+    the user installs one, as long as the modified version is
+    interface-compatible with the version that the work was made with.
+
+    c) Accompany the work with a written offer, valid for at
+    least three years, to give the same user the materials
+    specified in Subsection 6a, above, for a charge no more
+    than the cost of performing this distribution.
+
+    d) If distribution of the work is made by offering access to copy
+    from a designated place, offer equivalent access to copy the above
+    specified materials from the same place.
+
+    e) Verify that the user has already received a copy of these
+    materials or that you have already sent this user a copy.
+
+  For an executable, the required form of the "work that uses the
+Library" must include any data and utility programs needed for
+reproducing the executable from it.  However, as a special exception,
+the materials to be distributed need not include anything that is
+normally distributed (in either source or binary form) with the major
+components (compiler, kernel, and so on) of the operating system on
+which the executable runs, unless that component itself accompanies
+the executable.
+
+  It may happen that this requirement contradicts the license
+restrictions of other proprietary libraries that do not normally
+accompany the operating system.  Such a contradiction means you cannot
+use both them and the Library together in an executable that you
+distribute.
+
+  7. You may place library facilities that are a work based on the
+Library side-by-side in a single library together with other library
+facilities not covered by this License, and distribute such a combined
+library, provided that the separate distribution of the work based on
+the Library and of the other library facilities is otherwise
+permitted, and provided that you do these two things:
+
+    a) Accompany the combined library with a copy of the same work
+    based on the Library, uncombined with any other library
+    facilities.  This must be distributed under the terms of the
+    Sections above.
+
+    b) Give prominent notice with the combined library of the fact
+    that part of it is a work based on the Library, and explaining
+    where to find the accompanying uncombined form of the same work.
+
+  8. You may not copy, modify, sublicense, link with, or distribute
+the Library except as expressly provided under this License.  Any
+attempt otherwise to copy, modify, sublicense, link with, or
+distribute the Library is void, and will automatically terminate your
+rights under this License.  However, parties who have received copies,
+or rights, from you under this License will not have their licenses
+terminated so long as such parties remain in full compliance.
+
+  9. You are not required to accept this License, since you have not
+signed it.  However, nothing else grants you permission to modify or
+distribute the Library or its derivative works.  These actions are
+prohibited by law if you do not accept this License.  Therefore, by
+modifying or distributing the Library (or any work based on the
+Library), you indicate your acceptance of this License to do so, and
+all its terms and conditions for copying, distributing or modifying
+the Library or works based on it.
+
+  10. Each time you redistribute the Library (or any work based on the
+Library), the recipient automatically receives a license from the
+original licensor to copy, distribute, link with or modify the Library
+subject to these terms and conditions.  You may not impose any further
+restrictions on the recipients' exercise of the rights granted herein.
+You are not responsible for enforcing compliance by third parties with
+this License.
+
+  11. If, as a consequence of a court judgment or allegation of patent
+infringement or for any other reason (not limited to patent issues),
+conditions are imposed on you (whether by court order, agreement or
+otherwise) that contradict the conditions of this License, they do not
+excuse you from the conditions of this License.  If you cannot
+distribute so as to satisfy simultaneously your obligations under this
+License and any other pertinent obligations, then as a consequence you
+may not distribute the Library at all.  For example, if a patent
+license would not permit royalty-free redistribution of the Library by
+all those who receive copies directly or indirectly through you, then
+the only way you could satisfy both it and this License would be to
+refrain entirely from distribution of the Library.
+
+If any portion of this section is held invalid or unenforceable under any
+particular circumstance, the balance of the section is intended to apply,
+and the section as a whole is intended to apply in other circumstances.
+
+It is not the purpose of this section to induce you to infringe any
+patents or other property right claims or to contest validity of any
+such claims; this section has the sole purpose of protecting the
+integrity of the free software distribution system which is
+implemented by public license practices.  Many people have made
+generous contributions to the wide range of software distributed
+through that system in reliance on consistent application of that
+system; it is up to the author/donor to decide if he or she is willing
+to distribute software through any other system and a licensee cannot
+impose that choice.
+
+This section is intended to make thoroughly clear what is believed to
+be a consequence of the rest of this License.
+
+  12. If the distribution and/or use of the Library is restricted in
+certain countries either by patents or by copyrighted interfaces, the
+original copyright holder who places the Library under this License may add
+an explicit geographical distribution limitation excluding those countries,
+so that distribution is permitted only in or among countries not thus
+excluded.  In such case, this License incorporates the limitation as if
+written in the body of this License.
+
+  13. The Free Software Foundation may publish revised and/or new
+versions of the Lesser General Public License from time to time.
+Such new versions will be similar in spirit to the present version,
+but may differ in detail to address new problems or concerns.
+
+Each version is given a distinguishing version number.  If the Library
+specifies a version number of this License which applies to it and
+"any later version", you have the option of following the terms and
+conditions either of that version or of any later version published by
+the Free Software Foundation.  If the Library does not specify a
+license version number, you may choose any version ever published by
+the Free Software Foundation.
+
+  14. If you wish to incorporate parts of the Library into other free
+programs whose distribution conditions are incompatible with these,
+write to the author to ask for permission.  For software which is
+copyrighted by the Free Software Foundation, write to the Free
+Software Foundation; we sometimes make exceptions for this.  Our
+decision will be guided by the two goals of preserving the free status
+of all derivatives of our free software and of promoting the sharing
+and reuse of software generally.
+
+                            NO WARRANTY
+
+  15. BECAUSE THE LIBRARY IS LICENSED FREE OF CHARGE, THERE IS NO
+WARRANTY FOR THE LIBRARY, TO THE EXTENT PERMITTED BY APPLICABLE LAW.
+EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR
+OTHER PARTIES PROVIDE THE LIBRARY "AS IS" WITHOUT WARRANTY OF ANY
+KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+PURPOSE.  THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE
+LIBRARY IS WITH YOU.  SHOULD THE LIBRARY PROVE DEFECTIVE, YOU ASSUME
+THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
+
+  16. IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN
+WRITING WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY
+AND/OR REDISTRIBUTE THE LIBRARY AS PERMITTED ABOVE, BE LIABLE TO YOU
+FOR DAMAGES, INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR
+CONSEQUENTIAL DAMAGES ARISING OUT OF THE USE OR INABILITY TO USE THE
+LIBRARY (INCLUDING BUT NOT LIMITED TO LOSS OF DATA OR DATA BEING
+RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD PARTIES OR A
+FAILURE OF THE LIBRARY TO OPERATE WITH ANY OTHER SOFTWARE), EVEN IF
+SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
+DAMAGES.
+
+                     END OF TERMS AND CONDITIONS
+
+           How to Apply These Terms to Your New Libraries
+
+  If you develop a new library, and you want it to be of the greatest
+possible use to the public, we recommend making it free software that
+everyone can redistribute and change.  You can do so by permitting
+redistribution under these terms (or, alternatively, under the terms of the
+ordinary General Public License).
+
+  To apply these terms, attach the following notices to the library.  It is
+safest to attach them to the start of each source file to most effectively
+convey the exclusion of warranty; and each file should have at least the
+"copyright" line and a pointer to where the full notice is found.
+
+    <one line to give the library's name and a brief idea of what it does.>
+    Copyright (C) <year>  <name of author>
+
+    This library is free software; you can redistribute it and/or
+    modify it under the terms of the GNU Lesser General Public
+    License as published by the Free Software Foundation; either
+    version 2.1 of the License, or (at your option) any later version.
+
+    This library is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+    Lesser General Public License for more details.
+
+    You should have received a copy of the GNU Lesser General Public
+    License along with this library; if not, write to the Free Software
+    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+
+Also add information on how to contact you by electronic and paper mail.
+
+You should also get your employer (if you work as a programmer) or your
+school, if any, to sign a "copyright disclaimer" for the library, if
+necessary.  Here is a sample; alter the names:
+
+  Yoyodyne, Inc., hereby disclaims all copyright interest in the
+  library `Frob' (a library for tweaking knobs) written by James Random Hacker.
+
+  <signature of Ty Coon>, 1 April 1990
+  Ty Coon, President of Vice
+
+That's all there is to it!
diff --git a/aapl/README b/aapl/README
new file mode 100644
index 00000000..a2fa5e65
--- /dev/null
+++ b/aapl/README
@@ -0,0 +1,6 @@
+This directory contains the Aapl source distribution. For the
+documentation, build scripts, test programs, ChangeLog, etc. get the
+aapldev package.
+
+AaplDev and other information about Aapl are available from
+http://www.elude.ca/aapl/
diff --git a/aapl/astring.h b/aapl/astring.h
new file mode 100644
index 00000000..37cc0cc4
--- /dev/null
+++ b/aapl/astring.h
@@ -0,0 +1,808 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_ASTRING_H
+#define _AAPL_ASTRING_H
+
+#include <new>
+#include <stdlib.h>
+#include <stdarg.h>
+#include <stdio.h>
+#include <iostream>
+#include <assert.h>
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+#ifdef AAPL_DOCUMENTATION
+
+/**
+ * \defgroup astring String
+ * \brief Implicitly shared copy-on-write string.
+ * 
+ * @{
+ */
+
+/**
+ * \class String
+ * \brief Implicitly shared copy-on-write string.
+ */
+
+/*@}*/
+
+class String
+{
+public:
+	/**
+	 * \brief Create a null string. Data points to NULL.
+	 */
+	String();
+
+	/**
+	 * \brief Construct a string from a c-style string.
+	 *
+	 * A new buffer is allocated for the c string. Initially, this string will
+	 * be the only String class referencing the data.
+	 */
+	String( const char *s );
+
+	/**
+	 * \brief Construct a string from a c-style string of specific length.
+	 *
+	 * A new buffer is allocated for the c string. Initially, this string will
+	 * be the only String class referencing the data.
+	 */
+	String( const char *s, long len );
+
+	/**
+	 * \brief Construct a string from another String.
+	 *
+	 * A reference to the buffer allocated for s is taken. A new buffer is
+	 * not allocated.
+	 */
+	String( const String &s );
+
+	/**
+	 * \brief Construct a string using snprintf.
+	 *
+	 * maxLen is only an initial guess at the formatted length (not including
+	 * the trailing null). If the formatting requires more space, the buffer
+	 * is grown and the formatting repeated, so the result is not truncated.
+	 * Only the length actually written will be used by the new string. This
+	 * string will be the only String class referencing the data.
+	 */
+	String( long maxLen, const char *format, ... );
+
+	/**
+	 * \brief Clean up the string.
+	 *
+	 * If the string is not null, the referenced data is detached. If no other
+	 * string references the detached data, it is deleted.
+	 */
+	~String();
+
+	/**
+	 * \brief Set the string from a c-style string.
+	 *
+	 * If this string is not null, the current buffer is dereferenced and
+	 * possibly deleted. A new buffer is allocated (or possibly the old buffer
+	 * reused) for the string. Initially, this string will be the only String
+	 * class referencing the data.
+	 *
+	 * If s is null, then this string becomes a null ptr.
+	 *
+	 * \returns A reference to this.
+	 */
+	String &operator=( const char *s );
+
+	/**
+	 * \brief Set the string from a c-style string of specific length.
+	 *
+	 * If this string is not null, the current buffer is dereferenced and
+	 * possibly deleted. A new buffer is allocated (or possibly the old buffer
+	 * reused) for the string. Initially, this string will be the only String
+	 * class referencing the data.
+	 *
+	 * If s is null, then this string becomes a null ptr.
+	 *
+	 * Unlike operator=, nothing is returned.
+	 */
+	void setAs( const char *s, long len );
+
+	/**
+	 * \brief Set the string from a single char.
+	 *
+	 * The current buffer is dereferenced and possibly deleted. A new buffer
+	 * is allocated (or possibly the old buffer reused) for the string.
+	 * Initially, this string will be the only String class referencing the
+	 * data.
+	 *
+	 * The resulting string has length one.
+	 *
+	 * \returns A reference to this.
+	 */
+	String &operator=( const char c );
+
+
+	/**
+	 * \brief Set the string from another String.
+	 *
+	 * If this string is not null, the current buffer is dereferenced and
+	 * possibly deleted. A reference to the buffer allocated for s is taken.
+	 * A new buffer is not allocated.
+	 *
+	 * If s is null, then this string becomes a null ptr.
+	 *
+	 * \returns a reference to this.
+	 */
+	String &operator=( const String &s );
+
+	/**
+	 * \brief Append a c string to the end of this string.
+	 *
+	 * If this string shares its allocation with another, a copy is first
+	 * taken. The buffer for this string is grown and s is appended to the
+	 * end.
+	 *
+	 * If s is null nothing happens.
+	 *
+	 * \returns a reference to this.
+	 */
+	String &operator+=( const char *s );
+
+	/**
+	 * \brief Append a c string of specific length to the end of this string.
+	 *
+	 * If this string shares its allocation with another, a copy is first
+	 * taken. The buffer for this string is grown and s is appended to the
+	 * end.
+	 *
+	 * If s is null nothing happens.
+	 *
+	 * Unlike operator+=, nothing is returned.
+	 */
+	void append( const char *s, long len );
+
+	/**
+	 * \brief Append a single char to the end of this string.
+	 *
+	 * If this string shares its allocation with another, a copy is first
+	 * taken. The buffer for this string is grown and c is appended to the
+	 * end.
+	 *
+	 * \returns a reference to this.
+	 */
+	String &operator+=( const char c );
+
+	/**
+	 * \brief Append a String to the end of this string.
+	 *
+	 * If this string shares its allocation with another, a copy is first
+	 * taken. The buffer for this string is grown and the data of s is
+	 * appended to the end.
+	 *
+	 * If s is null nothing happens.
+	 *
+	 * \returns a reference to this.
+	 */
+	String &operator+=( const String &s );
+
+	/**
+	 * \brief Cast to a char star.
+	 *
+	 * \returns the string data. A null string returns 0.
+	 */
+	operator char*() const;
+
+	/**
+	 * \brief Get a pointer to the data.
+	 *
+	 * \returns the string Data
+	 */
+	char *get() const;
+
+	/**
+	 * \brief Get the length of the string
+	 *
+	 * If the string is null, the length is reported as 0.
+	 *
+	 * \returns the length of the string.
+	 */
+	long length() const;
+
+	/**
+	 * \brief Pointer to the data.
+	 *
+	 * Publicly accessible pointer to the data. Immediately in front of the
+	 * string data block is the string header which stores the refcount and
+	 * length. Consequently, care should be taken if modifying this pointer.
+	 */
+	char *data;
+};
+
+/**
+ * \relates String
+ * \brief Concatenate a c-style string and a String.
+ *
+ * \returns The concatenation of the two strings in a String.
+ */
+String operator+( const String &s1, const char *s2 );
+
+/**
+ * \relates String
+ * \brief Concatenate a String and a c-style string.
+ *
+ * \returns The concatenation of the two strings in a String.
+ */
+String operator+( const char *s1, const String &s2 );
+
+/**
+ * \relates String
+ * \brief Concatenate two String classes.
+ *
+ * \returns The concatenation of the two strings in a String.
+ */
+String operator+( const String &s1, const String &s2 );
+
+#endif 
+
+template<class T> class StrTmpl
+{
+public:
+	class Fresh {};
+
+	/* Header located just before string data. Keeps the length and a refcount on
+	 * the data. */
+	struct Head
+	{
+		long refCount;
+		long length;
+	};
+
+	/**
+	 * \brief Create a null string.
+	 */
+	StrTmpl() : data(0) { }
+
+	/* Clean up the string. */
+	~StrTmpl();
+
+	/* Construct a string from a c-style string. */
+	StrTmpl( const char *s );
+
+	/* Construct a string from a c-style string of specific len. */
+	StrTmpl( const char *s, long len );
+
+	/* Allocate space for len chars. Only the terminating null is written. */
+	StrTmpl( const Fresh &, long len );
+
+	/* Construct a string from another StrTmpl.  */
+	StrTmpl( const StrTmpl &s );
+
+	/* Construct a string using printf-style formatting. */
+	StrTmpl( long lenGuess, const char *format, ... );
+
+	/* Set the string from a c-style string. */
+	StrTmpl &operator=( const char *s );
+
+	/* Set the string from a c-style string of specific len. */
+	void setAs( const char *s, long len );
+
+	/* Make room for len chars. Only the terminating null is written. */
+	void setAs( const Fresh &, long len );
+
+	void chop( long len );
+
+	/* Set the string using printf-style formatting. */
+	void setAs( long lenGuess, const char *format, ... );
+
+	/* Set the string from a single char. */
+	StrTmpl &operator=( const char c );
+
+	/* Set the string from another StrTmpl. */
+	StrTmpl &operator=( const StrTmpl &s );
+
+	/* Append a c string to the end of this string. */
+	StrTmpl &operator+=( const char *s );
+
+	/* Append a c string of specific len to the end of this string. */
+	void append( const char *s, long len );
+
+	/* Append a single char to the end of this string. */
+	StrTmpl &operator+=( const char c );
+
+	/* Append an StrTmpl to the end of this string. */
+	StrTmpl &operator+=( const StrTmpl &s );
+
+	/* Cast to a char star. */
+	operator char*() const { return data; }
+
+	/* Get a pointer to the data. */
+	char *get() const { return data; }
+
+	/* Return the length of the string. A null data pointer gives 0. */
+	long length() const { return data ? (((Head*)data)-1)->length : 0; }
+
+	/**
+	 * \brief Pointer to the data.
+	 */
+	char *data;
+
+protected:
+	/* Make space for a string of length len to be appended. */
+	char *appendSpace( long len );
+	void initSpace( long length );
+	void setSpace( long length );
+
+ 	template <class FT> friend StrTmpl<FT> operator+( 
+			const StrTmpl<FT> &s1, const char *s2 );
+	template <class FT> friend StrTmpl<FT> operator+( 
+			const char *s1, const StrTmpl<FT> &s2 );
+	template <class FT> friend StrTmpl<FT> operator+( 
+			const StrTmpl<FT> &s1, const StrTmpl<FT> &s2 );
+
+private:
+	/* A dummy struct solely to make a constructor that will never be
+	 * ambiguous with the public constructors. */
+	struct DisAmbig { };
+	StrTmpl( char *data, const DisAmbig & ) : data(data) { }
+};
+
+/* Release this string's reference to its data, if it has any. */
+template<class T> StrTmpl<T>::~StrTmpl()
+{
+	/* A null string owns nothing. */
+	if ( data == 0 )
+		return;
+	/* Drop our reference; the last one out frees the allocation. */
+	Head *hdr = ((Head*) data) - 1;
+	if ( --hdr->refCount == 0 )
+		free( hdr );
+}
+
+/* Build a string holding a copy of the null-terminated c string s. A null s
+ * yields a null string. */
+template<class T> StrTmpl<T>::StrTmpl( const char *s )
+{
+	if ( s != 0 ) {
+		/* Allocate a private buffer sized from the source length. */
+		long srcLen = strlen( s );
+		initSpace( srcLen );
+		/* Copy the characters along with the terminating null. */
+		memcpy( data, s, srcLen+1 );
+	}
+	else {
+		/* Nothing to copy from. */
+		data = 0;
+	}
+}
+
+/* Build a string from the first length chars at s; null s gives null. */
+template<class T> StrTmpl<T>::StrTmpl( const char *s, long length )
+{
+	if ( s != 0 ) {
+		/* Allocate, copy the chars, then terminate the copy ourselves. */
+		initSpace( length );
+		memcpy( data, s, length );
+		data[length] = 0;
+	}
+	else {
+		/* Nothing to copy from. */
+		data = 0;
+	}
+}
+
+/* Allocate space for length chars. Only the terminating null is written. */
+template<class T> StrTmpl<T>::StrTmpl( const Fresh &, long length )
+{
+	/* Init space for the data. */
+	initSpace( length );
+	data[length] = 0;
+}
+
+/* Share the buffer of another string rather than copying it. */
+template<class T> StrTmpl<T>::StrTmpl( const StrTmpl &s )
+{
+	/* Point at the same data; a null source leaves us null too. */
+	data = s.data;
+
+	/* Record the extra reference in the shared header. */
+	if ( data != 0 ) {
+		Head *shared = ((Head*)data) - 1;
+		shared->refCount += 1;
+	}
+}
+
+/* Construct a string using printf-style formatting; regrows if lenGuess is short. */
+template<class T> StrTmpl<T>::StrTmpl( long lenGuess, const char *format, ... )
+{
+	/* Allocate room for the first attempt. */
+	initSpace( lenGuess );
+
+	va_list args;
+	va_start( args, format );
+	long written = vsnprintf( data, lenGuess+1, format, args );
+	va_end( args );
+	if ( written > lenGuess ) {
+		/* args is indeterminate after vsnprintf: restart it before reuse. */
+		setSpace( written );
+		va_start( args, format );
+		written = vsnprintf( data, written+1, format, args );
+		va_end( args );
+	}
+	/* vsnprintf reports errors as a negative count: yield an empty string. */
+	chop( written < 0 ? 0 : written );
+}
+
+/* Set the string using printf-style formatting; regrows if lenGuess is short. */
+template<class T> void StrTmpl<T>::setAs( long lenGuess, const char *format, ... )
+{
+	/* Make room for the first attempt. */
+	setSpace( lenGuess );
+
+	va_list args;
+	va_start( args, format );
+	long written = vsnprintf( data, lenGuess+1, format, args );
+	va_end( args );
+	if ( written > lenGuess ) {
+		/* args is indeterminate after vsnprintf: restart it before reuse. */
+		setSpace( written );
+		va_start( args, format );
+		written = vsnprintf( data, written+1, format, args );
+		va_end( args );
+	}
+	/* vsnprintf reports errors as a negative count: yield an empty string. */
+	chop( written < 0 ? 0 : written );
+}
+
+/* Allocate a fresh, unshared buffer for length chars plus the null. */
+template<class T> void StrTmpl<T>::initSpace( long length )
+{
+	/* Header and characters live in a single allocation. */
+	void *block = malloc( sizeof(Head) + length+1 );
+	if ( block == 0 )
+		throw std::bad_alloc();
+
+	/* We are the only reference so far. */
+	Head *hdr = (Head*) block;
+	hdr->length = length;
+	hdr->refCount = 1;
+	data = (char*) (hdr+1);
+}
+
+
+/* Make this string an exact copy of the c string s. The old string is
+ * discarded. A null s makes this a null string. Returns a reference to
+ * this. */
+template<class T> StrTmpl<T> &StrTmpl<T>::operator=( const char *s )
+{
+	if ( s != 0 ) {
+		/* Size the buffer from the incoming string. */
+		long srcLen = strlen( s );
+		setSpace( srcLen );
+
+		/* Copy the characters along with the terminating null. */
+		memcpy( data, s, srcLen+1 );
+		return *this;
+	}
+
+	/* Becoming null. If we hold a reference give it up, freeing the
+	 * allocation when it was the last one. */
+	if ( data != 0 ) {
+		Head *hdr = ((Head*)data) - 1;
+		if ( --hdr->refCount == 0 )
+			free( hdr );
+		data = 0;
+	}
+
+	return *this;
+}
+
+/* Make this string a copy of the first length chars at s. The old string is
+ * discarded. A null s makes this a null string. Nothing is returned. */
+template<class T> void StrTmpl<T>::setAs( const char *s, long length )
+{
+	if ( s != 0 ) {
+		/* Size the buffer for exactly length chars. */
+		setSpace( length );
+
+		/* Copy the chars, then terminate the copy ourselves. */
+		memcpy( data, s, length );
+		data[length] = 0;
+		return;
+	}
+
+	/* Becoming null. If we hold a reference give it up, freeing the
+	 * allocation when it was the last one. */
+	if ( data != 0 ) {
+		Head *hdr = ((Head*)data) - 1;
+		if ( --hdr->refCount == 0 )
+			free( hdr );
+		data = 0;
+	}
+}
+
+template<class T> void StrTmpl<T>::chop( long length )
+{
+	/* Shorten in place. Asserts sole ownership and that length fits. */
+	Head *head = ((Head*)data) - 1;
+	assert( head->refCount == 1 );
+	assert( length <= head->length );
+	head->length = length;
+	data[length] = 0;
+}
+
+/* Make room for length chars. The old string is discarded. Only the
+ * terminating null is written; nothing is returned. */
+template<class T> void StrTmpl<T>::setAs( const Fresh &, long length )
+{
+	setSpace( length );
+	data[length] = 0;
+}
+
+/* Set this string to be the single char exactly. The old string is discarded.
+ * Returns a reference to this. */
+template<class T> StrTmpl<T> &StrTmpl<T>::operator=( const char c )
+{
+	/* Set to length 1. */
+	setSpace( 1 );
+
+	/* Store the char followed by its terminating null. */
+	data[0] = c;
+	data[1] = 0;
+
+	/* Return ourselves. */
+	return *this;
+}
+
+/* Set this string to be the StrTmpl s exactly. The old string is
+ * discarded. Returns a reference to this. */
+template<class T> StrTmpl<T> &StrTmpl<T>::operator=( const StrTmpl &s )
+{
+	/* Take the new reference before releasing the old one. Doing it in this
+	 * order keeps self-assignment from freeing the buffer that is about to
+	 * be referenced. */
+	Head *srcHead = s.data != 0 ? ((Head*)s.data) - 1 : 0;
+	if ( srcHead != 0 )
+		srcHead->refCount += 1;
+
+	/* Detach from the existing string. */
+	if ( data != 0 ) {
+		Head *head = ((Head*)data) - 1;
+		head->refCount -= 1;
+		if ( head->refCount == 0 )
+			free( head );
+	}
+
+	/* Share the buffer of s. Setting from a null string nulls our
+	 * pointer. */
+	data = s.data;
+	return *this;
+}
+
+/* Prepare the string to be set to something else of the given length. */
+template<class T> void StrTmpl<T>::setSpace( long length )
+{
+	/* Locate the current header, but only when there is data to own one. */
+	Head *old = data != 0 ? ((Head*)data) - 1 : 0;
+	bool shared = old != 0 && old->refCount > 1;
+	/* A sole owner reuses its space; otherwise new space is needed. */
+	Head *head = ( old != 0 && !shared ) ?
+			(Head*) realloc( old, sizeof(Head) + length+1 ) :
+			(Head*) malloc( sizeof(Head) + length+1 );
+	if ( head == 0 )
+		throw std::bad_alloc();
+
+	/* Detach from a shared string only now that allocation has succeeded,
+	 * so a failure above leaves the reference counts untouched. */
+	if ( shared )
+		old->refCount -= 1;
+
+	/* Init the header and save the pointer to the data. */
+	head->refCount = 1;
+	head->length = length;
+	data = (char*) (head+1);
+}
+
+
+/* Append the c string s to this string. A null s is ignored. Returns a
+ * reference to this. */
+template<class T> StrTmpl<T> &StrTmpl<T>::operator+=( const char *s )
+{
+	/* Nothing to append. */
+	if ( s == 0 )
+		return *this;
+
+	/* Grow by the length of s and get the position to write at. */
+	long extra = strlen( s );
+	char *tail = appendSpace( extra );
+	/* Copy the chars in, plus one for the null. */
+	memcpy( tail, s, extra+1 );
+	return *this;
+}
+
+/* Append the first length chars at s to this string. A null s is ignored. */
+template<class T> void StrTmpl<T>::append( const char *s, long length )
+{
+	/* Nothing to append. */
+	if ( s == 0 )
+		return;
+
+	/* Grow by length and get the position to write at. */
+	char *tail = appendSpace( length );
+
+	/* Copy the chars in and terminate them ourselves. */
+	memcpy( tail, s, length );
+	tail[length] = 0;
+}
+
+/* Append a single char to the end of this string. Returns a reference to
+ * this */
+template<class T> StrTmpl<T> &StrTmpl<T>::operator+=( const char c )
+{
+	/* Grow on the end. */
+	char *dst = appendSpace( 1 );
+
+	/* Append a single character and its terminating null. */
+	dst[0] = c;
+	dst[1] = 0;
+	return *this;
+}
+
+
+/* Append an StrTmpl string to the end of this string. A null s is ignored.
+ * Returns a reference to this */
+template<class T> StrTmpl<T> &StrTmpl<T>::operator+=( const StrTmpl &s )
+{
+	if ( s.data != 0 ) {
+		/* Find the length to append and make space on the end for it. */
+		long addedLen = (((Head*)s.data) - 1)->length;
+		char *dest = appendSpace( addedLen );
+
+		/* Copy only the chars and write the null separately. When s is this
+		 * string, s.data now names the regrown buffer and its old null
+		 * sits at dest, so copying addedLen+1 bytes would overlap. */
+		memcpy( dest, s.data, addedLen );
+		dest[addedLen] = 0;
+	}
+	return *this;
+}
+
+/* Make space for a string of length len to be appended. */
+template<class T> char *StrTmpl<T>::appendSpace( long len )
+{
+	/* A null string has no header to read: appending to it is the same as
+	 * allocating fresh space for len characters. */
+	if ( data == 0 ) {
+		initSpace( len );
+		return data;
+	}
+
+	/* Find the length of this and the string appended. */
+	Head *head = (((Head*)data) - 1);
+	long thisLen = head->length;
+
+	if ( head->refCount == 1 ) {
+		/* No other string is using the space, grow this space. */
+		head = (Head*) realloc( head, sizeof(Head) + thisLen + len + 1 );
+		if ( head == 0 )
+			throw std::bad_alloc();
+		data = (char*) (head+1);
+		head->length += len;
+	}
+	else {
+		/* Another string is using this space, make new space. The shared
+		 * reference is dropped only once the allocation has succeeded. */
+		Head *newHead = (Head*) malloc( sizeof(Head) + thisLen + len + 1 );
+		if ( newHead == 0 )
+			throw std::bad_alloc();
+		head->refCount -= 1;
+		newHead->refCount = 1;
+		newHead->length = thisLen + len;
+		data = (char*) (newHead+1);
+		memcpy( data, head+1, thisLen );
+	}
+	return data + thisLen;
+}
+
+/* Concatenate a String and a c-style string into a new String. */
+template<class T> StrTmpl<T> operator+( const StrTmpl<T> &s1, const char *s2 )
+{
+	typedef typename StrTmpl<T>::Head Head;
+
+	/* Lengths of both operands; s1 keeps its length in its header. */
+	const long leftLen = (((Head*)(s1.data)) - 1)->length;
+	const long rightLen = strlen( s2 );
+
+	/* One allocation holds the header, the chars and the null. */
+	Head *hdr = (Head*) malloc( sizeof(Head) + leftLen + rightLen + 1 );
+	if ( hdr == 0 )
+		throw std::bad_alloc();
+	hdr->refCount = 1;
+	hdr->length = leftLen + rightLen;
+
+	/* Lay the operands end to end; the null comes along with s2. */
+	char *buf = (char*) (hdr+1);
+	memcpy( buf, s1.data, leftLen );
+	memcpy( buf + leftLen, s2, rightLen + 1 );
+	return StrTmpl<T>( buf, typename StrTmpl<T>::DisAmbig() );
+}
+
+/* Concatenate a c-style string and a String into a new String. */
+template<class T> StrTmpl<T> operator+( const char *s1, const StrTmpl<T> &s2 )
+{
+	typedef typename StrTmpl<T>::Head Head;
+
+	/* Lengths of both operands; s2 keeps its length in its header. */
+	const long leftLen = strlen( s1 );
+	const long rightLen = (((Head*)(s2.data)) - 1)->length;
+
+	/* One allocation holds the header, the chars and the null. */
+	Head *hdr = (Head*) malloc( sizeof(Head) + leftLen + rightLen + 1 );
+	if ( hdr == 0 )
+		throw std::bad_alloc();
+	hdr->refCount = 1;
+	hdr->length = leftLen + rightLen;
+
+	/* Lay the operands end to end; the null comes along with s2. */
+	char *buf = (char*) (hdr+1);
+	memcpy( buf, s1, leftLen );
+	memcpy( buf + leftLen, s2.data, rightLen + 1 );
+	return StrTmpl<T>( buf, typename StrTmpl<T>::DisAmbig() );
+}
+
+/* Concatenate two StrTmpl strings into a new one. */
+template<class T> StrTmpl<T> operator+( const StrTmpl<T> &s1, const StrTmpl<T> &s2 )
+{
+	typedef typename StrTmpl<T>::Head Head;
+	/* Both operands keep their length in the header before their data. */
+	const long leftLen = (((Head*)(s1.data)) - 1)->length;
+	const long rightLen = (((Head*)(s2.data)) - 1)->length;
+
+	/* One allocation holds the header, the chars and the null. */
+	Head *hdr = (Head*) malloc( sizeof(Head) + leftLen + rightLen + 1 );
+	if ( hdr == 0 )
+		throw std::bad_alloc();
+	hdr->refCount = 1;
+	hdr->length = leftLen + rightLen;
+
+	/* Lay the operands end to end; the null comes along with s2. */
+	char *buf = (char*) (hdr+1);
+	memcpy( buf, s1.data, leftLen );
+	memcpy( buf + leftLen, s2.data, rightLen + 1 );
+	return StrTmpl<T>( buf, typename StrTmpl<T>::DisAmbig() );
+}
+
+/* Write length() chars of the string to o, for compilers lacking the conversion. */
+template <class T> inline std::ostream &operator<<( std::ostream &o, const StrTmpl<T> &s )
+{
+	return o.write( s.data, s.length() );
+}
+
+typedef StrTmpl<char> String;
+
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_ASTRING_H */
diff --git a/aapl/avlbasic.h b/aapl/avlbasic.h
new file mode 100644
index 00000000..780ef07a
--- /dev/null
+++ b/aapl/avlbasic.h
@@ -0,0 +1,65 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLBASIC_H
+#define _AAPL_AVLBASIC_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avltree 
+ * @{
+ */
+
+/**
+ * \class AvlBasic
+ * \brief AVL Tree in which the entire element structure is the key.
+ *
+ * AvlBasic is an AVL tree that does not distinguish between the element that
+ * it contains and the key. The entire element structure is the key that is
+ * used to compare the relative ordering of elements. This is similar to the
+ * BstSet structure.
+ *
+ * AvlBasic does not assume ownership of elements in the tree. Items must be
+ * explicitly de-allocated.
+ */
+
+/*@}*/
+
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define AVLMEL_CLASSDEF class Element, class Compare
+#define AVLMEL_TEMPDEF class Element, class Compare
+#define AVLMEL_TEMPUSE Element, Compare
+#define AvlTree AvlBasic
+#define AVL_BASIC
+
+#include "avlcommon.h"
+
+#undef BASE_EL
+#undef BASEKEY
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef AVL_BASIC
+
+#endif /* _AAPL_AVLBASIC_H */
diff --git a/aapl/avlcommon.h b/aapl/avlcommon.h
new file mode 100644
index 00000000..fca4ea4f
--- /dev/null
+++ b/aapl/avlcommon.h
@@ -0,0 +1,1630 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+/* This header is not wrapped in ifndef because it is not intended to
+ * be included by the user. */
+
+#include <assert.h>
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+#ifdef WALKABLE
+/* This is used by AvlTree, AvlMel and AvlMelKey so it
+ * must be protected by global ifdefs. */
+#ifndef __AAPL_AVLI_EL__
+#define __AAPL_AVLI_EL__
+
+/**
+ * \brief Tree element properties for linked AVL trees.
+ *
+ * AvliTreeEl needs to be inherited by classes that are intended to be
+ * elements in an AvliTree.
+ */
+template<class SubClassEl> struct AvliTreeEl 
+{
+	/**
+	 * \brief Tree pointers connecting elements in a tree.
+	 */
+	SubClassEl *left, *right, *parent;
+
+	/**
+	 * \brief Linked list pointers.
+	 */
+	SubClassEl *prev, *next;
+
+	/**
+	 * \brief Height of the tree rooted at this element.
+	 *
+	 * Height is required by the AVL balancing algorithm.
+	 */
+	long height;
+};
+#endif /* __AAPL_AVLI_EL__ */
+
+#else /* not WALKABLE */
+
+/* This is used by All the non walkable trees so it must be
+ * protected by a global ifdef. */
+#ifndef __AAPL_AVL_EL__
+#define __AAPL_AVL_EL__
+/**
+ * \brief Tree element properties for AVL trees without list links.
+ *
+ * AvlTreeEl needs to be inherited by classes that are intended to be
+ * elements in an AvlTree.
+ */
+template<class SubClassEl> struct AvlTreeEl
+{
+	/**
+	 * \brief Tree pointers connecting elements in a tree.
+	 */
+	SubClassEl *left, *right, *parent;
+
+	/**
+	 * \brief Height of the tree rooted at this element.
+	 *
+	 * Height is required by the AVL balancing algorithm.
+	 */
+	long height;
+};
+#endif /* __AAPL_AVL_EL__ */
+#endif /* def WALKABLE */
+
+
+#if defined( AVLTREE_MAP )
+
+#ifdef WALKABLE
+
+/**
+ * \brief Tree element for AvliMap
+ *
+ * Stores the key and value pair. The key-only constructor does not set value.
+ */
+template <class Key, class Value> struct AvliMapEl :
+		public AvliTreeEl< AvliMapEl<Key, Value> >
+{
+	AvliMapEl(const Key &key) 
+		: key(key) { }
+	AvliMapEl(const Key &key, const Value &value) 
+		: key(key), value(value) { }
+
+	const Key &getKey() const { return key; }
+
+	/** \brief The key. */
+	Key key;
+
+	/** \brief The value. */
+	Value value;
+};
+#else /* not WALKABLE */
+
+/**
+ * \brief Tree element for AvlMap
+ *
+ * Stores the key and value pair. The key-only constructor does not set value.
+ */
+template <class Key, class Value> struct AvlMapEl :
+		public AvlTreeEl< AvlMapEl<Key, Value> >
+{
+	AvlMapEl(const Key &key) 
+		: key(key) { }
+	AvlMapEl(const Key &key, const Value &value) 
+		: key(key), value(value) { }
+
+	const Key &getKey() const { return key; }
+
+	/** \brief The key. */
+	Key key;
+
+	/** \brief The value. */
+	Value value;
+};
+#endif /* def WALKABLE */
+
+#elif defined( AVLTREE_SET )
+
+#ifdef WALKABLE
+/**
+ * \brief Tree element for AvliSet
+ *
+ * Stores the key, which is copied in at construction.
+ */
+template <class Key> struct AvliSetEl :
+		public AvliTreeEl< AvliSetEl<Key> >
+{
+	AvliSetEl(const Key &key) : key(key) { }
+
+	const Key &getKey() const { return key; }
+
+	/** \brief The key. */
+	Key key;
+};
+#else /* not WALKABLE */
+/**
+ * \brief Tree element for AvlSet
+ *
+ * Stores the key, which is copied in at construction.
+ */
+template <class Key> struct AvlSetEl :
+		public AvlTreeEl< AvlSetEl<Key> >
+{
+	AvlSetEl(const Key &key) : key(key) { }
+
+	const Key &getKey() const { return key; }
+
+	/** \brief The key. */
+	Key key;
+};
+#endif /* def WALKABLE */
+
+#endif /* AVLTREE_SET */
+
+/* Common AvlTree Class */
+template < AVLMEL_CLASSDEF > class AvlTree
+#if !defined( AVL_KEYLESS ) && defined ( WALKABLE )
+		: public Compare, public BASELIST
+#elif !defined( AVL_KEYLESS )
+		: public Compare
+#elif defined( WALKABLE )
+		: public BASELIST
+#endif
+{
+public:
+	/**
+	 * \brief Create an empty tree.
+	 */
+#ifdef WALKABLE
+	AvlTree() : root(0), treeSize(0) { }
+#else
+	AvlTree() : root(0), head(0), tail(0), treeSize(0) { }
+#endif
+
+	/** 
+	 * \brief Perform a deep copy of the tree. 
+	 *
+	 * Each element is duplicated for the new tree. Copy constructors are used
+	 * to create the new elements.
+	 */
+	AvlTree(const AvlTree &other);
+
+#if defined( AVLTREE_MAP ) || defined( AVLTREE_SET )
+	/**
+	 * \brief Clear the contents of the tree.
+	 *
+	 * All element are deleted.
+	 */
+	~AvlTree() { empty(); }
+
+	/** 
+	 * \brief Perform a deep copy of the tree. 
+	 *
+	 * Each element is duplicated for the new tree. Copy constructors are used
+	 * to create the new element. If this tree contains items, they are first
+	 * deleted.
+	 *
+	 * \returns A reference to this.
+	 */
+	AvlTree &operator=( const AvlTree &tree );
+
+	/**
+	 * \brief Transfer the elements of another tree into this.
+	 *
+	 * First deletes all elements in this tree.
+	 */
+	void transfer( AvlTree &tree );
+#else
+	/**
+	 * \brief Abandon all elements in the tree. 
+	 *
+	 * Tree elements are not deleted.
+	 */
+	~AvlTree() {}
+
+	/**
+	 * \brief Perform a deep copy of the tree.
+	 *
+	 * Each element is duplicated for the new tree. Copy constructors are used
+	 * to create the new element. If this tree contains items, they are
+	 * abandoned.
+	 *
+	 * \returns A reference to this.
+	 */
+	AvlTree &operator=( const AvlTree &tree );
+
+	/**
+	 * \brief Transfer the elements of another tree into this.
+	 *
+	 * All elements in this tree are abandoned first.
+	 */
+	void transfer( AvlTree &tree );
+#endif
+
+#ifndef AVL_KEYLESS
+	/* Insert a element into the tree. */
+	Element *insert( Element *element, Element **lastFound = 0 );
+
+#ifdef AVL_BASIC
+	/* Find a element in the tree. Returns the element if 
+	 * element exists, false otherwise. */
+	Element *find( const Element *element ) const;
+
+#else
+	Element *insert( const Key &key, Element **lastFound = 0 );
+
+#ifdef AVLTREE_MAP
+	Element *insert( const Key &key, const Value &val,
+			Element **lastFound = 0 );
+#endif
+
+	/* Find a element in the tree. Returns the element if 
+	 * key exists, false otherwise. */
+	Element *find( const Key &key ) const;
+
+	/* Detach a element from the tree. */
+	Element *detach( const Key &key );
+
+	/* Detach and delete a element from the tree. */
+	bool remove( const Key &key );
+#endif /* AVL_BASIC */
+#endif /* AVL_KEYLESS */
+
+	/* Detach a element from the tree. */
+	Element *detach( Element *element );
+
+	/* Detach and delete a element from the tree. */
+	void remove( Element *element );
+
+	/* Free all memory used by tree. */
+	void empty();
+
+	/* Abandon all element in the tree. Does not delete element. */
+	void abandon();
+
+	/** Root element of the tree. */
+	Element *root;
+
+#ifndef WALKABLE
+	Element *head, *tail;
+#endif
+
+	/** The number of element in the tree. */
+	long treeSize;
+
+	/** \brief Return the number of elements in the tree. */
+	long length() const         { return treeSize; }
+
+	/** \brief Return the number of elements in the tree. */
+	long size() const           { return treeSize; }
+
+	/* Various classes for setting the iterator */
+	struct Iter;
+	struct IterFirst { IterFirst( const AvlTree &t ) : t(t) { } const AvlTree &t; };
+	struct IterLast { IterLast( const AvlTree &t ) : t(t) { } const AvlTree &t; };
+	struct IterNext { IterNext( const Iter &i ) : i(i) { } const Iter &i; };
+	struct IterPrev { IterPrev( const Iter &i ) : i(i) { } const Iter &i; };
+
+#ifdef WALKABLE
+	/**
+	 * \brief Avl Tree Iterator. This version follows the elements' next/prev links.
+	 * \ingroup iterators
+	 */
+	struct Iter
+	{
+		/* Default construct. The iterator starts out pointing at nothing. */
+		Iter() : ptr(0) { }
+
+		/* Construct from an avl tree (starts at head) or an iterator-setting class. */
+		Iter( const AvlTree &t ) : ptr(t.head) { }
+		Iter( const IterFirst &af ) : ptr(af.t.head) { }
+		Iter( const IterLast &al ) : ptr(al.t.tail) { }
+		Iter( const IterNext &an ) : ptr(findNext(an.i.ptr)) { }
+		Iter( const IterPrev &ap ) : ptr(findPrev(ap.i.ptr)) { }
+		
+		/* Assign from a tree (starts at head) or an iterator-setting class. */
+		Iter &operator=( const AvlTree &tree ) { ptr = tree.head; return *this; }
+		Iter &operator=( const IterFirst &af ) { ptr = af.t.head; return *this; }
+		Iter &operator=( const IterLast &al )  { ptr = al.t.tail; return *this; }
+		Iter &operator=( const IterNext &an )  { ptr = findNext(an.i.ptr); return *this; }
+		Iter &operator=( const IterPrev &ap )  { ptr = findPrev(ap.i.ptr); return *this; }
+
+		/** \brief Less than end? True while the iterator points at an element. */
+		bool lte() const { return ptr != 0; }
+
+		/** \brief At end? True once the iterator no longer points at an element. */
+		bool end() const { return ptr == 0; }
+
+		/** \brief Greater than beginning? True while the iterator points at an element. */
+		bool gtb() const { return ptr != 0; }
+
+		/** \brief At beginning? True once the iterator no longer points at an element. */
+		bool beg() const { return ptr == 0; }
+
+		/** \brief At first element? True if pointing at an element with no previous one. */
+		bool first() const { return ptr && ptr->BASE_EL(prev) == 0; }
+
+		/** \brief At last element? True if pointing at an element with no next one. */
+		bool last() const { return ptr && ptr->BASE_EL(next) == 0; }
+
+		/** \brief Implicit cast to Element*. */
+		operator Element*() const      { return ptr; }
+
+		/** \brief Dereference operator returns Element&. The iterator must not be null. */
+		Element &operator *() const    { return *ptr; }
+
+		/** \brief Arrow operator returns Element*. */
+		Element *operator->() const    { return ptr; }
+
+		/** \brief Move to next item. Returns the new position. */
+		inline Element *operator++();
+
+		/** \brief Move to next item. Returns the position before the move. */
+		inline Element *operator++(int);
+
+		/** \brief Move to next item. Returns the new position. */
+		inline Element *increment();
+
+		/** \brief Move to previous item. Returns the new position. */
+		inline Element *operator--();
+
+		/** \brief Move to previous item. Returns the position before the move. */
+		inline Element *operator--(int);
+
+		/** \brief Move to previous item. Returns the new position. */
+		inline Element *decrement();
+
+		/** \brief Return an IterNext wrapping this iterator. Does not modify this. */
+		IterNext next() const { return IterNext( *this ); }
+
+		/** \brief Return an IterPrev wrapping this iterator. Does not modify this. */
+		IterPrev prev() const { return IterPrev( *this ); }
+
+	private:
+		static Element *findPrev( Element *element ) { return element->BASE_EL(prev); }
+		static Element *findNext( Element *element ) { return element->BASE_EL(next); }
+
+	public:
+
+		/** \brief The iterator is simply a pointer to the current element. */
+		Element *ptr;
+	};
+
+#else
+
+	/**
+	 * \brief Avl Tree Iterator. This version moves by walking the tree links.
+	 * \ingroup iterators
+	 */
+	struct Iter
+	{
+		/* Default construct. The iterator points at nothing and has no tree. */
+		Iter() : ptr(0), tree(0) { }
+
+		/* Construct from a tree (starts at head) or an iterator-setting class. */
+		Iter( const AvlTree &t ) : ptr(t.head), tree(&t) { }
+		Iter( const IterFirst &af ) : ptr(af.t.head), tree(&af.t) { }
+		Iter( const IterLast &al ) : ptr(al.t.tail), tree(&al.t) { }
+		Iter( const IterNext &an ) : ptr(findNext(an.i.ptr)), tree(an.i.tree) { }
+		Iter( const IterPrev &ap ) : ptr(findPrev(ap.i.ptr)), tree(ap.i.tree) { }
+		
+		/* Assign from a tree (starts at head) or an iterator-setting class. */
+		Iter &operator=( const AvlTree &t )    
+				{ ptr = t.head; tree = &t; return *this; }
+		Iter &operator=( const IterFirst &af ) 
+				{ ptr = af.t.head; tree = &af.t; return *this; }
+		Iter &operator=( const IterLast &al )  
+				{ ptr = al.t.tail; tree = &al.t; return *this; }
+		Iter &operator=( const IterNext &an )  
+				{ ptr = findNext(an.i.ptr); tree = an.i.tree; return *this; }
+		Iter &operator=( const IterPrev &ap )  
+				{ ptr = findPrev(ap.i.ptr); tree = ap.i.tree; return *this; }
+
+		/** \brief Less than end? True while the iterator points at an element. */
+		bool lte() const { return ptr != 0; }
+
+		/** \brief At end? True once the iterator no longer points at an element. */
+		bool end() const { return ptr == 0; }
+
+		/** \brief Greater than beginning? True while the iterator points at an element. */
+		bool gtb() const { return ptr != 0; }
+
+		/** \brief At beginning? True once the iterator no longer points at an element. */
+		bool beg() const { return ptr == 0; }
+
+		/** \brief At first element? True if pointing at the tree's head. */
+		bool first() const { return ptr && ptr == tree->head; }
+
+		/** \brief At last element? True if pointing at the tree's tail. */
+		bool last() const { return ptr && ptr == tree->tail; }
+
+		/** \brief Implicit cast to Element*. */
+		operator Element*() const      { return ptr; }
+
+		/** \brief Dereference operator returns Element&. The iterator must not be null. */
+		Element &operator *() const    { return *ptr; }
+
+		/** \brief Arrow operator returns Element*. */
+		Element *operator->() const    { return ptr; }
+
+		/** \brief Move to next item. Returns the new position. */
+		inline Element *operator++();
+
+		/** \brief Move to next item. Returns the position before the move. */
+		inline Element *operator++(int);
+
+		/** \brief Move to next item. Returns the new position. */
+		inline Element *increment();
+
+		/** \brief Move to previous item. Returns the new position. */
+		inline Element *operator--();
+
+		/** \brief Move to previous item. Returns the position before the move. */
+		inline Element *operator--(int);
+
+		/** \brief Move to previous item. Returns the new position. */
+		inline Element *decrement();
+
+		/** \brief Return an IterNext wrapping this iterator. Does not modify this. */
+		IterNext next() const { return IterNext( *this ); }
+
+		/** \brief Return an IterPrev wrapping this iterator. Does not modify this. */
+		IterPrev prev() const { return IterPrev( *this ); }
+
+	private:
+		static Element *findPrev( Element *element );
+		static Element *findNext( Element *element );
+
+	public:
+		/** \brief Pointer to the current element, null when off either end. */
+		Element *ptr;
+
+		/* The list is not walkable so we need to keep a pointer to the tree
+		 * so we can test against head and tail in O(1) time. */
+		const AvlTree *tree;
+	};
+#endif
+
+	/** \brief Return an IterFirst for this tree; an Iter set from it starts at head. */
+	IterFirst first()  { return IterFirst( *this ); }
+
+	/** \brief Return an IterLast for this tree; an Iter set from it starts at tail. */
+	IterLast last()    { return IterLast( *this ); }
+
+protected:
+	/* Recursive worker for the copy constructor. */
+	Element *copyBranch( Element *element );
+
+	/* Recursively delete element in the tree. */
+	void deleteChildrenOf(Element *n);
+
+	/* rebalance the tree beginning at the leaf whose 
+	 * grandparent is unbalanced. */
+	Element *rebalance(Element *start);
+
+	/* Move up the tree from a given element, recalculating the heights. */
+	void recalcHeights(Element *start);
+
+	/* Move up the tree and find the first element whose 
+	 * grand-parent is unbalanced. */
+	Element *findFirstUnbalGP(Element *start);
+
+	/* Move up the tree and find the first element which is unbalanced. */
+	Element *findFirstUnbalEl(Element *start);
+
+	/* Replace a element in the tree with another element not in the tree. */
+	void replaceEl(Element *element, Element *replacement);
+
+	/* Remove a element from the tree and put another (normally a child of element)
+	 * in its place. */
+	void removeEl(Element *element, Element *filler);
+
+	/* Once an insertion point is found at a leaf then do the insert. */
+	void attachRebal( Element *element, Element *parentEl, Element *lastLess );
+};
+
+/* Copy constructor. Deep copy: a new element is allocated for each item. */
+template <AVLMEL_TEMPDEF> AvlTree<AVLMEL_TEMPUSE>::
+		AvlTree(const AvlTree<AVLMEL_TEMPUSE> &other)
+#if !defined( AVL_KEYLESS ) && defined ( WALKABLE )
+	/* The list base starts out empty; copyBranch links each new
+	 * element into it as the copy proceeds. */
+	: Compare( other ), BASELIST()
+#elif !defined( AVL_KEYLESS )
+	: Compare( other )
+#elif defined( WALKABLE )
+	: BASELIST( )
+#endif
+{
+#ifndef WALKABLE
+	/* copyBranch sets head and tail while it walks the source tree. */
+	head = 0;
+	tail = 0;
+#endif
+
+	/* An empty source leaves a null root, otherwise duplicate its branches. */
+	treeSize = other.treeSize;
+	root = 0;
+	if ( other.root != 0 )
+		root = copyBranch( other.root );
+}
+
+#if defined( AVLTREE_MAP ) || defined( AVLTREE_SET )
+
+/* Assignment does deep copy. Assigning a tree to itself is a no-op. */
+template <AVLMEL_TEMPDEF> AvlTree<AVLMEL_TEMPUSE> &AvlTree<AVLMEL_TEMPUSE>::
+	operator=( const AvlTree &other )
+{
+	/* Emptying this tree would destroy the elements we are about to copy. */
+	if ( this == &other )
+		return *this;
+
+	/* Clear the tree first. */
+	empty();
+
+	/* Reset the list pointers, the tree copy will fill in the list for us. */
+#ifdef WALKABLE
+	BASELIST::abandon();
+#else
+	head = tail = 0;
+#endif
+	/* Copy the entire tree; an empty source leaves a null root. */
+	treeSize = other.treeSize;
+	root = other.root != 0 ? copyBranch( other.root ) : 0;
+	return *this;
+}
+
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		transfer(AvlTree<AVLMEL_TEMPUSE> &other)
+{
+	/* Delete whatever elements this tree currently holds. */
+	empty();
+
+	/* Take over the ordered-list bookkeeping of the source tree. */
+#ifdef WALKABLE
+	BASELIST::listLen = other.BASELIST::listLen;
+	BASELIST::tail = other.BASELIST::tail;
+	BASELIST::head = other.BASELIST::head;
+#else
+	tail = other.tail;
+	head = other.head;
+#endif
+	/* Take over the tree itself, then make the source forget everything. */
+	root = other.root;
+	treeSize = other.treeSize;
+	other.abandon();
+}
+
+#else /* ! AVLTREE_MAP && ! AVLTREE_SET */
+
+/* Deep-copy assignment. The elements already in this tree are not deleted. */
+template <AVLMEL_TEMPDEF> AvlTree<AVLMEL_TEMPUSE> &AvlTree<AVLMEL_TEMPUSE>::
+	operator=( const AvlTree &other )
+{
+	/* Forget the old element list, copyBranch rebuilds it during the copy. */
+#ifdef WALKABLE
+	BASELIST::abandon();
+#else
+	head = tail = 0;
+#endif
+
+	/* Duplicate the source tree; an empty source leaves a null root. */
+	treeSize = other.treeSize;
+	if ( other.root == 0 )
+		root = 0;
+	else
+		root = copyBranch( other.root );
+	return *this;
+}
+
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		transfer(AvlTree<AVLMEL_TEMPUSE> &other)
+{
+	/* Adopt the source's list bookkeeping. Nothing already here is deleted. */
+#ifdef WALKABLE
+	BASELIST::listLen = other.BASELIST::listLen;
+	BASELIST::tail = other.BASELIST::tail;
+	BASELIST::head = other.BASELIST::head;
+#else
+	tail = other.tail;
+	head = other.head;
+#endif
+	/* Adopt the tree itself, then make the source forget everything. */
+	root = other.root;
+	treeSize = other.treeSize;
+	other.abandon();
+}
+
+#endif
+
+/*
+ * Iterator operators.
+ */
+
+/* Prefix ++: step to the next element and return the new position. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::operator++()
+{
+	ptr = findNext( ptr );
+	return ptr;
+}
+
+/* Postfix ++: step to the next element, return the position held before. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::
+		operator++(int)
+{
+	Element *before = ptr;
+	ptr = findNext( before );
+	return before;
+}
+
+/* increment: step to the next element and return the new position. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::increment()
+{
+	ptr = findNext( ptr );
+	return ptr;
+}
+
+/* Prefix --: step to the previous element and return the new position. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::operator--()
+{
+	ptr = findPrev( ptr );
+	return ptr;
+}
+
+/* Postfix --: step to the previous element, return the position held before. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::
+		operator--(int)
+{
+	Element *before = ptr;
+	ptr = findPrev( before );
+	return before;
+}
+
+/* decrement: step to the previous element and return the new position. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::decrement()
+{
+	ptr = findPrev( ptr );
+	return ptr;
+}
+
+#ifndef WALKABLE
+
+/* In-order successor of element, or null if element is the last one. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::
+		findNext( Element *element )
+{
+	Element *child;
+
+	/* With a right subtree the successor is its leftmost element. */
+	if ( element->BASE_EL(right) != 0 ) {
+		element = element->BASE_EL(right);
+		while ( element->BASE_EL(left) != 0 )
+			element = element->BASE_EL(left);
+		return element;
+	}
+
+	/* Otherwise climb until we step up out of a left subtree. */
+	do {
+		child = element;
+		element = element->BASE_EL(parent);
+	} while ( element != 0 && element->BASE_EL(left) != child );
+	return element;
+}
+
+/* In-order predecessor of element, or null if element is the first one. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::Iter::
+		findPrev( Element *element )
+{
+	Element *child;
+
+	/* With a left subtree the predecessor is its rightmost element. */
+	if ( element->BASE_EL(left) != 0 ) {
+		element = element->BASE_EL(left);
+		while ( element->BASE_EL(right) != 0 )
+			element = element->BASE_EL(right);
+		return element;
+	}
+
+	/* Otherwise climb until we step up out of a right subtree. */
+	do {
+		child = element;
+		element = element->BASE_EL(parent);
+	} while ( element != 0 && element->BASE_EL(right) != child );
+	return element;
+}
+
+#endif
+
+
+/* Recursive worker for tree copying. Returns the root of the new branch. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		copyBranch( Element *element )
+{
+	/* Duplicate the element. NOTE(review): the copy's left and right pointers
+	 * are read below as the source's children, so the element's copy
+	 * constructor is presumably expected to carry them over -- confirm. */
+	Element *copy = new Element(*element);
+
+	/* Copy the left subtree first so elements are appended left to right. */
+	if ( copy->BASE_EL(left) != 0 ) {
+		copy->BASE_EL(left) = copyBranch( copy->BASE_EL(left) );
+		copy->BASE_EL(left)->BASE_EL(parent) = copy;
+	}
+
+#ifdef WALKABLE
+	BASELIST::addAfter( BASELIST::tail, copy );
+#else
+	tail = copy;
+	if ( head == 0 )
+		head = copy;
+#endif
+
+	/* Then copy the right subtree, if there is one. */
+	if ( copy->BASE_EL(right) != 0 ) {
+		copy->BASE_EL(right) = copyBranch( copy->BASE_EL(right) );
+		copy->BASE_EL(right)->BASE_EL(parent) = copy;
+	}
+	return copy;
+}
+
+/* Attach element under parentEl (null when it becomes the root), then rebalance. */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		attachRebal( Element *element, Element *parentEl, Element *lastLess )
+{
+	/* Increment the number of elements in the tree. */
+	treeSize += 1;
+
+	/* Set element's parent. */
+	element->BASE_EL(parent) = parentEl;
+
+	/* New element always starts as a leaf with height 1. */
+	element->BASE_EL(left) = 0;
+	element->BASE_EL(right) = 0;
+	element->BASE_EL(height) = 1;
+
+	/* Are we inserting in the tree somewhere? */
+	if ( parentEl != 0 ) {
+		/* We have a parent so we are somewhere in the tree. If the parent
+		 * equals lastLess, then the last traversal in the insertion went
+		 * left, otherwise it went right. */
+		if ( lastLess == parentEl ) {
+			parentEl->BASE_EL(left) = element;
+#ifdef WALKABLE
+			BASELIST::addBefore( parentEl, element );
+#endif
+		}
+		else {
+			parentEl->BASE_EL(right) = element;
+#ifdef WALKABLE
+			BASELIST::addAfter( parentEl, element );
+#endif
+		}
+
+#ifndef WALKABLE
+		/* If the old head just gained a left child, that child is the new head. */
+		if ( head->BASE_EL(left) == element )
+			head = element;
+
+		/* If the old tail just gained a right child, that child is the new tail. */
+		if ( tail->BASE_EL(right) == element )
+			tail = element;
+#endif
+	}
+	else {
+		/* No parent element so we are inserting the root. */
+		root = element;
+#ifdef WALKABLE
+		BASELIST::addAfter( BASELIST::tail, element );
+#else
+		head = tail = element;
+#endif
+	}
+
+
+	/* Recalculate the heights, starting at the parent and moving up. */
+	recalcHeights(parentEl);
+
+	/* Find the first element, going up, whose grandparent is unbalanced. */
+	Element *ub = findFirstUnbalGP(element);
+
+	/* Rebalance, if an unbalanced grandparent was found. */
+	if ( ub != 0 )
+	{
+		/* We assert that after this single rotation the 
+		 * tree is now properly balanced. */
+		rebalance(ub);
+	}
+}
+
+#ifndef AVL_KEYLESS
+
+/**
+ * \brief Insert an existing element into the tree.
+ *
+ * On success the element is attached and, if lastFound is given, lastFound is
+ * set to it. On failure (an element with the same key is already present)
+ * lastFound, if given, is set to that existing element. The element's avl
+ * pointers are overwritten, so it must not already be part of a tree.
+ *
+ * \returns The element inserted upon success, null upon failure.
+ */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		insert( Element *element, Element **lastFound )
+{
+	Element *node = root;
+	Element *attachTo = 0;
+	Element *wentLeftAt = 0;
+
+	/* Descend until we fall off the tree or hit an equal key. */
+	while ( node != 0 ) {
+		/* Order the new element against the one we are standing on. */
+#ifdef AVL_BASIC
+		long keyRelation = compare( *element, *node );
+#else
+		long keyRelation = compare( element->BASEKEY(getKey()),
+				node->BASEKEY(getKey()) );
+#endif
+
+		if ( keyRelation == 0 ) {
+			/* The key is already present; report the holder and fail. */
+			if ( lastFound != 0 )
+				*lastFound = node;
+			return 0;
+		}
+
+		/* Remember the parent, and separately the last left turn. */
+		attachTo = node;
+		if ( keyRelation < 0 ) {
+			wentLeftAt = node;
+			node = node->BASE_EL(left);
+		}
+		else {
+			node = node->BASE_EL(right);
+		}
+	}
+
+	/* We are at an external element and did not find the key we were
+	 * looking for. Attach underneath the leaf and rebalance. */
+	attachRebal( element, attachTo, wentLeftAt );
+
+	if ( lastFound != 0 )
+		*lastFound = element;
+	return element;
+}
+
+#ifdef AVL_BASIC
+
+/**
+ * \brief Find the element in the tree that compares equal to the given one.
+ *
+ * \returns The matching element, or null if there is none.
+ */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		find( const Element *element ) const
+{
+	Element *node = root;
+
+	while ( node != 0 ) {
+		long keyRelation = compare( *element, *node );
+
+		/* Equal means we have hit the target. */
+		if ( keyRelation == 0 )
+			break;
+
+		/* Smaller keys live to the left, larger ones to the right. */
+		if ( keyRelation < 0 )
+			node = node->BASE_EL(left);
+		else
+			node = node->BASE_EL(right);
+	}
+
+	/* Null here means we ran off the tree without a match. */
+	return node;
+}
+
+#else
+
+/**
+ * \brief Insert a new element into the tree with the given key.
+ *
+ * If the key is not already in the tree then a new element is made using the
+ * Element(const Key &key) constructor and attached. If lastFound is given
+ * it is set to the new element.
+ *
+ * If the key is already present nothing is allocated and lastFound, if
+ * given, is set to the existing element that has the same key.
+ *
+ * \returns The new element upon success, null upon failure.
+ */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		insert( const Key &key, Element **lastFound )
+{
+	Element *node = root;
+	Element *attachTo = 0;
+	Element *wentLeftAt = 0;
+
+	/* Descend until we fall off the tree or hit an equal key. */
+	while ( node != 0 ) {
+		long keyRelation = compare( key, node->BASEKEY(getKey()) );
+
+		if ( keyRelation == 0 ) {
+			/* The key is already present; report the holder and fail. */
+			if ( lastFound != 0 )
+				*lastFound = node;
+			return 0;
+		}
+
+		/* Remember the parent, and separately the last left turn. */
+		attachTo = node;
+		if ( keyRelation < 0 ) {
+			wentLeftAt = node;
+			node = node->BASE_EL(left);
+		}
+		else {
+			node = node->BASE_EL(right);
+		}
+	}
+
+	/* We are at an external element and did not find the key we were
+	 * looking for. Create the new element, attach it underneath the leaf
+	 * and rebalance. */
+	Element *element = new Element( key );
+	attachRebal( element, attachTo, wentLeftAt );
+
+	if ( lastFound != 0 )
+		*lastFound = element;
+	return element;
+}
+
+#ifdef AVLTREE_MAP
+/**
+ * \brief Insert a new element into the tree with key and value.
+ *
+ * If the key is not already in the tree then a new element is constructed
+ * from key and val and attached. If lastFound is given then it is set to the
+ * element inserted. If the key is already present nothing is allocated and
+ * lastFound, if given, is set to the existing element that has the same key.
+ * This insert routine is only compiled when AVLTREE_MAP is defined, because
+ * only then is a Value type known.
+ *
+ * \returns The new element upon success, null upon failure.
+ */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		insert( const Key &key, const Value &val, Element **lastFound )
+{
+	Element *node = root;
+	Element *attachTo = 0;
+	Element *wentLeftAt = 0;
+
+	/* Descend until we fall off the tree or hit an equal key. */
+	while ( node != 0 ) {
+		/* Read the key through BASEKEY, as the other insert and find do. */
+		long keyRelation = compare( key, node->BASEKEY(getKey()) );
+
+		if ( keyRelation == 0 ) {
+			/* The key is already present; report the holder and fail. */
+			if ( lastFound != 0 )
+				*lastFound = node;
+			return 0;
+		}
+
+		/* Remember the parent, and separately the last left turn. */
+		attachTo = node;
+		if ( keyRelation < 0 ) {
+			wentLeftAt = node;
+			node = node->BASE_EL(left);
+		}
+		else {
+			node = node->BASE_EL(right);
+		}
+	}
+
+	/* We are at an external element and did not find the key we were
+	 * looking for. Create the new element, attach it underneath the leaf
+	 * and rebalance. */
+	Element *element = new Element( key, val );
+	attachRebal( element, attachTo, wentLeftAt );
+
+	if ( lastFound != 0 )
+		*lastFound = element;
+	return element;
+}
+#endif /* AVLTREE_MAP */
+
+
+/**
+ * \brief Find the element in the tree that has the given key.
+ *
+ * \returns The element if key exists, null if the key does not exist.
+ */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		find( const Key &key ) const
+{
+	Element *node = root;
+
+	while ( node != 0 ) {
+		long keyRelation = compare( key, node->BASEKEY(getKey()) );
+
+		/* Equal means we have hit the target. */
+		if ( keyRelation == 0 )
+			break;
+
+		/* Smaller keys live to the left, larger ones to the right. */
+		if ( keyRelation < 0 )
+			node = node->BASE_EL(left);
+		else
+			node = node->BASE_EL(right);
+	}
+
+	/* Null here means we ran off the tree without a match. */
+	return node;
+}
+
+
+/**
+ * \brief Find an element by key, then detach it from the tree.
+ *
+ * The element is not deleted.
+ *
+ * \returns The element detached if the key is found, otherwise returns null.
+ */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		detach(const Key &key)
+{
+	Element *found = find( key );
+	if ( found == 0 )
+		return 0;
+
+	detach( found );
+	return found;
+}
+
+/**
+ * \brief Find, detach and delete an element from the tree.
+ *
+ * The element is unlinked from the tree before it is deleted.
+ *
+ * \returns True if the element was found and deleted, false otherwise.
+ */
+template <AVLMEL_TEMPDEF> bool AvlTree<AVLMEL_TEMPUSE>::
+		remove(const Key &key)
+{
+	/* Look for the key. */
+	Element *found = find( key );
+
+	/* Nothing to remove if the key is absent. */
+	if ( found == 0 )
+		return false;
+
+	/* Unlink the element from the tree and release it. */
+	detach( found );
+	delete found;
+	return true;
+}
+
+#endif /* AVL_BASIC */
+#endif /* AVL_KEYLESS */
+
+
+/**
+ * \brief Detach and delete an element from the tree.
+ *
+ * If the element is not in the tree then undefined behaviour results.
+ */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		remove(Element *element)
+{
+	/* detach() hands back the element it was given once it is unlinked,
+	 * so the result can be deleted directly. */
+	delete detach( element );
+}
+
+/**
+ * \brief Detach an element from the tree. The element is not deleted.
+ *
+ * If the element is not in the tree then undefined behaviour results.
+ *
+ * \returns The element given.
+ */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		detach(Element *element)
+{
+	Element *replacement, *fixfrom;
+	long lheight, rheight;
+
+#ifdef WALKABLE
+	/* Remove the element from the ordered list. */
+	BASELIST::detach( element );
+#endif
+	
+	/* Update treeSize. */
+	treeSize--;
+
+	/* Find a replacement element. */
+	if (element->BASE_EL(right))
+	{
+		/* Find the leftmost element of the right subtree. */
+		replacement = element->BASE_EL(right);
+		while (replacement->BASE_EL(left))
+			replacement = replacement->BASE_EL(left);
+
+		/* If replacing the element with its child then we need to start
+		 * fixing at the replacement, otherwise we start fixing at the
+		 * parent of the replacement. */
+		if (replacement->BASE_EL(parent) == element)
+			fixfrom = replacement;
+		else
+			fixfrom = replacement->BASE_EL(parent);
+
+#ifndef WALKABLE
+		if ( element == head )
+			head = replacement;
+#endif
+
+		removeEl(replacement, replacement->BASE_EL(right));
+		replaceEl(element, replacement);
+	}
+	else if (element->BASE_EL(left))
+	{
+		/* Find the rightmost element of the left subtree. */
+		replacement = element->BASE_EL(left);
+		while (replacement->BASE_EL(right))
+			replacement = replacement->BASE_EL(right);
+
+		/* If replacing the element with its child then we need to start
+		 * fixing at the replacement, otherwise we start fixing at the
+		 * parent of the replacement. */
+		if (replacement->BASE_EL(parent) == element)
+			fixfrom = replacement;
+		else
+			fixfrom = replacement->BASE_EL(parent);
+
+#ifndef WALKABLE
+		if ( element == tail )
+			tail = replacement;
+#endif
+
+		removeEl(replacement, replacement->BASE_EL(left));
+		replaceEl(element, replacement);
+	}
+	else
+	{
+		/* We need to start fixing at the parent of the element. */
+		fixfrom = element->BASE_EL(parent);
+
+#ifndef WALKABLE
+		if ( element == head )
+			head = element->BASE_EL(parent);
+		if ( element == tail )
+			tail = element->BASE_EL(parent);
+#endif
+
+		/* The element we are deleting is a leaf element. */
+		removeEl(element, 0);
+	}
+
+	/* If fixfrom is null it means we just deleted
+	 * the root of the tree. */
+	if ( fixfrom == 0 )
+		return element;
+
+	/* Fix the heights after the deletion. */
+	recalcHeights(fixfrom);
+
+	/* Fix every unbalanced element going up in the tree. */
+	Element *ub = findFirstUnbalEl(fixfrom);
+	while ( ub )
+	{
+		/* Find the element to rebalance by moving down from the first unbalanced
+		 * element 2 levels in the direction of the greatest heights. On the
+		 * second move down, the heights may be equal ( but not on the first ).
+		 * In which case go in the direction of the first move. */
+		lheight = ub->BASE_EL(left) ? ub->BASE_EL(left)->BASE_EL(height) : 0;
+		rheight = ub->BASE_EL(right) ? ub->BASE_EL(right)->BASE_EL(height) : 0;
+		assert( lheight != rheight );
+		if (rheight > lheight)
+		{
+			ub = ub->BASE_EL(right);
+			lheight = ub->BASE_EL(left) ?
+					ub->BASE_EL(left)->BASE_EL(height) : 0;
+			rheight = ub->BASE_EL(right) ? 
+					ub->BASE_EL(right)->BASE_EL(height) : 0;
+			if (rheight > lheight)
+				ub = ub->BASE_EL(right);
+			else if (rheight < lheight)
+				ub = ub->BASE_EL(left);
+			else
+				ub = ub->BASE_EL(right);
+		}
+		else
+		{
+			ub = ub->BASE_EL(left);
+			lheight = ub->BASE_EL(left) ? 
+					ub->BASE_EL(left)->BASE_EL(height) : 0;
+			rheight = ub->BASE_EL(right) ? 
+					ub->BASE_EL(right)->BASE_EL(height) : 0;
+			if (rheight > lheight)
+				ub = ub->BASE_EL(right);
+			else if (rheight < lheight)
+				ub = ub->BASE_EL(left);
+			else
+				ub = ub->BASE_EL(left);
+		}
+
+
+		/* rebalance returns the parent of the subtree formed
+		 * by the elements that were rebalanced.
+		 * We must continue upward from there rebalancing. */
+		fixfrom = rebalance(ub);
+
+		/* Find the next unbalanced element. */
+		ub = findFirstUnbalEl(fixfrom);
+	}
+
+	return element;
+}
+
+
+/**
+ * \brief Empty the tree and delete all the elements. Resets the tree to
+ * its initial state (no root, zero size, no first or last element).
+ */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::empty()
+{
+	if ( root ) {
+		/* Recursively delete the descendants, then the root itself. */
+		deleteChildrenOf(root);
+		delete root;
+		root = 0;
+		treeSize = 0;
+#ifdef WALKABLE
+		BASELIST::abandon();
+#else
+		head = tail = 0;
+#endif
+	}
+}
+
+/**
+ * \brief Forget all elements in the tree. Does not delete the elements.
+ * Resets the tree to its initial state (no root, zero size, no first/last).
+ */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::abandon()
+{
+	root = 0;
+	treeSize = 0;
+#ifdef WALKABLE
+	BASELIST::abandon();
+#else
+	head = tail = 0;
+#endif
+}
+
+/* Recursively delete all descendants of element; element itself is kept. */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		deleteChildrenOf( Element *element )
+{
+	/* Recurse left. */
+	if (element->BASE_EL(left)) {
+		deleteChildrenOf(element->BASE_EL(left));
+
+		/* Delete left element and clear the link to it. */
+		delete element->BASE_EL(left);
+		element->BASE_EL(left) = 0;
+	}
+
+	/* Recurse right. */
+	if (element->BASE_EL(right)) {
+		deleteChildrenOf(element->BASE_EL(right));
+
+		/* Delete right element and clear the link to it. */
+		delete element->BASE_EL(right);
+		element->BASE_EL(right) = 0;
+	}
+}
+
+/* Rebalance from an element whose grandparent is unbalanced. Only call on an
+ * element that has a grandparent. Returns the rebalanced subtree's parent. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		rebalance(Element *n)
+{
+	long lheight, rheight;
+	Element *a, *b, *c;
+	Element *t1, *t2, *t3, *t4;
+
+	Element *p = n->BASE_EL(parent);      /* parent (Non-NULL). */
+	Element *gp = p->BASE_EL(parent);     /* Grand-parent (Non-NULL). */
+	Element *ggp = gp->BASE_EL(parent);   /* Great grand-parent (may be NULL). */
+
+	if (gp->BASE_EL(right) == p)
+	{
+		/*  gp
+		 *   \
+		 *    p
+		 */
+		if (p->BASE_EL(right) == n)
+		{
+			/*  gp
+			 *   \
+			 *    p
+			 *     \
+			 *      n
+			 */
+			a = gp;
+			b = p;
+			c = n;
+			t1 = gp->BASE_EL(left);
+			t2 = p->BASE_EL(left);
+			t3 = n->BASE_EL(left);
+			t4 = n->BASE_EL(right);
+		}
+		else
+		{
+			/*  gp
+			 *     \
+			 *       p
+			 *      /
+			 *     n
+			 */
+			a = gp;
+			b = n;
+			c = p;
+			t1 = gp->BASE_EL(left);
+			t2 = n->BASE_EL(left);
+			t3 = n->BASE_EL(right);
+			t4 = p->BASE_EL(right);
+		}
+	}
+	else
+	{
+		/*    gp
+		 *   /
+		 *  p
+		 */
+		if (p->BASE_EL(right) == n)
+		{
+			/*      gp
+			 *    /
+			 *  p
+			 *   \
+			 *    n
+			 */
+			a = p;
+			b = n;
+			c = gp;
+			t1 = p->BASE_EL(left);
+			t2 = n->BASE_EL(left);
+			t3 = n->BASE_EL(right);
+			t4 = gp->BASE_EL(right);
+		}
+		else
+		{
+			/*      gp
+			 *     /
+			 *    p
+			 *   /
+			 *  n
+			 */
+			a = n;
+			b = p;
+			c = gp;
+			t1 = n->BASE_EL(left);
+			t2 = n->BASE_EL(right);
+			t3 = p->BASE_EL(right);
+			t4 = gp->BASE_EL(right);
+		}
+	}
+
+	/* Perform rotation: b becomes the subtree root with children a and c,
+	 * and t1..t4 are re-attached below a and c in left-to-right order. */
+
+	/* Tie b to the great grandparent. */
+	if ( ggp == 0 )
+		root = b;
+	else if ( ggp->BASE_EL(left) == gp )
+		ggp->BASE_EL(left) = b;
+	else
+		ggp->BASE_EL(right) = b;
+	b->BASE_EL(parent) = ggp;
+
+	/* Tie a as a leftchild of b. */
+	b->BASE_EL(left) = a;
+	a->BASE_EL(parent) = b;
+
+	/* Tie c as a rightchild of b. */
+	b->BASE_EL(right) = c;
+	c->BASE_EL(parent) = b;
+
+	/* Tie t1 as a leftchild of a. */
+	a->BASE_EL(left) = t1;
+	if ( t1 != 0 ) t1->BASE_EL(parent) = a;
+
+	/* Tie t2 as a rightchild of a. */
+	a->BASE_EL(right) = t2;
+	if ( t2 != 0 ) t2->BASE_EL(parent) = a;
+
+	/* Tie t3 as a leftchild of c. */
+	c->BASE_EL(left) = t3;
+	if ( t3 != 0 ) t3->BASE_EL(parent) = c;
+
+	/* Tie t4 as a rightchild of c. */
+	c->BASE_EL(right) = t4;
+	if ( t4 != 0 ) t4->BASE_EL(parent) = c;
+
+	/* The heights are all recalculated manually and the great
+	 * grand-parent is passed to recalcHeights() to ensure
+	 * the heights are correct up the tree.
+	 *
+	 * Note that recalcHeights() cuts out when it comes across
+	 * a height that hasn't changed.
+	 */
+
+	/* Fix height of a. */
+	lheight = a->BASE_EL(left) ? a->BASE_EL(left)->BASE_EL(height) : 0;
+	rheight = a->BASE_EL(right) ? a->BASE_EL(right)->BASE_EL(height) : 0;
+	a->BASE_EL(height) = (lheight > rheight ? lheight : rheight) + 1;
+
+	/* Fix height of c. */
+	lheight = c->BASE_EL(left) ? c->BASE_EL(left)->BASE_EL(height) : 0;
+	rheight = c->BASE_EL(right) ? c->BASE_EL(right)->BASE_EL(height) : 0;
+	c->BASE_EL(height) = (lheight > rheight ? lheight : rheight) + 1;
+
+	/* Fix height of b, whose children are now a and c. */
+	lheight = a->BASE_EL(height);
+	rheight = c->BASE_EL(height);
+	b->BASE_EL(height) = (lheight > rheight ? lheight : rheight) + 1;
+
+	/* Fix height of b's parents. */
+	recalcHeights(ggp);
+	return ggp;
+}
+
+/* Recalculates the height of element and then of each ancestor in turn. */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		recalcHeights(Element *element)
+{
+	for ( ; element != 0; element = element->BASE_EL(parent) )
+	{
+		Element *lchild = element->BASE_EL(left);
+		Element *rchild = element->BASE_EL(right);
+		long lheight = lchild != 0 ? lchild->BASE_EL(height) : 0;
+		long rheight = rchild != 0 ? rchild->BASE_EL(height) : 0;
+
+		/* One more than the taller of the two subtrees. */
+		long taller = lheight > rheight ? lheight : rheight;
+		long newHeight = taller + 1;
+
+		/* If there is no change in the height, then there will be no
+		 * change in any of the ancestors' heights. We can stop going up.
+		 * If there was a change, store it and continue upward. */
+		if ( newHeight == element->BASE_EL(height) )
+			return;
+		element->BASE_EL(height) = newHeight;
+	}
+}
+
+/* Finds the first element, walking upward, whose grandparent is unbalanced. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		findFirstUnbalGP(Element *element)
+{
+	/* Don't do anything if we have no parent or no grandparent. */
+	if ( element == 0 || element->BASE_EL(parent) == 0 )
+		return 0;
+
+	Element *gp = element->BASE_EL(parent)->BASE_EL(parent);
+	for ( ; gp != 0; gp = gp->BASE_EL(parent) )
+	{
+		Element *lchild = gp->BASE_EL(left);
+		Element *rchild = gp->BASE_EL(right);
+		long lheight = lchild != 0 ? lchild->BASE_EL(height) : 0;
+		long rheight = rchild != 0 ? rchild->BASE_EL(height) : 0;
+
+		/* Subtree heights differing by more than one mean gp is unbalanced. */
+		long balanceProp = lheight - rheight;
+		if ( balanceProp < -1 || balanceProp > 1 )
+			return element;
+
+		/* Keep element two levels below gp as both move up. */
+		element = element->BASE_EL(parent);
+	}
+	/* Reached the top without finding an unbalanced grandparent. */
+	return 0;
+}
+
+
+/* Finds the first element that is unbalanced, starting at the given element
+ * and moving up through its ancestors. Returns null if all are balanced. */
+template <AVLMEL_TEMPDEF> Element *AvlTree<AVLMEL_TEMPUSE>::
+		findFirstUnbalEl(Element *element)
+{
+	/* A null starting point simply skips the loop. */
+	for ( ; element != 0; element = element->BASE_EL(parent) )
+	{
+		Element *lchild = element->BASE_EL(left);
+		Element *rchild = element->BASE_EL(right);
+		long lheight = lchild != 0 ? lchild->BASE_EL(height) : 0;
+		long rheight = rchild != 0 ? rchild->BASE_EL(height) : 0;
+
+		/* Unbalanced means the subtree heights differ by more than one. */
+		long balanceProp = lheight - rheight;
+		if ( balanceProp < -1 || balanceProp > 1 )
+			break;
+	}
+
+	/* Either the unbalanced element, or null if we ran past the root. */
+	return element;
+}
+
+/* Put replacement, which is not in the tree, where element currently is. */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		replaceEl(Element *element, Element *replacement)
+{
+	Element *above = element->BASE_EL(parent);
+	Element *lchild = element->BASE_EL(left);
+	Element *rchild = element->BASE_EL(right);
+
+	/* Hand both of element's subtrees over to the replacement. */
+	replacement->BASE_EL(left) = lchild;
+	if ( lchild != 0 )
+		lchild->BASE_EL(parent) = replacement;
+	replacement->BASE_EL(right) = rchild;
+	if ( rchild != 0 )
+		rchild->BASE_EL(parent) = replacement;
+
+	/* Hook the replacement in underneath element's parent, or as the root. */
+	replacement->BASE_EL(parent) = above;
+	if ( above == 0 )
+		root = replacement;
+	else if ( above->BASE_EL(left) == element )
+		above->BASE_EL(left) = replacement;
+	else
+		above->BASE_EL(right) = replacement;
+
+	/* The replacement sits at element's position, so it takes its height. */
+	replacement->BASE_EL(height) = element->BASE_EL(height);
+}
+
+/* Unlinks element from the tree and puts filler in its place.
+ * Filler should be null or a child of element. */
+template <AVLMEL_TEMPDEF> void AvlTree<AVLMEL_TEMPUSE>::
+		removeEl(Element *element, Element *filler)
+{
+	Element *above = element->BASE_EL(parent);
+
+	/* Redirect whichever link led to element so that it leads to filler:
+	 * the root pointer when element has no parent, otherwise the parent's
+	 * left or right pointer. Element's own pointers are left untouched. */
+	if ( above == 0 )
+		root = filler;
+	else if ( above->BASE_EL(left) == element )
+		above->BASE_EL(left) = filler;
+	else
+		above->BASE_EL(right) = filler;
+
+	/* A non-null filler now hangs off element's former parent. */
+	if ( filler != 0 )
+		filler->BASE_EL(parent) = above;
+
+	return;
+}
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
diff --git a/aapl/avlibasic.h b/aapl/avlibasic.h
new file mode 100644
index 00000000..a48faaa8
--- /dev/null
+++ b/aapl/avlibasic.h
@@ -0,0 +1,67 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLIBASIC_H
+#define _AAPL_AVLIBASIC_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avlitree 
+ * @{
+ */
+
+/**
+ * \class AvliBasic
+ * \brief Linked AVL Tree in which the entire element structure is the key.
+ *
+ * AvliBasic is a linked AVL tree that does not distinguish between the
+ * element that it contains and the key. The entire element structure is the
+ * key that is used to compare the relative ordering of elements. This is
+ * similar to the BstSet structure.
+ *
+ * AvliBasic does not assume ownership of elements in the tree. Items must be
+ * explicitly de-allocated.
+ */
+
+/*@}*/
+/* Configure avlcommon.h so that including it produces the AvliBasic tree. */
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define AVLMEL_CLASSDEF class Element, class Compare
+#define AVLMEL_TEMPDEF class Element, class Compare
+#define AVLMEL_TEMPUSE Element, Compare
+#define AvlTree AvliBasic
+#define AVL_BASIC
+#define WALKABLE
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASEKEY
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef AVL_BASIC
+#undef WALKABLE
+
+#endif /* _AAPL_AVLIBASIC_H */
diff --git a/aapl/avlikeyless.h b/aapl/avlikeyless.h
new file mode 100644
index 00000000..559b75af
--- /dev/null
+++ b/aapl/avlikeyless.h
@@ -0,0 +1,64 @@
+/*
+ *  Copyright 2002, 2003 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLIKEYLESS_H
+#define _AAPL_AVLIKEYLESS_H
+
+#include "compare.h"
+#include "dlistmel.h"
+
+/**
+ * \addtogroup avlitree
+ * @{
+ */
+
+/**
+ * \class AvliKeyless
+ * \brief Linked AVL tree that has no insert/find/remove functions that take a
+ * key.
+ *
+ * AvliKeyless is an implementation of the AVL tree rebalancing functionality
+ * only. It provides the common code for the tiny AVL tree implementations.
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvliKeyless; Element is the only parameter. */
+#define BASE_EL(name) name
+#define BASELIST DListMel< Element, AvliTreeEl<Element> >
+#define AVLMEL_CLASSDEF class Element
+#define AVLMEL_TEMPDEF class Element
+#define AVLMEL_TEMPUSE Element
+#define AvlTree AvliKeyless
+#define WALKABLE
+#define AVL_KEYLESS
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASELIST
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef WALKABLE
+#undef AVL_KEYLESS
+
+#endif /* _AAPL_AVLIKEYLESS_H */
diff --git a/aapl/avlimap.h b/aapl/avlimap.h
new file mode 100644
index 00000000..38bfff75
--- /dev/null
+++ b/aapl/avlimap.h
@@ -0,0 +1,77 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLIMAP_H
+#define _AAPL_AVLIMAP_H
+
+#include "compare.h"
+#include "dlist.h"
+
+/**
+ * \addtogroup avlitree 
+ * @{
+ */
+
+/**
+ * \class AvliMap
+ * \brief Linked key and value oriented AVL tree. 
+ *
+ * AvliMap stores key and value pairs in elements that are managed by the
+ * tree. It is intended to be similar to the map template found in the STL.
+ * AvliMap requires that a Key type, a Value type, and a class containing a
+ * compare() routine for Key be given. Items can be inserted with just a key
+ * or with a key and value pair.
+ *
+ * AvliMap assumes all elements in the tree are allocated on the heap and are
+ * to be managed by the tree. This means that the class destructor will delete
+ * the contents of the tree. A deep copy will cause existing elements to be
+ * deleted first.
+ *
+ * \include ex_avlimap.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvliMap; Element becomes AvliMapEl<Key,Value>. */
+#define AVLTREE_MAP
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define BASELIST DList< AvliMapEl<Key,Value> >
+#define AVLMEL_CLASSDEF class Key, class Value, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Key, class Value, class Compare
+#define AVLMEL_TEMPUSE Key, Value, Compare
+#define AvlTree AvliMap
+#define Element AvliMapEl<Key,Value>
+#define WALKABLE
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef AVLTREE_MAP
+#undef BASE_EL
+#undef BASEKEY
+#undef BASELIST
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef Element
+#undef WALKABLE
+
+#endif /* _AAPL_AVLIMAP_H */
diff --git a/aapl/avlimel.h b/aapl/avlimel.h
new file mode 100644
index 00000000..9442a997
--- /dev/null
+++ b/aapl/avlimel.h
@@ -0,0 +1,79 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLIMEL_H
+#define _AAPL_AVLIMEL_H
+
+#include "compare.h"
+#include "dlistmel.h"
+
+/**
+ * \addtogroup avlitree 
+ * @{
+ */
+
+/**
+ * \class AvliMel
+ * \brief Linked AVL tree for elements appearing in multiple trees.
+ *
+ * AvliMel allows for an element to simultaneously be in multiple trees without
+ * the trees interfering with one another. For each tree that the element is
+ * to appear in, there must be a distinct set of AVL Tree management data that
+ * can be unambiguously referenced with some base class name. This name
+ * is passed to the tree as a template parameter and is used in the tree
+ * algorithms.
+ *
+ * The element must use the same key type and value in each tree that it
+ * appears in. If distinct keys are required, the AvliMelKey structure is
+ * available.
+ *
+ * AvliMel does not assume ownership of elements in the tree. The destructor
+ * will not delete the elements. If the user wishes to explicitly deallocate
+ * all the items in the tree the empty() routine is available. 
+ *
+ * \include ex_avlimel.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvliMel; tree members are reached via BaseEl::. */
+#define BASE_EL(name) BaseEl::name
+#define BASEKEY(name) name
+#define BASELIST DListMel< Element, BaseEl >
+#define AVLMEL_CLASSDEF class Element, class Key, \
+		class BaseEl, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Element, class Key, \
+		class BaseEl, class Compare
+#define AVLMEL_TEMPUSE Element, Key, BaseEl, Compare
+#define AvlTree AvliMel
+#define WALKABLE
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASEKEY
+#undef BASELIST
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef WALKABLE
+
+#endif /* _AAPL_AVLIMEL_H */
diff --git a/aapl/avlimelkey.h b/aapl/avlimelkey.h
new file mode 100644
index 00000000..faa56e83
--- /dev/null
+++ b/aapl/avlimelkey.h
@@ -0,0 +1,76 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLIMELKEY_H
+#define _AAPL_AVLIMELKEY_H
+
+#include "compare.h"
+#include "dlistmel.h"
+
+/**
+ * \addtogroup avlitree 
+ * @{
+ */
+
+/**
+ * \class AvliMelKey
+ * \brief Linked AVL tree for elements appearing in multiple trees with different keys.
+ *
+ * AvliMelKey is similar to AvliMel, except that an additional template
+ * parameter, BaseKey, is provided for resolving ambiguous references to
+ * getKey(). This means that if an element is stored in multiple trees, each
+ * tree can use a different key for ordering the elements in it. Using
+ * AvliMelKey an array of data structures can be indexed with an O(log(n))
+ * search on two or more of the values contained within it and without
+ * allocating any additional data.
+ *
+ * AvliMelKey does not assume ownership of elements in the tree. The destructor
+ * will not delete the elements. If the user wishes to explicitly deallocate
+ * all the items in the tree the empty() routine is available. 
+ *
+ * \include ex_avlimelkey.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvliMelKey; BaseEl:: and BaseKey:: qualify names. */
+#define BASE_EL(name) BaseEl::name
+#define BASEKEY(name) BaseKey::name
+#define BASELIST DListMel< Element, BaseEl >
+#define AVLMEL_CLASSDEF class Element, class Key, class BaseEl, \
+		class BaseKey, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Element, class Key, class BaseEl, \
+		class BaseKey, class Compare
+#define AVLMEL_TEMPUSE Element, Key, BaseEl, BaseKey, Compare
+#define AvlTree AvliMelKey
+#define WALKABLE
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASEKEY
+#undef BASELIST
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef WALKABLE
+
+#endif /* _AAPL_AVLIMELKEY_H */
diff --git a/aapl/avliset.h b/aapl/avliset.h
new file mode 100644
index 00000000..cf5be365
--- /dev/null
+++ b/aapl/avliset.h
@@ -0,0 +1,75 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLISET_H
+#define _AAPL_AVLISET_H
+
+#include "compare.h"
+#include "dlist.h"
+
+/**
+ * \addtogroup avlitree 
+ * @{
+ */
+
+/**
+ * \class AvliSet
+ * \brief Linked Key-only oriented tree.
+ *
+ * AvliSet stores only keys in elements that are managed by the tree. AvliSet
+ * requires that a Key type and a class containing a compare() routine
+ * for Key be given. Items are inserted with just a key value.
+ *
+ * AvliSet assumes all elements in the tree are allocated on the heap and are
+ * to be managed by the tree. This means that the class destructor will delete
+ * the contents of the tree. A deep copy will cause existing elements to be
+ * deleted first.
+ *
+ * \include ex_avliset.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvliSet; Element becomes AvliSetEl<Key>. */
+#define AVLTREE_SET
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define BASELIST DList< AvliSetEl<Key> >
+#define AVLMEL_CLASSDEF class Key, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Key, class Compare
+#define AVLMEL_TEMPUSE Key, Compare
+#define AvlTree AvliSet
+#define Element AvliSetEl<Key>
+#define WALKABLE
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef AVLTREE_SET
+#undef BASE_EL
+#undef BASEKEY
+#undef BASELIST
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef Element
+#undef WALKABLE
+
+#endif /* _AAPL_AVLISET_H */
diff --git a/aapl/avlitree.h b/aapl/avlitree.h
new file mode 100644
index 00000000..b053c96f
--- /dev/null
+++ b/aapl/avlitree.h
@@ -0,0 +1,78 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLITREE_H
+#define _AAPL_AVLITREE_H
+
+#include "compare.h"
+#include "dlistmel.h"
+
+/**
+ * \addtogroup avlitree
+ * @{
+ */
+
+/**
+ * \class AvliTree
+ * \brief Linked AVL tree.
+ *
+ * AvliTree is the standard linked by-structure AVL tree. To use this
+ * structure the user must define an element type and give it the necessary
+ * properties. At the very least it must have a getKey() function that will be
+ * used to compare the relative ordering of elements and tree management data
+ * necessary for the AVL algorithm. An element type can acquire the management
+ * data by inheriting the AvliTreeEl class.
+ *
+ * AvliTree does not presume to manage the allocation of elements in the tree.
+ * The destructor will not delete the items in the tree, instead the elements
+ * must be explicitly de-allocated by the user if necessary and when it is
+ * safe to do so. The empty() routine will traverse the tree and delete all
+ * items. 
+ *
+ * Since the tree does not manage the elements, it can contain elements that
+ * are allocated statically or that are part of another data structure.
+ *
+ * \include ex_avlitree.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvliTree over Element, Key and Compare. */
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define BASELIST DListMel< Element, AvliTreeEl<Element> >
+#define AVLMEL_CLASSDEF class Element, class Key, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Element, class Key, class Compare
+#define AVLMEL_TEMPUSE Element, Key, Compare
+#define AvlTree AvliTree
+#define WALKABLE
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASEKEY
+#undef BASELIST
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef WALKABLE
+
+#endif /* _AAPL_AVLITREE_H */
diff --git a/aapl/avlkeyless.h b/aapl/avlkeyless.h
new file mode 100644
index 00000000..30805136
--- /dev/null
+++ b/aapl/avlkeyless.h
@@ -0,0 +1,58 @@
+/*
+ *  Copyright 2002, 2003 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLKEYLESS_H
+#define _AAPL_AVLKEYLESS_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avltree 
+ * @{
+ */
+
+/**
+ * \class AvlKeyless
+ * \brief AVL tree that has no insert/find/remove functions that take a key.
+ *
+ * AvlKeyless is an implementation of the AVL tree rebalancing functionality
+ * only. It provides the common code for the tiny AVL tree implementations.
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvlKeyless; Element is the only parameter. */
+#define BASE_EL(name) name
+#define AVLMEL_CLASSDEF class Element
+#define AVLMEL_TEMPDEF class Element
+#define AVLMEL_TEMPUSE Element
+#define AvlTree AvlKeyless
+#define AVL_KEYLESS
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef AVL_KEYLESS
+
+#endif /* _AAPL_AVLKEYLESS_H */
diff --git a/aapl/avlmap.h b/aapl/avlmap.h
new file mode 100644
index 00000000..e4e15662
--- /dev/null
+++ b/aapl/avlmap.h
@@ -0,0 +1,74 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLMAP_H
+#define _AAPL_AVLMAP_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avltree 
+ * @{
+ */
+
+/**
+ * \class AvlMap
+ * \brief Key and value oriented AVL tree. 
+ *
+ * AvlMap stores key and value pairs in elements that are managed by the
+ * tree. It is intended to be similar to the map template found in the STL.
+ * AvlMap requires that a Key type, a Value type, and a class containing a
+ * compare() routine for Key be given. Items can be inserted with just a key
+ * or with a key and value pair.
+ *
+ * AvlMap assumes all elements in the tree are allocated on the heap and are
+ * to be managed by the tree. This means that the class destructor will delete
+ * the contents of the tree. A deep copy will cause existing elements to be
+ * deleted first.
+ *
+ * \include ex_avlmap.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvlMap; Element becomes AvlMapEl<Key,Value>. */
+#define AVLTREE_MAP
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define AVLMEL_CLASSDEF class Key, class Value, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Key, class Value, class Compare
+#define AVLMEL_TEMPUSE Key, Value, Compare
+#define AvlTree AvlMap
+#define Element AvlMapEl<Key,Value>
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef AVLTREE_MAP
+#undef BASE_EL
+#undef BASEKEY
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef Element
+
+
+
+#endif /* _AAPL_AVLMAP_H */
diff --git a/aapl/avlmel.h b/aapl/avlmel.h
new file mode 100644
index 00000000..7bfad3b7
--- /dev/null
+++ b/aapl/avlmel.h
@@ -0,0 +1,74 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLMEL_H
+#define _AAPL_AVLMEL_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avltree 
+ * @{
+ */
+
+/**
+ * \class AvlMel
+ * \brief AVL tree for elements appearing in multiple trees.
+ *
+ * AvlMel allows for an element to simultaneously be in multiple trees without
+ * the trees interfering with one another. For each tree that the element is
+ * to appear in, there must be a distinct set of AVL Tree management data that
+ * can be unambiguously referenced with some base class name. This name
+ * is passed to the tree as a template parameter and is used in the tree
+ * algorithms.
+ *
+ * The element must use the same key type and value in each tree that it
+ * appears in. If distinct keys are required, the AvlMelKey structure is
+ * available.
+ *
+ * AvlMel does not assume ownership of elements in the tree. The destructor
+ * will not delete the elements. If the user wishes to explicitly deallocate
+ * all the items in the tree the empty() routine is available. 
+ *
+ * \include ex_avlmel.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvlMel; tree members are reached via BaseEl::. */
+#define BASE_EL(name) BaseEl::name
+#define BASEKEY(name) name
+#define AVLMEL_CLASSDEF class Element, class Key, \
+		class BaseEl, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Element, class Key, \
+		class BaseEl, class Compare
+#define AVLMEL_TEMPUSE Element, Key, BaseEl, Compare
+#define AvlTree AvlMel
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASEKEY
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+
+#endif /* _AAPL_AVLMEL_H */
diff --git a/aapl/avlmelkey.h b/aapl/avlmelkey.h
new file mode 100644
index 00000000..9261cc83
--- /dev/null
+++ b/aapl/avlmelkey.h
@@ -0,0 +1,71 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLMELKEY_H
+#define _AAPL_AVLMELKEY_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avltree 
+ * @{
+ */
+
+/**
+ * \class AvlMelKey
+ * \brief AVL tree for elements appearing in multiple trees with different keys.
+ *
+ * AvlMelKey is similar to AvlMel, except that an additional template
+ * parameter, BaseKey, is provided for resolving ambiguous references to
+ * getKey(). This means that if an element is stored in multiple trees, each
+ * tree can use a different key for ordering the elements in it. Using
+ * AvlMelKey an array of data structures can be indexed with an O(log(n))
+ * search on two or more of the values contained within it and without
+ * allocating any additional data.
+ *
+ * AvlMelKey does not assume ownership of elements in the tree. The destructor
+ * will not delete the elements. If the user wishes to explicitly deallocate
+ * all the items in the tree the empty() routine is available. 
+ *
+ * \include ex_avlmelkey.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvlMelKey; BaseEl:: and BaseKey:: qualify names. */
+#define BASE_EL(name) BaseEl::name
+#define BASEKEY(name) BaseKey::name
+#define AVLMEL_CLASSDEF class Element, class Key, class BaseEl, \
+		class BaseKey, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Element, class Key, class BaseEl, \
+		class BaseKey, class Compare
+#define AVLMEL_TEMPUSE Element, Key, BaseEl, BaseKey, Compare
+#define AvlTree AvlMelKey
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASEKEY
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+
+#endif /* _AAPL_AVLMELKEY_H */
diff --git a/aapl/avlset.h b/aapl/avlset.h
new file mode 100644
index 00000000..224ee59f
--- /dev/null
+++ b/aapl/avlset.h
@@ -0,0 +1,70 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLSET_H
+#define _AAPL_AVLSET_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avltree 
+ * @{
+ */
+
+/**
+ * \class AvlSet
+ * \brief Key-only oriented tree.
+ *
+ * AvlSet stores only keys in elements that are managed by the tree. AvlSet
+ * requires that a Key type and a class containing a compare() routine
+ * for Key be given. Items are inserted with just a key value.
+ *
+ * AvlSet assumes all elements in the tree are allocated on the heap and are
+ * to be managed by the tree. This means that the class destructor will delete
+ * the contents of the tree. A deep copy will cause existing elements to be
+ * deleted first.
+ *
+ * \include ex_avlset.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvlSet; Element becomes AvlSetEl<Key>. */
+#define AVLTREE_SET
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define AVLMEL_CLASSDEF class Key, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Key, class Compare
+#define AVLMEL_TEMPUSE Key, Compare
+#define AvlTree AvlSet
+#define Element AvlSetEl<Key>
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef AVLTREE_SET
+#undef BASE_EL
+#undef BASEKEY
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+#undef Element
+
+#endif /* _AAPL_AVLSET_H */
diff --git a/aapl/avltree.h b/aapl/avltree.h
new file mode 100644
index 00000000..cf153595
--- /dev/null
+++ b/aapl/avltree.h
@@ -0,0 +1,73 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_AVLTREE_H
+#define _AAPL_AVLTREE_H
+
+#include "compare.h"
+
+/**
+ * \addtogroup avltree 
+ * @{
+ */
+
+/**
+ * \class AvlTree
+ * \brief Basic AVL tree.
+ *
+ * AvlTree is the standard by-structure AVL tree. To use this structure the
+ * user must define an element type and give it the necessary properties. At
+ * the very least it must have a getKey() function that will be used to
+ * compare the relative ordering of elements and tree management data
+ * necessary for the AVL algorithm. An element type can acquire the management
+ * data by inheriting the AvlTreeEl class.
+ *
+ * AvlTree does not presume to manage the allocation of elements in the tree.
+ * The destructor will not delete the items in the tree, instead the elements
+ * must be explicitly de-allocated by the user if necessary and when it is
+ * safe to do so. The empty() routine will traverse the tree and delete all
+ * items. 
+ *
+ * Since the tree does not manage the elements, it can contain elements that
+ * are allocated statically or that are part of another data structure.
+ *
+ * \include ex_avltree.cpp
+ */
+
+/*@}*/
+/* Configure avlcommon.h for AvlTree; the AvlTree macro maps to itself. */
+#define BASE_EL(name) name
+#define BASEKEY(name) name
+#define AVLMEL_CLASSDEF class Element, class Key, class Compare = CmpOrd<Key>
+#define AVLMEL_TEMPDEF class Element, class Key, class Compare
+#define AVLMEL_TEMPUSE Element, Key, Compare
+#define AvlTree AvlTree
+
+#include "avlcommon.h"
+/* Remove the configuration macros so they do not leak out of this header. */
+#undef BASE_EL
+#undef BASEKEY
+#undef AVLMEL_CLASSDEF
+#undef AVLMEL_TEMPDEF
+#undef AVLMEL_TEMPUSE
+#undef AvlTree
+
+#endif /* _AAPL_AVLTREE_H */
diff --git a/aapl/bstcommon.h b/aapl/bstcommon.h
new file mode 100644
index 00000000..bd390cdc
--- /dev/null
+++ b/aapl/bstcommon.h
@@ -0,0 +1,814 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+/* This header is not wrapped in ifndefs because it is
+ * not intended to be included by users directly. */
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/* Binary search table: a Vector of Elements searched by key with Compare. */
+template < BST_TEMPL_DECLARE > class BstTable :
+		public Compare,
+		public Vector< Element, Resize >
+{
+	typedef Vector<Element, Resize> BaseVector;
+	typedef Table<Element> BaseTable;
+
+public:
+	/**
+	 * \brief Default constructor.
+	 *
+	 * Create an empty binary search table.
+	 */
+	BstTable() { }
+
+	/**
+	 * \brief Construct with initial value.
+	 *
+	 * Constructs a binary search table with an initial item. Uses the default
+	 * constructor for initializing Value.
+	 */
+	BstTable(const Key &key) 
+		{ insert(key); }
+
+#if defined( BSTMAP )
+	/**
+	 * \brief Construct with initial value.
+	 *
+	 * Constructs a binary search table with an initial key/value pair.
+	 */
+	BstTable(const Key &key, const Value &val) 
+		{ insert(key, val); }
+#endif
+
+#if ! defined( BSTSET )
+	/**
+	 * \brief Construct with initial value.
+	 *
+	 * Constructs a binary search table with an initial Element.
+	 */
+	BstTable(const Element &el) 
+		{ insert(el); }
+#endif
+
+	Element *insert(const Key &key, Element **lastFound = 0);
+	Element *insertMulti(const Key &key);
+
+	bool insert(const BstTable &other);
+	void insertMulti(const BstTable &other);
+
+#if defined( BSTMAP )
+	Element *insert(const Key &key, const Value &val, 
+			Element **lastFound = 0);
+	Element *insertMulti(const Key &key, const Value &val );
+#endif
+
+#if ! defined( BSTSET )
+	Element *insert(const Element &el, Element **lastFound = 0);
+	Element *insertMulti(const Element &el);
+#endif
+
+	Element *find(const Key &key, Element **lastFound = 0) const;
+	bool findMulti( const Key &key, Element *&lower,
+			Element *&upper ) const;
+
+	bool remove(const Key &key);
+	bool remove(Element *item);
+	long removeMulti(const Key &key);
+	long removeMulti(Element *lower, Element *upper);
+
+	/* The following provide access to the underlying insert and remove
+	 * functions that may be hidden by the BST insert and remove. The insertDup
+	 * and insertNew functions will never be hidden. They are provided for
+	 * consistency. The difference between the non-shared and the shared
+	 * tables is the documentation reference to the invoked function. */
+
+#if !defined( SHARED_BST )
+	/*@{*/
+
+	/** \brief Call the insert of the underlying vector.
+	 *
+	 * Provides access to the vector insert, which may become hidden. Care
+	 * should be taken to ensure that after the insert the ordering of
+	 * elements is preserved.
+	 * Invokes Vector::insert( long pos, const T &val ).
+	 */
+	void vinsert(long pos, const Element &val)
+		{ Vector< Element, Resize >::insert( pos, &val, 1 ); }
+
+	/** \brief Call the insert of the underlying vector.
+	 *
+	 * Provides access to the vector insert, which may become hidden. Care
+	 * should be taken to ensure that after the insert the ordering of
+	 * elements is preserved.
+	 * Invokes Vector::insert( long pos, const T *val, long len ).
+	 */
+	void vinsert(long pos, const Element *val, long len)
+		{ Vector< Element, Resize >::insert( pos, val, len ); }
+
+	/** \brief Call the insert of the underlying vector.
+	 *
+	 * Provides access to the vector insert, which may become hidden. Care
+	 * should be taken to ensure that after the insert the ordering of
+	 * elements is preserved.
+	 * Invokes Vector::insert( long pos, const Vector &v ).
+	 */
+	void vinsert(long pos, const BstTable &v)
+		{ Vector< Element, Resize >::insert( pos, v.data, v.tabLen ); }
+
+	/*@}*/
+
+	/*@{*/
+
+	/** \brief Call the remove of the underlying vector.
+	 *
+	 * Provides access to the vector remove, which may become hidden.
+	 * Invokes Vector::remove( long pos ).
+	 */
+	void vremove(long pos)
+		{ Vector< Element, Resize >::remove( pos, 1 ); }
+
+	/** \brief Call the remove of the underlying vector.
+	 *
+	 * Provides access to the vector remove, which may become hidden.
+	 * Invokes Vector::remove( long pos, long len ).
+	 */
+	void vremove(long pos, long len)
+		{ Vector< Element, Resize >::remove( pos, len ); }
+
+	/*@}*/
+#else /* SHARED_BST */
+	/*@{*/
+
+	/** \brief Call the insert of the underlying vector.
+	 *
+	 * Provides access to the vector insert, which may become hidden. Care
+	 * should be taken to ensure that after the insert the ordering of
+	 * elements is preserved.
+	 * Invokes SVector::insert( long pos, const T &val ).
+	 */
+	void vinsert(long pos, const Element &val)
+		{ Vector< Element, Resize >::insert( pos, &val, 1 ); }
+
+	/** \brief Call the insert of the underlying vector.
+	 *
+	 * Provides access to the vector insert, which may become hidden. Care
+	 * should be taken to ensure that after the insert the ordering of
+	 * elements is preserved.
+	 * Invokes SVector::insert( long pos, const T *val, long len ).
+	 */
+	void vinsert(long pos, const Element *val, long len)
+		{ Vector< Element, Resize >::insert( pos, val, len ); }
+
+	/** \brief Call the insert of the underlying vector.
+	 *
+	 * Provides access to the vector insert, which may become hidden. Care
+	 * should be taken to ensure that after the insert the ordering of
+	 * elements is preserved.
+	 * Invokes SVector::insert( long pos, const SVector &v ).
+	 */
+	void vinsert(long pos, const BstTable &v)
+		{ Vector< Element, Resize >::insert( pos, v.data, v.length() ); }
+
+	/*@}*/
+
+	/*@{*/
+
+	/** \brief Call the remove of the underlying vector.
+	 *
+	 * Provides access to the vector remove, which may become hidden.
+	 * Invokes SVector::remove( long pos ).
+	 */
+	void vremove(long pos)
+		{ Vector< Element, Resize >::remove( pos, 1 ); }
+
+	/** \brief Call the remove of the underlying vector.
+	 *
+	 * Provides access to the vector remove, which may become hidden.
+	 * Invokes SVector::remove( long pos, long len ).
+	 */
+	void vremove(long pos, long len)
+		{ Vector< Element, Resize >::remove( pos, len ); }
+
+	/*@}*/
+
+#endif /* SHARED_BST */
+};
+
+
+#if 0
+#if defined( SHARED_BST )
+/**
+ * \brief Construct a binary search table with an initial amount of
+ * allocation.
+ *
+ * The table is initialized to have room for allocLen elements. The table
+ * starts empty. Nothing is allocated when allocLen is not positive.
+ */
+template <BST_TEMPL_DEF> BstTable<BST_TEMPL_USE>::
+		BstTable( long allocLen ) 
+{
+	/* Allocate the space if we are given a positive allocLen. */
+	if ( allocLen > 0 ) {
+		/* One malloc holds the STabHead followed by allocLen Elements. */
+		STabHead *head = (STabHead*) 
+				malloc( sizeof(STabHead) + sizeof(Element) * allocLen );
+		if ( head == 0 )
+			throw std::bad_alloc();
+
+		/* Fill in the header; data points just past it, at the elements. */
+		head->refCount = 1;
+		head->allocLen = allocLen;
+		head->tabLen = 0;
+		BaseTable::data = (Element*) (head + 1);
+	}
+}
+#else
+/**
+ * \brief Construct a binary search table with an initial amount of
+ * allocation.
+ *
+ * The table is initialized to have room for allocLen elements. The table
+ * starts empty. Nothing is allocated when allocLen is not positive.
+ */
+template <BST_TEMPL_DEF> BstTable<BST_TEMPL_USE>::
+		BstTable( long allocLen ) 
+{
+	/* Record the requested capacity; allocate only when it is positive. */
+	BaseTable::allocLen = allocLen;
+	if ( BaseTable::allocLen > 0 ) {
+		BaseTable::data = (Element*) malloc(sizeof(Element) * BaseTable::allocLen);
+		if ( BaseTable::data == NULL )
+			throw std::bad_alloc();
+	}
+}
+
+#endif
+#endif
+
+/**
+ * \brief Find the element with the given key and remove it.
+ *
+ * If multiple elements with the given key exist, then it is unspecified which
+ * element will be removed.
+ *
+ * \returns True if an element was found and removed, false otherwise.
+ */
+template <BST_TEMPL_DEF> bool BstTable<BST_TEMPL_USE>::
+		remove(const Key &key)
+{
+	Element *el = find(key);
+	if ( el != 0 ) {
+		/* Go through BaseVector so a non-default Resize still compiles. */
+		BaseVector::remove(el - BaseTable::data);
+		return true;
+	}
+	return false;
+}
+
+/**
+ * \brief Remove the element pointed to by item.
+ *
+ * If item does not point to an element in the table, then undefined
+ * behaviour results. If item is null, then remove has no effect.
+ *
+ * \returns True if item is not null, false otherwise.
+ */
+template <BST_TEMPL_DEF> bool BstTable<BST_TEMPL_USE>::
+		remove( Element *item )
+{
+	if ( item == 0 )
+		return false;
+	/* Go through BaseVector so a non-default Resize still compiles. */
+	BaseVector::remove(item - BaseTable::data);
+	return true;
+}
+
+/**
+ * \brief Find and remove the entire range of elements with the given key.
+ *
+ * \returns The number of elements removed.
+ */
+template <BST_TEMPL_DEF> long BstTable<BST_TEMPL_USE>::
+		removeMulti(const Key &key)
+{
+	Element *low, *high;
+	if ( findMulti(key, low, high) ) {
+		/* low..high is inclusive. Use BaseVector so any Resize compiles. */
+		long num = high - low + 1;
+		BaseVector::remove(low - BaseTable::data, num);
+		return num;
+	}
+
+	return 0;
+}
+
+template <BST_TEMPL_DEF> long BstTable<BST_TEMPL_USE>::
+		removeMulti(Element *lower, Element *upper)
+{
+	/* Remove the inclusive range [lower, upper]; returns the count removed. */
+	long num = upper - lower + 1;
+	BaseVector::remove(lower - BaseTable::data, num);
+	return num;
+}
+
+
+/**
+ * \brief Find a range of elements with the given key.
+ *
+ * If any elements with the given key exist then lower and upper are set to
+ * the first and last elements of the contiguous range of elements with the
+ * key. If none exist, lower and upper are left unmodified.
+ *
+ * \returns True if any elements are found, false otherwise.
+ */
+template <BST_TEMPL_DEF> bool BstTable<BST_TEMPL_USE>::
+		findMulti(const Key &key, Element *&low, Element *&high ) const
+{
+	const Element *lower, *mid, *upper;
+	long keyRelation;
+	const long tblLen = BaseTable::length();
+
+	if ( BaseTable::data == 0 )
+		return false;
+
+	lower = BaseTable::data;
+	upper = BaseTable::data + tblLen - 1;
+	while ( true ) {
+		if ( upper < lower ) {
+			/* Did not find the key in the array. */
+			return false;
+		}
+		/* Qualify compare: it lives in the dependent base class Compare. */
+		mid = lower + ((upper-lower)>>1);
+		keyRelation = Compare::compare(key, GET_KEY(*mid));
+
+		if ( keyRelation < 0 )
+			upper = mid - 1;
+		else if ( keyRelation > 0 )
+			lower = mid + 1;
+		else {
+			Element *lowEnd = BaseTable::data - 1;
+			Element *highEnd = BaseTable::data + tblLen;
+			/* mid is somewhere inside the run; widen in both directions. */
+			lower = mid - 1;
+			while ( lower != lowEnd && 
+					Compare::compare(key, GET_KEY(*lower)) == 0 )
+				lower--;
+
+			upper = mid + 1;
+			while ( upper != highEnd && 
+					Compare::compare(key, GET_KEY(*upper)) == 0 )
+				upper++;
+			/* lower and upper now sit one element outside the run. */
+			low = (Element*)lower + 1;
+			high = (Element*)upper - 1;
+			return true;
+		}
+	}
+}
+
+/**
+ * \brief Find an element with the given key.
+ *
+ * If the find succeeds then lastFound is set to the element found. If the
+ * find fails then lastFound is set to the location where the key would be
+ * inserted (it is left untouched when no storage is allocated). If several
+ * elements have the key, it is unspecified which one is returned.
+ *
+ * \returns The element found on success, null on failure.
+ */
+template <BST_TEMPL_DEF> Element *BstTable<BST_TEMPL_USE>::
+		find( const Key &key, Element **lastFound ) const
+{
+	const Element *lower, *mid, *upper;
+	long keyRelation;
+	const long tblLen = BaseTable::length();
+
+	if ( BaseTable::data == 0 )
+		return 0;
+
+	lower = BaseTable::data;
+	upper = BaseTable::data + tblLen - 1;
+	while ( true ) {
+		if ( upper < lower ) {
+			/* Did not find the key. Last found gets the insert location. */
+			if ( lastFound != 0 )
+				*lastFound = (Element*)lower;
+			return 0;
+		}
+		/* Qualify compare: it lives in the dependent base class Compare. */
+		mid = lower + ((upper-lower)>>1);
+		keyRelation = Compare::compare(key, GET_KEY(*mid));
+
+		if ( keyRelation < 0 )
+			upper = mid - 1;
+		else if ( keyRelation > 0 )
+			lower = mid + 1;
+		else {
+			/* Key is found. Last found gets the found record. */
+			if ( lastFound != 0 )
+				*lastFound = (Element*)mid;
+			return (Element*)mid;
+		}
+	}
+}
+
+template <BST_TEMPL_DEF> Element *BstTable<BST_TEMPL_USE>::
+		insert(const Key &key, Element **lastFound)
+{
+	/* Insert an Element built from key; returns null if the key exists. */
+	const Element *lower, *mid, *upper;
+	long keyRelation, insertPos;
+	const long tblLen = BaseTable::length();
+
+	if ( tblLen == 0 ) {
+		/* If the table is empty then go straight to insert. */
+		lower = BaseTable::data;
+		goto insert;
+	}
+
+	lower = BaseTable::data;
+	upper = BaseTable::data + tblLen - 1;
+	while ( true ) {
+		if ( upper < lower ) {
+			/* Key not found; the place to insert at is lower. */
+			goto insert;
+		}
+		/* Qualify compare: it lives in the dependent base class Compare. */
+		mid = lower + ((upper-lower)>>1);
+		keyRelation = Compare::compare(key, GET_KEY(*mid));
+
+		if ( keyRelation < 0 )
+			upper = mid - 1;
+		else if ( keyRelation > 0 )
+			lower = mid + 1;
+		else {
+			if ( lastFound != 0 )
+				*lastFound = (Element*)mid;
+			return 0;
+		}
+	}
+
+insert:
+	/* Get the insert pos. */
+	insertPos = lower - BaseTable::data;
+
+	/* Do the insert. After makeRawSpaceFor, lower pointer is no good. */
+	BaseVector::makeRawSpaceFor(insertPos, 1);
+	new(BaseTable::data + insertPos) Element(key);
+
+	/* Set lastFound */
+	if ( lastFound != 0 )
+		*lastFound = BaseTable::data + insertPos;
+	return BaseTable::data + insertPos;
+}
+
+
+template <BST_TEMPL_DEF> Element *BstTable<BST_TEMPL_USE>::
+		insertMulti(const Key &key)
+{
+	/* Insert an Element built from key even if the key already exists. */
+	const Element *lower, *mid, *upper;
+	long keyRelation, insertPos;
+	const long tblLen = BaseTable::length();
+
+	if ( tblLen == 0 ) {
+		/* If the table is empty then go straight to insert. */
+		lower = BaseTable::data;
+		goto insert;
+	}
+
+	lower = BaseTable::data;
+	upper = BaseTable::data + tblLen - 1;
+	while ( true ) {
+		if ( upper < lower ) {
+			/* Key not found; the place to insert at is lower. */
+			goto insert;
+		}
+		/* Qualify compare: it lives in the dependent base class Compare. */
+		mid = lower + ((upper-lower)>>1);
+		keyRelation = Compare::compare(key, GET_KEY(*mid));
+
+		if ( keyRelation < 0 )
+			upper = mid - 1;
+		else if ( keyRelation > 0 )
+			lower = mid + 1;
+		else {
+			lower = mid;
+			goto insert;
+		}
+	}
+
+insert:
+	/* Get the insert pos. */
+	insertPos = lower - BaseTable::data;
+
+	/* Do the insert. */
+	BaseVector::makeRawSpaceFor(insertPos, 1);
+	new(BaseTable::data + insertPos) Element(key);
+
+	/* Return the element inserted. */
+	return BaseTable::data + insertPos;
+}
+
+/**
+ * \brief Merge the contents of other into this table.
+ *
+ * Every element of other is passed to insert in turn. A rejected element does
+ * not stop the loop; the remaining elements are still attempted.
+ *
+ * \returns True if every insert returned an element, false if at least one
+ * returned null.
+ */
+template <BST_TEMPL_DEF> bool BstTable<BST_TEMPL_USE>::
+		insert(const BstTable &other)
+{
+	/* The length of other is read once, before any element is inserted. */
+	const long count = other.length();
+	bool everyInserted = true;
+	for ( long pos = 0; pos < count; ++pos ) {
+		if ( insert( other.data[pos] ) == 0 )
+			everyInserted = false;
+	}
+	return everyInserted;
+}
+
+/**
+ * \brief Add every element of other to this table, duplicates included.
+ *
+ * Each element of other is passed to insertMulti in turn.
+ */
+template <BST_TEMPL_DEF> void BstTable<BST_TEMPL_USE>::
+		insertMulti(const BstTable &other)
+{
+	const long count = other.length();
+	for ( long pos = 0; pos < count; ++pos )
+		insertMulti( other.data[pos] );
+}
+
+#if ! defined( BSTSET )
+
+/**
+ * \brief Insert the given element.
+ *
+ * If the key in the given element does not already exist in the table then a
+ * new element is inserted. The element copy constructor is used to place the
+ * element into the table. If lastFound is given, it is set to the new element
+ * created. If the insert fails then lastFound is set to the existing element
+ * of the same key.
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+template <BST_TEMPL_DEF> Element *BstTable<BST_TEMPL_USE>::
+		insert(const Element &el, Element **lastFound )
+{
+	const Element *lower, *mid, *upper;
+	long keyRelation, insertPos;
+	const long tblLen = BaseTable::length();
+
+	if ( tblLen == 0 ) {
+		/* If the table is empty then go straight to insert. */
+		lower = BaseTable::data;
+		goto insert;
+	}
+
+	lower = BaseTable::data;
+	upper = BaseTable::data + tblLen - 1;
+	while ( true ) {
+		if ( upper < lower ) {
+			/* Key not found; the place to insert at is lower. */
+			goto insert;
+		}
+
+		/* Qualify compare: it lives in the dependent base class Compare. */
+		mid = lower + ((upper-lower)>>1);
+		keyRelation = Compare::compare(GET_KEY(el), GET_KEY(*mid));
+
+		if ( keyRelation < 0 )
+			upper = mid - 1;
+		else if ( keyRelation > 0 )
+			lower = mid + 1;
+		else {
+			if ( lastFound != 0 )
+				*lastFound = (Element*)mid;
+			return 0;
+		}
+	}
+
+insert:
+	/* Get the insert pos. */
+	insertPos = lower - BaseTable::data;
+
+	/* Do the insert. After makeRawSpaceFor, lower pointer is no good. */
+	BaseVector::makeRawSpaceFor(insertPos, 1);
+	new(BaseTable::data + insertPos) Element(el);
+
+	/* Set lastFound */
+	if ( lastFound != 0 )
+		*lastFound = BaseTable::data + insertPos;
+	return BaseTable::data + insertPos;
+}
+
+/**
+ * \brief Insert the given element even if it exists already.
+ *
+ * If the key in the given element exists already then the new element is
+ * placed next to some other element of the same key. InsertMulti cannot fail.
+ * The element copy constructor is used to place the element in the table.
+ *
+ * \returns The new element created.
+ */
+template <BST_TEMPL_DEF> Element *BstTable<BST_TEMPL_USE>::
+		insertMulti(const Element &el)
+{
+	const Element *lower, *mid, *upper;
+	long keyRelation, insertPos;
+	const long tblLen = BaseTable::length();
+
+	if ( tblLen == 0 ) {
+		/* If the table is empty then go straight to insert. */
+		lower = BaseTable::data;
+		goto insert;
+	}
+
+	lower = BaseTable::data;
+	upper = BaseTable::data + tblLen - 1;
+	while ( true ) {
+		if ( upper < lower ) {
+			/* Key not found; the place to insert at is lower. */
+			goto insert;
+		}
+
+		/* Qualify compare: it lives in the dependent base class Compare. */
+		mid = lower + ((upper-lower)>>1);
+		keyRelation = Compare::compare(GET_KEY(el), GET_KEY(*mid));
+
+		if ( keyRelation < 0 )
+			upper = mid - 1;
+		else if ( keyRelation > 0 )
+			lower = mid + 1;
+		else {
+			lower = mid;
+			goto insert;
+		}
+	}
+
+insert:
+	/* Get the insert pos. */
+	insertPos = lower - BaseTable::data;
+
+	/* Do the insert. */
+	BaseVector::makeRawSpaceFor(insertPos, 1);
+	new(BaseTable::data + insertPos) Element(el);
+
+	/* Return the element inserted. */
+	return BaseTable::data + insertPos;
+}
+#endif
+
+
+#if defined( BSTMAP )
+
+/**
+ * \brief Insert a key-value pair unless the key is already present.
+ *
+ * A binary search locates the key. When it is absent the pair is constructed
+ * in the table at its sorted position from copies of key and val, and
+ * lastFound, if given, is set to the new entry. When it is present nothing is
+ * inserted and lastFound, if given, is set to the existing pair.
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+template <BST_TEMPL_DEF> Element *BstTable<BST_TEMPL_USE>::
+		insert(const Key &key, const Value &val, Element **lastFound)
+{
+	/* Closed index range [first, last] still to be searched. An empty table
+	 * gives last == -1, so the search loop below is skipped entirely and
+	 * the pair goes in at index zero. */
+	long first = 0;
+	long last = BaseTable::length() - 1;
+
+	while ( first <= last ) {
+		/* Probe the middle of the remaining range. */
+		const long probe = first + ((last - first) >> 1);
+		const Element &cand = BaseTable::data[probe];
+		const long rel = Compare::compare(key, cand.key);
+
+		if ( rel == 0 ) {
+			/* The key is already present: hand back the existing pair
+			 * through lastFound and report failure. */
+			if ( lastFound != NULL )
+				*lastFound = BaseTable::data + probe;
+			return 0;
+		}
+
+		if ( rel < 0 ) {
+			/* Key sorts before the probe: continue in the lower half. */
+			last = probe - 1;
+		}
+		else {
+			/* Key sorts after the probe: continue in the upper half. */
+			first = probe + 1;
+		}
+	}
+
+	/* The search ran out without a match, so the key is absent and first
+	 * is the index at which it belongs. */
+	const long slot = first;
+
+	/* Make room at the slot with makeRawSpaceFor, then construct the pair
+	 * there. The address is computed only after the space has been made. */
+	BaseVector::makeRawSpaceFor(slot, 1);
+	Element *created = BaseTable::data + slot;
+	new(created) Element(key, val);
+
+	/* Report the new pair through lastFound as well as through the
+	 * return value. */
+	if ( lastFound != NULL )
+		*lastFound = created;
+	return created;
+}
+
+
+/**
+ * \brief Insert a key-value pair whether or not the key is already present.
+ *
+ * A binary search picks the position. If a pair with an equal key is hit,
+ * the new pair is inserted at that pair's index; otherwise it goes where the
+ * search ended. The pair is constructed from copies of key and val.
+ *
+ * \returns The new element created.
+ */
+template <BST_TEMPL_DEF> Element *BstTable<BST_TEMPL_USE>::
+		insertMulti(const Key &key, const Value &val)
+{
+	/* Closed index range [first, last] still to be searched. An empty table
+	 * gives last == -1, so the search loop below is skipped entirely and
+	 * the pair goes in at index zero. */
+	long first = 0;
+	long last = BaseTable::length() - 1;
+
+	while ( first <= last ) {
+		/* Probe the middle of the remaining range and compare its key
+		 * with the key being inserted. */
+		const long probe = first + ((last - first) >> 1);
+		const Element &cand = BaseTable::data[probe];
+		const long rel = Compare::compare(key, cand.key);
+
+		if ( rel == 0 ) {
+			/* An equal key exists: the new pair is placed at the index
+			 * of the pair that matched. */
+			first = probe;
+			break;
+		}
+
+		if ( rel < 0 ) {
+			/* Key sorts before the probe: continue in the lower half. */
+			last = probe - 1;
+		}
+		else {
+			/* Key sorts after the probe: continue in the upper half. */
+			first = probe + 1;
+		}
+	}
+
+	/* first is now the insert position, whether the loop ended on a match
+	 * or ran out of range. */
+	const long slot = first;
+
+	/* Make room at the slot with makeRawSpaceFor, then construct the pair
+	 * there. The address is computed only after the space has been made. */
+	BaseVector::makeRawSpaceFor(slot, 1);
+	Element *created = BaseTable::data + slot;
+	new(created) Element(key, val);
+
+	/* Return the element inserted. */
+	return created;
+}
+
+#endif
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
diff --git a/aapl/bstmap.h b/aapl/bstmap.h
new file mode 100644
index 00000000..5154b86c
--- /dev/null
+++ b/aapl/bstmap.h
@@ -0,0 +1,113 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_BSTMAP_H
+#define _AAPL_BSTMAP_H
+
+#include "compare.h"
+#include "vector.h"
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \brief Element for BstMap.
+ *
+ * Stores the key and value pair. Members not supplied are value-initialized.
+ */
+template <class Key, class Value> struct BstMapEl
+{
+	BstMapEl() : key(), value() {}
+	BstMapEl(const Key &key) : key(key), value() {}
+	BstMapEl(const Key &key, const Value &val) : key(key), value(val) {}
+
+	/** \brief The key */
+	Key key;
+
+	/** \brief The value. */
+	Value value;
+};
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+/**
+ * \addtogroup bst 
+ * @{
+ */
+
+/** 
+ * \class BstMap
+ * \brief Binary search table for key and value pairs.
+ *
+ * BstMap stores key and value pairs in each element. The key and value can be
+ * any type. A compare class for the key must be supplied.
+ */
+
+/*@}*/
+
+#define BST_TEMPL_DECLARE class Key, class Value, \
+		class Compare = CmpOrd<Key>, class Resize = ResizeExpn
+#define BST_TEMPL_DEF class Key, class Value, class Compare, class Resize
+#define BST_TEMPL_USE Key, Value, Compare, Resize
+#define GET_KEY(el) ((el).key)
+#define BstTable BstMap
+#define Element BstMapEl<Key, Value>
+#define BSTMAP
+
+#include "bstcommon.h"
+
+#undef BST_TEMPL_DECLARE
+#undef BST_TEMPL_DEF
+#undef BST_TEMPL_USE
+#undef GET_KEY
+#undef BstTable
+#undef Element
+#undef BSTMAP
+
+/**
+ * \fn BstMap::insert(const Key &key, BstMapEl<Key, Value> **lastFound)
+ * \brief Insert the given key.
+ *
+ * If the given key does not already exist in the table then a new element
+ * having key is inserted. The key copy constructor and value default
+ * constructor are used to place the pair in the table. If lastFound is given,
+ * it is set to the new entry created. If the insert fails then lastFound is
+ * set to the existing pair of the same key.
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+
+/**
+ * \fn BstMap::insertMulti(const Key &key)
+ * \brief Insert the given key even if it exists already.
+ *
+ * If the key exists already then the new element having key is placed next
+ * to some other pair of the same key. InsertMulti cannot fail. The key copy
+ * constructor and the value default constructor are used to place the pair in
+ * the table.
+ *
+ * \returns The new element created.
+ */
+
+#endif /* _AAPL_BSTMAP_H */
diff --git a/aapl/bstset.h b/aapl/bstset.h
new file mode 100644
index 00000000..ce710ee0
--- /dev/null
+++ b/aapl/bstset.h
@@ -0,0 +1,86 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_BSTSET_H
+#define _AAPL_BSTSET_H
+
+/**
+ * \addtogroup bst 
+ * @{
+ */
+
+/** 
+ * \class BstSet
+ * \brief Binary search table for types that are the key.
+ *
+ * BstSet is suitable for types that comprise the entire key. Rather than look
+ * into the element to retrieve the key, the element is the key. A class that
+ * contains a comparison routine for the key must be given.
+ */
+
+/*@}*/
+
+#include "compare.h"
+#include "vector.h"
+
+#define BST_TEMPL_DECLARE class Key, class Compare = CmpOrd<Key>, \
+		class Resize = ResizeExpn
+#define BST_TEMPL_DEF class Key, class Compare, class Resize
+#define BST_TEMPL_USE Key, Compare, Resize
+#define GET_KEY(el) (el)
+#define BstTable BstSet
+#define Element Key
+#define BSTSET
+
+#include "bstcommon.h"
+
+#undef BST_TEMPL_DECLARE
+#undef BST_TEMPL_DEF
+#undef BST_TEMPL_USE
+#undef GET_KEY
+#undef BstTable
+#undef Element
+#undef BSTSET
+
+/**
+ * \fn BstSet::insert(const Key &key, Key **lastFound)
+ * \brief Insert the given key.
+ *
+ * If the given key does not already exist in the table then it is inserted.
+ * The key's copy constructor is used to place the item in the table. If
+ * lastFound is given, it is set to the new entry created. If the insert fails
+ * then lastFound is set to the existing key of the same value.
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+
+/**
+ * \fn BstSet::insertMulti(const Key &key)
+ * \brief Insert the given key even if it exists already.
+ *
+ * If the key exists already then it is placed next to some other key of the
+ * same value. InsertMulti cannot fail. The key's copy constructor is used to
+ * place the item in the table.
+ *
+ * \returns The new element created.
+ */
+
+#endif /* _AAPL_BSTSET_H */
diff --git a/aapl/bsttable.h b/aapl/bsttable.h
new file mode 100644
index 00000000..9898ebff
--- /dev/null
+++ b/aapl/bsttable.h
@@ -0,0 +1,84 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_BSTTABLE_H
+#define _AAPL_BSTTABLE_H
+
+#include "compare.h"
+#include "vector.h"
+
+/**
+ * \addtogroup bst 
+ * @{
+ */
+
+/** 
+ * \class BstTable
+ * \brief Binary search table for structures that contain a key.
+ *
+ * This is the basic binary search table. It can be used to contain a
+ * structure that has a key and possibly some data. The key should be a member
+ * of the element class and accessible with getKey(). A class containing the
+ * compare routine must be supplied.
+ */
+
+/*@}*/
+
+#define BST_TEMPL_DECLARE class Element, class Key, \
+		class Compare = CmpOrd<Key>, class Resize = ResizeExpn
+#define BST_TEMPL_DEF class Element, class Key, class Compare, class Resize
+#define BST_TEMPL_USE Element, Key, Compare, Resize
+#define GET_KEY(el) ((el).getKey())
+#define BSTTABLE
+
+#include "bstcommon.h"
+
+#undef BST_TEMPL_DECLARE
+#undef BST_TEMPL_DEF
+#undef BST_TEMPL_USE
+#undef GET_KEY
+#undef BSTTABLE
+
+/**
+ * \fn BstTable::insert(const Key &key, Element **lastFound)
+ * \brief Insert a new element with the given key.
+ *
+ * If the given key does not already exist in the table a new element is
+ * inserted with the given key. A constructor taking only const Key& is used
+ * to initialize the new element. If lastFound is given, it is set to the new
+ * element created. If the insert fails then lastFound is set to the existing
+ * element with the same key. 
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+
+/**
+ * \fn BstTable::insertMulti(const Key &key)
+ * \brief Insert a new element even if the key exists already.
+ *
+ * If the key exists already then the new element is placed next to some
+ * element with the same key. InsertMulti cannot fail. A constructor taking
+ * only const Key& is used to initialize the new element.
+ *
+ * \returns The new element created.
+ */
+
+#endif /* _AAPL_BSTTABLE_H */
diff --git a/aapl/bubblesort.h b/aapl/bubblesort.h
new file mode 100644
index 00000000..20e0f6f4
--- /dev/null
+++ b/aapl/bubblesort.h
@@ -0,0 +1,94 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_BUBBLESORT_H
+#define _AAPL_BUBBLESORT_H
+#include <string.h>
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \addtogroup sort 
+ * @{
+ */
+
+/** 
+ * \class BubbleSort
+ * \brief Bubble sort an array of data.
+ *
+ * BubbleSort can be used to sort any array of objects of type T provided a
+ * compare class is given. BubbleSort is in-place. It does not require any
+ * temporary storage.
+ *
+ * Objects are not made aware that they are being moved around in memory.
+ * Assignment operators, constructors and destructors are never invoked by the
+ * sort.
+ *
+ * BubbleSort runs in O(n^2) time. It is most useful when sorting arrays that
+ * are nearly sorted. It is best when neighbouring pairs are out of place.
+ * BubbleSort is a stable sort, meaning that objects with the same key have
+ * their relative ordering preserved.
+ */
+
+/*@}*/
+
+/* BubbleSort: inherits Compare, whose compare() routine orders the elements. */
+template <class T, class Compare> class BubbleSort 
+	: public Compare
+{
+public:
+	/* Sort the len elements starting at data, in place, using compare(). */
+	void sort(T *data, long len);
+};
+
+
+/**
+ * \brief Bubble sort data[0..len-1] in place using the inherited compare.
+ *
+ * Neighbours are swapped bytewise with memcpy, so T's constructors and
+ * assignment operator never run. Sorting stops after a pass with no swap.
+ */
+template <class T, class Compare> void BubbleSort<T,Compare>::
+		sort(T *data, long len)
+{
+	bool changed = true;
+	for ( long pass = 1; changed && pass < len; pass++ ) {
+		changed = false;
+		for ( long i = 0; i < len-pass; i++ ) {
+			/* compare() is a member of the dependent base Compare; without
+			 * this-> two-phase name lookup does not search that base. */
+			if ( this->compare( data[i], data[i+1] ) > 0 ) {
+				char tmp[sizeof(T)];
+				memcpy( tmp, data+i, sizeof(T) );
+				memcpy( data+i, data+i+1, sizeof(T) );
+				memcpy( data+i+1, tmp, sizeof(T) );
+				changed = true;
+			}
+		}
+	}
+}
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_BUBBLESORT_H */
diff --git a/aapl/compare.h b/aapl/compare.h
new file mode 100644
index 00000000..3d547b51
--- /dev/null
+++ b/aapl/compare.h
@@ -0,0 +1,273 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_COMPARE_H
+#define _AAPL_COMPARE_H
+
+#include <string.h>
+#include "astring.h"
+#include "table.h"
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \defgroup compare Compare
+ * \brief Basic compare classes.
+ *
+ * Compare classes are used by data structures that need to know the relative
+ * ordering of elements. To become a compare class, a class must implement a
+ * routine long compare(const T &key1, const T &key2) that behaves just like
+ * strcmp. 
+ *
+ * Compare classes are passed to the template data structure as a template
+ * parameter and are inherited. In most cases the compare routine will base
+ * the key comparison only on the two keys and the compare routine can
+ * therefore be static. Though sometimes it is useful to include data in the
+ * compare class and use this data in the comparison. For example the compare
+ * class may contain a pointer to some other data structure to which the
+ * comparison is delegated.
+ *
+ * @{
+ */
+
+/**
+ * \brief Compare C strings with strcmp, or StrTmpl strings by length then bytes.
+ *
+ * Both overloads are static, so no compare object state is required.
+ */
+template<class T> struct CmpStrTmpl
+{
+	/**
+	 * \brief Compare two null terminated strings; the result is that of strcmp.
+	 */
+	static inline long compare( const char *k1, const char *k2 )
+	{
+		return strcmp(k1, k2);
+	}
+
+	/* Order StrTmpl strings by length(), then memcmp over length() bytes. */
+	static int compare( const StrTmpl<T> &s1, const StrTmpl<T> &s2 )
+	{
+		if ( s1.length() < s2.length() ) return -1;
+		if ( s1.length() > s2.length() ) return 1;
+		return memcmp( s1.data, s2.data, s1.length() );
+	}
+};
+
+typedef CmpStrTmpl<char> CmpStr;
+
+/**
+ * \brief Three-way compare for types that provide operators < and >.
+ *
+ * Intended for simple types such as integers and pointers, whose built-in
+ * less-than and greater-than operators define the ordering.
+ */
+template <class T> struct CmpOrd
+{
+	/**
+	 * \brief Compare two ordinal values, which are passed in by value.
+	 *
+	 * Only operators < and > of T are used; operator == is never consulted,
+	 * so two values that are neither less nor greater compare as equal.
+	 *
+	 * \returns -1 if k1 < k2, 1 if k1 > k2, and 0 otherwise.
+	 */
+	static inline long compare(const T k1, const T k2)
+	{
+		if ( k1 < k2 )
+			return -1;
+		return ( k1 > k2 ) ? 1 : 0;
+	}
+};
+
+/**
+ * \brief Compare two tables of type T.
+ *
+ * Useful for keying a data structure on a vector or binary search table. T
+ * is the element type stored in the table and CompareT is the comparison
+ * structure applied to the individual elements. The element compare is
+ * called from a static member, so CompareT::compare must itself be static.
+ */
+template < class T, class CompareT = CmpOrd<T> > struct CmpTable
+		: public CompareT
+{
+	/**
+	 * \brief Compare two tables storing type T.
+	 *
+	 * A table with fewer elements orders first. Tables of equal length are
+	 * compared element by element from the front.
+	 *
+	 * \returns -1 or 1 when the lengths differ, otherwise the first non-zero
+	 * element compare result, or 0 if every element compares equal.
+	 */
+	static inline long compare(const Table<T> &t1, const Table<T> &t2)
+	{
+		/* Differing lengths decide the ordering without touching the data. */
+		if ( t1.tabLen != t2.tabLen )
+			return ( t1.tabLen < t2.tabLen ) ? -1 : 1;
+
+		const long len = t1.tabLen;
+		for ( long pos = 0; pos < len; pos++ ) {
+			long cmpResult = CompareT::compare( t1.data[pos], t2.data[pos] );
+			if ( cmpResult != 0 )
+				return cmpResult;
+		}
+		return 0;
+	}
+};
+
+/**
+ * \brief Compare two tables of type T -- non-static version.
+ *
+ * CmpTableNs is identical to CmpTable, however the compare routine is
+ * non-static.  If the CompareT class contains a non-static compare, then this
+ * version must be used because a static member cannot invoke a non-static
+ * member.
+ *
+ * Table comparison is useful for keying a data structure on a vector or binary
+ * search table. T is the element type stored in the table. CompareT
+ * is the comparison structure used to compare the individual values in the
+ * table.
+ */
+template < class T, class CompareT = CmpOrd<T> > struct CmpTableNs
+		: public CompareT
+{
+	/**
+	 * \brief Compare two tables storing type T.
+	 *
+	 * \returns -1 or 1 when the table lengths differ, otherwise the first
+	 * non-zero element compare result, or 0 if all elements compare equal.
+	 */
+	inline long compare(const Table<T> &t1, const Table<T> &t2)
+	{
+		/* The shorter table orders first. */
+		if ( t1.tabLen < t2.tabLen )
+			return -1;
+		if ( t1.tabLen > t2.tabLen )
+			return 1;
+
+		/* Equal lengths: walk both tables in step. */
+		T *p1 = t1.data, *p2 = t2.data;
+		for ( long todo = t1.tabLen; todo > 0; todo--, p1++, p2++ ) {
+			long cmpResult = CompareT::compare( *p1, *p2 );
+			if ( cmpResult != 0 )
+				return cmpResult;
+		}
+		return 0;
+	}
+};
+
+/**
+ * \brief Compare two implicitly shared tables of type T
+ *
+ * This table comparison is for data structures based on implicitly
+ * shared tables.
+ *
+ * Table comparison is useful for keying a data structure on a vector or
+ * binary search table. T is the element type stored in the table.
+ * CompareT is the comparison structure used to compare the individual values
+ * in the table.
+ */
+template < class T, class CompareT = CmpOrd<T> > struct CmpSTable : public CompareT
+{
+	/**
+	 * \brief Compare two tables storing type T.
+	 *
+	 * Each table's length() is read exactly once. The shorter table orders
+	 * first; tables of equal length are compared element by element,
+	 * starting from the front, using CompareT::compare.
+	 *
+	 * \returns -1 or 1 when the lengths differ, otherwise the first non-zero
+	 * element compare result, or 0 if all elements compare equal.
+	 */
+	static inline long compare(const STable<T> &t1, const STable<T> &t2)
+	{
+		const long len1 = t1.length();
+		const long len2 = t2.length();
+		if ( len1 != len2 )
+			return ( len1 < len2 ) ? -1 : 1;
+
+		/* Same length: the first differing element decides. */
+		for ( long pos = 0; pos < len1; pos++ ) {
+			long cmpResult = CompareT::compare( t1.data[pos], t2.data[pos] );
+			if ( cmpResult != 0 )
+				return cmpResult;
+		}
+		return 0;
+	}
+};
+
+
+/**
+ * \brief Compare two implicitly shared tables of type T -- non-static
+ * version.
+ *
+ * This is a non-static table comparison for data structures based on
+ * implicitly shared tables. If the CompareT class contains a non-static
+ * compare, then this version must be used because a static member cannot
+ * invoke a non-static member.
+ *
+ * Table comparison is useful for keying a data structure on a vector or
+ * binary search table. T is the element type stored in the table.
+ * CompareT is the comparison structure used to compare the individual values
+ * in the table.
+ */
+template < class T, class CompareT = CmpOrd<T> > struct CmpSTableNs
+		: public CompareT
+{
+	/**
+	 * \brief Compare two tables storing type T.
+	 *
+	 * Each table's length() is read exactly once, t1 before t2.
+	 *
+	 * \returns -1 or 1 when the lengths differ, otherwise the first non-zero
+	 * element compare result, or 0 if all elements compare equal.
+	 */
+	inline long compare(const STable<T> &t1, const STable<T> &t2)
+	{
+		const long len1 = t1.length(), len2 = t2.length();
+
+		/* The shorter table orders first. */
+		if ( len1 < len2 )
+			return -1;
+		if ( len1 > len2 )
+			return 1;
+
+		/* Same length: walk both tables in step. */
+		T *p1 = t1.data, *p2 = t2.data;
+		for ( long todo = len1; todo > 0; todo--, p1++, p2++ ) {
+			long cmpResult = CompareT::compare( *p1, *p2 );
+			if ( cmpResult != 0 )
+				return cmpResult;
+		}
+		return 0;
+	}
+};
+
+
+/*@}*/
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_COMPARE_H */
diff --git a/aapl/dlcommon.h b/aapl/dlcommon.h
new file mode 100644
index 00000000..5ce9bd30
--- /dev/null
+++ b/aapl/dlcommon.h
@@ -0,0 +1,790 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+/* This header is not wrapped in ifndef because it is not intended to
+ * be included by the user. */
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+#if defined( DOUBLELIST_VALUE )
+/**
+ * \brief Double list element for DListVal.
+ *
+ * DListValEl stores the type T of DListVal by value. 
+ */
+template <class T> struct DListValEl
+{
+	/**
+	 * \brief Construct a DListValEl with a given value.
+	 *
+	 * The only constructor available initializes the value element. This
+	 * enforces that DListVal elements are never created without having their
+	 * value initialized by the user. T's copy constructor is used to copy the
+	 * value in. The prev and next pointers are left uninitialized.
+	 */
+	DListValEl( const T &val ) : value(val) { }
+
+	/**
+	 * \brief Value stored by the list element.
+	 *
+	 * Value is always copied into new list elements using the copy
+	 * constructor.
+	 */
+	T value;
+
+	/**
+	 * \brief List previous pointer.
+	 *
+	 * Points to the previous item in the list. If this is the first item in
+	 * the list, then prev is NULL. If this element is not in a list then
+	 * prev is undefined.
+	 */
+	DListValEl<T> *prev;
+
+	/**
+	 * \brief List next pointer.
+	 *
+	 * Points to the next item in the list. If this is the last item in the
+	 * list, then next is NULL. If this element is not in a list then next is
+	 * undefined.
+	 */
+	DListValEl<T> *next;
+};
+#else
+
+#ifndef __AAPL_DOUBLE_LIST_EL
+#define __AAPL_DOUBLE_LIST_EL
+/**
+ * \brief Double list element properties.
+ *
+ * This class can be inherited to make a class suitable to be a double list
+ * element. It simply provides the next and previous pointers. An alternative
+ * is to put the next and previous pointers in the class directly.
+ */
+template <class Element> struct DListEl
+{
+	/**
+	 * \brief List previous pointer.
+	 *
+	 * Points to the previous item in the list. If this is the first item in
+	 * the list, then prev is NULL. If this element is not in a list then
+	 * prev is undefined.
+	 */
+	Element *prev;
+
+	/**
+	 * \brief List next pointer.
+	 *
+	 * Points to the next item in the list. If this is the last item in the
+	 * list, then next is NULL. If this element is not in a list then next is
+	 * undefined.
+	 */
+	Element *next;
+};
+#endif /* __AAPL_DOUBLE_LIST_EL */
+
+#endif
+
+/* Doubly linked list. With DOUBLELIST_VALUE the destructor deletes the elements. */
+template <DLMEL_TEMPDEF> class DList
+{
+public:
+	/** \brief Initialize an empty list. */
+	DList() : head(0), tail(0), listLen(0) {}
+
+	/** 
+	 * \brief Perform a deep copy of the list.
+	 * 
+	 * The elements of the other list are duplicated and put into this list.
+	 * Elements are copied using the copy constructor.
+	 */
+	DList(const DList &other);
+
+#ifdef DOUBLELIST_VALUE
+	/**
+	 * \brief Clear the double list contents.
+	 *
+	 * All elements are deleted.
+	 */
+	~DList() { empty(); }
+
+	/**
+	 * \brief Assign another list into this list using a deep copy.
+	 *
+	 * The elements of the other list are duplicated and put into this list.
+	 * Each list item is created using the copy constructor. If this list
+	 * contains any elements before the copy, they are deleted first.
+	 *
+	 * \returns A reference to this.
+	 */
+	DList &operator=(const DList &other);
+
+	/**
+	 * \brief Transfer the contents of another list into this list.
+	 *
+	 * The elements of the other list are moved in. The other list will be
+	 * empty afterwards.  If this list contains any elements before the
+	 * transfer, then they are deleted.
+	 */
+	void transfer(DList &other);
+#else
+	/**
+	 * \brief Abandon all elements in the list. 
+	 *
+	 * List elements are not deleted.
+	 */
+	~DList() {}
+
+	/**
+	 * \brief Perform a deep copy of the list.
+	 *
+	 * The elements of the other list are duplicated and put into this list.
+	 * Each list item is created using the copy constructor. If this list
+	 * contains any elements before the copy, they are abandoned.
+	 *
+	 * \returns A reference to this.
+	 */
+	DList &operator=(const DList &other);
+
+	/**
+	 * \brief Transfer the contents of another list into this list.
+	 *
+	 * The elements of the other list are moved in. The other list will be
+	 * empty afterwards.  If this list contains any elements before the
+	 * transfer, they are abandoned.
+	 */
+	void transfer(DList &other);
+#endif
+
+
+#ifdef DOUBLELIST_VALUE
+	/**
+	 * \brief Make a new element and prepend it to the front of the list.
+	 *
+	 * The item is copied into the new element using the copy constructor.
+	 * Equivalent to list.addBefore(list.head, item).
+	 */
+	void prepend(const T &item);
+
+	/**
+	 * \brief Make a new element and append it to the end of the list.
+	 *
+	 * The item is copied into the new element using the copy constructor.
+	 * Equivalent to list.addAfter(list.tail, item).
+	 */
+	void append(const T &item);
+
+	/**
+	 * \brief Make a new element and insert it immediately after an element in
+	 * the list.
+	 *
+	 * The item is copied into the new element using the copy constructor. If
+	 * prev_el is NULL then the new element is prepended to the front of the
+	 * list. If prev_el is not already in the list then undefined behaviour
+	 * results.  Equivalent to list.addAfter(prev_el, new DListValEl(item)).
+	 */
+	void addAfter(Element *prev_el, const T &item);
+
+	/**
+	 * \brief Make a new element and insert it immediately before an element
+	 * in the list. 
+	 *
+	 * The item is copied into the new element using the copy constructor. If
+	 * next_el is NULL then the new element is appended to the end of the
+	 * list.  If next_el is not already in the list then undefined behaviour
+	 * results.  Equivalent to list.addBefore(next_el, new DListValEl(item)).
+	 */
+	void addBefore(Element *next_el, const T &item);
+#endif
+
+	/**
+	 * \brief Prepend a single element to the front of the list.
+	 *
+	 * If new_el is already an element of some list, then undefined behaviour
+	 * results. Equivalent to list.addBefore(list.head, new_el).
+	 */
+	void prepend(Element *new_el) { addBefore(head, new_el); }
+
+	/**
+	 * \brief Append a single element to the end of the list.
+	 *
+	 * If new_el is already an element of some list, then undefined behaviour
+	 * results.  Equivalent to list.addAfter(list.tail, new_el).
+	 */
+	void append(Element *new_el)  { addAfter(tail, new_el); }
+
+	/**
+	 * \brief Prepend an entire list to the beginning of this list.
+	 *
+	 * All items are moved, not copied. Afterwards, the other list is empty.
+	 * All items are prepended at once, so this is an O(1) operation.
+	 * Equivalent to list.addBefore(list.head, dl).
+	 */
+	void prepend(DList &dl)       { addBefore(head, dl); }
+
+	/**
+	 * \brief Append an entire list to the end of the list.
+	 *
+	 * All items are moved, not copied. Afterwards, the other list is empty.
+	 * All items are appended at once, so this is an O(1) operation.
+	 * Equivalent to list.addAfter(list.tail, dl).
+	 */
+	void append(DList &dl)        { addAfter(tail, dl); }
+
+	void addAfter(Element *prev_el, Element *new_el);
+	void addBefore(Element *next_el, Element *new_el);
+
+	void addAfter(Element *prev_el, DList &dl);
+	void addBefore(Element *next_el, DList &dl);
+
+	/**
+	 * \brief Detach the head of the list
+	 *
+	 * The element detached is not deleted. If there is no head of the list
+	 * (the list is empty) then undefined behaviour results.  Equivalent to
+	 * list.detach(list.head).
+	 *
+	 * \returns The element detached.
+	 */
+	Element *detachFirst()        { return detach(head); }
+
+	/**
+	 * \brief Detach the tail of the list
+	 *
+	 * The element detached is not deleted. If there is no tail of the list
+	 * (the list is empty) then undefined behaviour results.  Equivalent to
+	 * list.detach(list.tail).
+	 *
+	 * \returns The element detached.
+	 */
+	Element *detachLast()         { return detach(tail); }
+
+ 	/* Detaches an element from the list. Does not free any memory. */
+	Element *detach(Element *el);
+
+	/**
+	 * \brief Detach and delete the first element in the list.
+	 *
+	 * If there is no first element (the list is empty) then undefined
+	 * behaviour results.  Equivalent to delete list.detach(list.head);
+	 */
+	void removeFirst()         { delete detach( head ); }
+
+	/**
+	 * \brief Detach and delete the last element in the list.
+	 *
+	 * If there is no last element (the list is empty) then undefined
+	 * behaviour results.  Equivalent to delete list.detach(list.tail);
+	 */
+	void removeLast()          { delete detach( tail ); }
+
+	/**
+	 * \brief Detach and delete an element from the list.
+	 *
+	 * If the element is not in the list, then undefined behaviour results.
+	 * Equivalent to delete list.detach(el);
+	 */
+	void remove(Element *el)   { delete detach( el ); }
+	
+	void empty();
+	void abandon();
+
+	/** \brief The number of elements in the list. */
+	long length() const { return listLen; }
+
+	/** \brief Head and tail of the linked list. Both are null when empty. */
+	Element *head, *tail;
+
+	/** \brief The number of elements in the list. */
+	long listLen;
+
+	/* Convenience access; returns the same value as length(). */
+	long size() const           { return listLen; }
+
+	/* Forward this so a ref can be used. */
+	struct Iter;
+
+	/* Tag classes used to construct or assign an Iter at a given position. */
+	struct IterFirst { IterFirst( const DList &l ) : l(l) { } const DList &l; };
+	struct IterLast { IterLast( const DList &l ) : l(l) { } const DList &l; };
+	struct IterNext { IterNext( const Iter &i ) : i(i) { } const Iter &i; };
+	struct IterPrev { IterPrev( const Iter &i ) : i(i) { } const Iter &i; };
+
+	/**
+	 * \brief Double List Iterator. 
+	 * \ingroup iterators
+	 */
+	struct Iter
+	{
+		/* Default construct; the iterator points at no element. */
+		Iter() : ptr(0) { }
+
+		/* Construct from a double list (starts at head), element or tag. */
+		Iter( const DList &dl )      : ptr(dl.head) { }
+		Iter( Element *el )          : ptr(el) { }
+		Iter( const IterFirst &dlf ) : ptr(dlf.l.head) { }
+		Iter( const IterLast &dll )  : ptr(dll.l.tail) { }
+		Iter( const IterNext &dln )  : ptr(dln.i.ptr->BASE_EL(next)) { }
+		Iter( const IterPrev &dlp )  : ptr(dlp.i.ptr->BASE_EL(prev)) { }
+
+		/* Assign from a double list (starts at head), element or tag. */
+		Iter &operator=( const DList &dl )     { ptr = dl.head; return *this; }
+		Iter &operator=( Element *el )         { ptr = el; return *this; }
+		Iter &operator=( const IterFirst &af ) { ptr = af.l.head; return *this; }
+		Iter &operator=( const IterLast &al )  { ptr = al.l.tail; return *this; }
+		Iter &operator=( const IterNext &an )  { ptr = an.i.ptr->BASE_EL(next); return *this; }
+		Iter &operator=( const IterPrev &ap )  { ptr = ap.i.ptr->BASE_EL(prev); return *this; }
+
+		/** \brief Less than end? True while ptr is non-null. */
+		bool lte() const    { return ptr != 0; }
+
+		/** \brief At end? True when ptr is null. */
+		bool end() const    { return ptr == 0; }
+
+		/** \brief Greater than beginning? True while ptr is non-null. */
+		bool gtb() const { return ptr != 0; }
+
+		/** \brief Moved off the beginning? True when ptr is null. */
+		bool beg() const { return ptr == 0; }
+
+		/** \brief At first element? */
+		bool first() const { return ptr && ptr->BASE_EL(prev) == 0; }
+
+		/** \brief At last element? */
+		bool last() const  { return ptr && ptr->BASE_EL(next) == 0; }
+
+		/** \brief Implicit cast to Element*. */
+		operator Element*() const   { return ptr; }
+
+		/** \brief Dereference operator returns Element&. */
+		Element &operator *() const { return *ptr; }
+
+		/** \brief Arrow operator returns Element*. */
+		Element *operator->() const { return ptr; }
+
+		/** \brief Move to next item and return it. */
+		inline Element *operator++()      { return ptr = ptr->BASE_EL(next); }
+
+		/** \brief Move to next item and return it. */
+		inline Element *increment()       { return ptr = ptr->BASE_EL(next); }
+
+		/** \brief Move to next item, returning the item moved away from. */
+		inline Element *operator++(int);
+
+		/** \brief Move to previous item and return it. */
+		inline Element *operator--()      { return ptr = ptr->BASE_EL(prev); }
+
+		/** \brief Move to previous item and return it. */
+		inline Element *decrement()       { return ptr = ptr->BASE_EL(prev); }
+
+		/** \brief Move to previous item, returning the item moved away from. */
+		inline Element *operator--(int);
+
+		/** \brief Return the next item. Does not modify this. */
+		inline IterNext next() const { return IterNext(*this); }
+
+		/** \brief Return the prev item. Does not modify this. */
+		inline IterPrev prev() const { return IterPrev(*this); }
+
+		/** \brief The iterator is simply a pointer. */
+		Element *ptr;
+	};
+
+	/** \brief Return a tag from which an Iter at the first element is built. */
+	IterFirst first()  { return IterFirst(*this); }
+
+	/** \brief Return a tag from which an Iter at the last element is built. */
+	IterLast last()    { return IterLast(*this); }
+};
+
+/* Copy constructor: start empty, then append a copy-constructed duplicate of
+ * each element of other, front to back. */
+template <DLMEL_TEMPDEF> DList<DLMEL_TEMPUSE>::
+		DList(const DList<DLMEL_TEMPUSE> &other)
+	: head(0), tail(0), listLen(0)
+{
+	for ( Element *src = other.head; src != 0; src = src->BASE_EL(next) ) {
+		Element *dup = new Element(*src);
+		append( dup );
+	}
+}
+
+#ifdef DOUBLELIST_VALUE
+
+/* Assignment operator does a deep copy. The value list owns its elements,
+ * so the old contents are deleted before the copies are appended.
+ * Self-assignment is a no-op: emptying first would otherwise delete the
+ * very elements that are about to be copied, leaving the list empty. */
+template <DLMEL_TEMPDEF> DList<DLMEL_TEMPUSE> &DList<DLMEL_TEMPUSE>::
+		operator=(const DList &other)
+{
+	if ( this != &other ) {
+		empty();
+
+		for ( Element *el = other.head; el != 0; el = el->BASE_EL(next) )
+			append( new Element(*el) );
+	}
+	return *this;
+}
+
+/* Take over the elements of other, deleting this list's own elements first.
+ * Transferring a list to itself is a no-op instead of deleting everything. */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::
+		transfer(DList &other)
+{
+	if ( this == &other )
+		return;
+	empty();
+	head = other.head;
+	tail = other.tail;
+	listLen = other.listLen;
+	other.abandon();
+}
+
+#else 
+
+/* Assignment: abandon (do not delete) the current elements, then deep copy
+ * other. Self-assignment is a no-op; the copy loop would otherwise never end. */
+template <DLMEL_TEMPDEF> DList<DLMEL_TEMPUSE> &DList<DLMEL_TEMPUSE>::
+		operator=(const DList &other)
+{
+	if ( this == &other ) return *this;
+	abandon();
+	for ( Element *el = other.head; el != 0; el = el->BASE_EL(next) )
+		append( new Element(*el) );
+	return *this;
+}
+
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::transfer(DList &other)
+{
+	/* Self-transfer must not abandon the list's own elements. */
+	if ( this == &other ) return;
+	head = other.head;
+	tail = other.tail;
+	listLen = other.listLen;
+	other.abandon();
+}
+
+#endif
+
+#ifdef DOUBLELIST_VALUE
+
+/* Prepend a copy of item. Kept out of line so callers do not absorb new's cost. */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::prepend(const T &item)
+{
+	Element *created = new Element(item);
+	addBefore(head, created);
+}
+
+/* Append a copy of item. Kept out of line so callers do not absorb new's cost. */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::append(const T &item)
+{
+	Element *created = new Element(item);
+	addAfter(tail, created);
+}
+
+/* Insert a copy of item after prev_el. Kept out of line so callers do not
+ * absorb the cost of new. */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::addAfter(Element *prev_el, const T &item)
+{
+	Element *created = new Element(item);
+	addAfter(prev_el, created);
+}
+
+/* Insert a copy of item before next_el. Kept out of line so callers do not
+ * absorb the cost of new. */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::addBefore(Element *next_el, const T &item)
+{
+	Element *created = new Element(item);
+	addBefore(next_el, created);
+}
+
+#endif
+
+/*
+ * The larger iterator operators.
+ */
+
+/* Postfix ++: step to the next element and return the element stepped away
+ * from. ptr is dereferenced, so the iterator must not already be at the end. */
+template <DLMEL_TEMPDEF> Element *DList<DLMEL_TEMPUSE>::Iter::operator++(int)
+{
+	Element *const before = ptr;
+	ptr = before->BASE_EL(next);
+	return before;
+}
+
+/* Postfix --: step to the previous element and return the element stepped
+ * away from. ptr is dereferenced, so the iterator must point at an element. */
+template <DLMEL_TEMPDEF> Element *DList<DLMEL_TEMPUSE>::Iter::operator--(int)
+{
+	Element *const before = ptr;
+	ptr = before->BASE_EL(prev);
+	return before;
+}
+
+/**
+ * \brief Insert an element immediately after an element in the list.
+ *
+ * If prev_el is NULL then new_el is prepended to the front of the list. If
+ * prev_el is not in the list or if new_el is already in a list, then
+ * undefined behaviour results. The list length is incremented.
+ */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::
+		addAfter(Element *prev_el, Element *new_el)
+{
+	/* The new element always records prev_el as its predecessor, even when
+	 * prev_el is null and the insertion happens at the head. */
+	new_el->BASE_EL(prev) = prev_el;
+
+	/* Link in the forward direction. */
+	if ( prev_el != 0 ) {
+		/* Splice between prev_el and whatever used to follow it. */
+		new_el->BASE_EL(next) = prev_el->BASE_EL(next);
+		prev_el->BASE_EL(next) = new_el;
+	}
+	else {
+		/* No predecessor: the old head follows and new_el becomes head. */
+		new_el->BASE_EL(next) = head;
+		head = new_el;
+	}
+
+	/* Link in the reverse direction. */
+	Element *following = new_el->BASE_EL(next);
+	if ( following != 0 ) {
+		/* The successor must point back at new_el. */
+		following->BASE_EL(prev) = new_el;
+	}
+	else {
+		/* Nothing follows, so new_el is the new tail. */
+		tail = new_el;
+	}
+
+	listLen++;
+}
+
+/**
+ * \brief Insert an element immediately before an element in the list.
+ *
+ * If next_el is NULL then new_el is appended to the end of the list. If
+ * next_el is not in the list or if new_el is already in a list, then
+ * undefined behaviour results. The list length is incremented.
+ */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::
+		addBefore(Element *next_el, Element *new_el)
+{
+	/* The new element always records next_el as its successor, even when
+	 * next_el is null and the insertion happens at the tail. */
+	new_el->BASE_EL(next) = next_el;
+
+	/* Link in the reverse direction. */
+	if ( next_el != 0 ) {
+		/* Splice between next_el and whatever used to precede it. */
+		new_el->BASE_EL(prev) = next_el->BASE_EL(prev);
+		next_el->BASE_EL(prev) = new_el;
+	}
+	else {
+		/* No successor: the old tail precedes and new_el becomes tail. */
+		new_el->BASE_EL(prev) = tail;
+		tail = new_el;
+	}
+
+	/* Link in the forward direction. */
+	Element *preceding = new_el->BASE_EL(prev);
+	if ( preceding != 0 ) {
+		/* The predecessor must point forward at new_el. */
+		preceding->BASE_EL(next) = new_el;
+	}
+	else {
+		/* Nothing precedes, so new_el is the new head. */
+		head = new_el;
+	}
+
+	listLen++;
+}
+
+/**
+ * \brief Insert an entire list immediately after an element in this list.
+ *
+ * Elements are moved, not copied. Afterwards, the other list is empty. If
+ * prev_el is NULL then the elements are prepended to the front of the list.
+ * If prev_el is not in the list then undefined behaviour results. All
+ * elements are inserted into the list at once, so this is an O(1) operation.
+ */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::
+		addAfter( Element *prev_el, DList<DLMEL_TEMPUSE> &dl )
+{
+	/* An empty dl has no head or tail to link; nothing to do. */
+	if ( dl.listLen == 0 )
+		return;
+
+	Element *first = dl.head, *last = dl.tail;
+
+	/* The front of the incoming run always records prev_el behind it. */
+	first->BASE_EL(prev) = prev_el;
+
+	/* Link in the forward direction. */
+	if ( prev_el != 0 ) {
+		/* Splice the run between prev_el and its old successor. */
+		last->BASE_EL(next) = prev_el->BASE_EL(next);
+		prev_el->BASE_EL(next) = first;
+	}
+	else {
+		/* No predecessor: the old head follows the run. */
+		last->BASE_EL(next) = head;
+		head = first;
+	}
+
+	/* Link in the reverse direction. */
+	Element *following = last->BASE_EL(next);
+	if ( following != 0 ) {
+		/* The successor must point back at the end of the run. */
+		following->BASE_EL(prev) = last;
+	}
+	else {
+		/* Nothing follows, so the run's last element is the new tail. */
+		tail = last;
+	}
+
+	/* Take over dl's length and leave dl empty. */
+	listLen += dl.listLen;
+	dl.head = dl.tail = 0;
+	dl.listLen = 0;
+}
+
+/**
+ * \brief Insert an entire list immediately before an element in this list.
+ *
+ * Elements are moved, not copied. Afterwards, the other list is empty. If
+ * next_el is NULL then the elements are appended to the end of the list. If
+ * next_el is not in the list then undefined behaviour results. All elements
+ * are inserted at once, so this is an O(1) operation.
+ */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::
+		addBefore( Element *next_el, DList<DLMEL_TEMPUSE> &dl )
+{
+	/* An empty dl has no head or tail to link; nothing to do. */
+	if ( dl.listLen == 0 )
+		return;
+
+	Element *first = dl.head, *last = dl.tail;
+
+	/* The back of the incoming run always records next_el ahead of it. */
+	last->BASE_EL(next) = next_el;
+
+	/* Link in the reverse direction. */
+	if ( next_el != 0 ) {
+		/* Splice the run between next_el and its old predecessor. */
+		first->BASE_EL(prev) = next_el->BASE_EL(prev);
+		next_el->BASE_EL(prev) = last;
+	}
+	else {
+		/* No successor: the old tail precedes the run. */
+		first->BASE_EL(prev) = tail;
+		tail = last;
+	}
+
+	/* Link in the forward direction. */
+	Element *preceding = first->BASE_EL(prev);
+	if ( preceding != 0 ) {
+		/* The predecessor must point forward at the start of the run. */
+		preceding->BASE_EL(next) = first;
+	}
+	else {
+		/* Nothing precedes, so the run's first element is the new head. */
+		head = first;
+	}
+
+	/* Take over dl's length and leave dl empty. */
+	listLen += dl.listLen;
+	dl.head = dl.tail = 0;
+	dl.listLen = 0;
+}
+
+
+/**
+ * \brief Detach an element from the list.
+ *
+ * The element is not deleted and its own prev/next pointers are left as
+ * they were. If the element is not in the list, then undefined behaviour
+ * results.
+ * \returns The element detached.
+ */
+template <DLMEL_TEMPDEF> Element *DList<DLMEL_TEMPUSE>::
+		detach(Element *el)
+{
+	/* The neighbours on either side of el; either may be null. */
+	Element *before = el->BASE_EL(prev);
+	Element *after = el->BASE_EL(next);
+
+	/* Forward direction: whatever preceded el now leads to after. */
+	if ( before != 0 )
+		before->BASE_EL(next) = after;
+	else
+		head = after;
+
+	/* Reverse direction: whatever followed el now leads back to before. */
+	if ( after != 0 )
+		after->BASE_EL(prev) = before;
+	else
+		tail = before;
+
+	/* One element fewer; hand the detached element back to the caller. */
+	listLen--;
+	return el;
+}
+
+/**
+ * \brief Clear the list by deleting all elements.
+ *
+ * Each item in the list is deleted. The list is reset to its initial state.
+ */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::empty()
+{
+	/* Read each element's next pointer before deleting it; head, tail and
+	 * listLen are only reset once every element is gone. */
+	Element *cur = head;
+	while ( cur != 0 ) {
+		Element *doomed = cur;
+		cur = cur->BASE_EL(next);
+		delete doomed;
+	}
+	head = tail = 0;
+	listLen = 0;
+}
+
+/**
+ * \brief Clear the list by forgetting all elements.
+ *
+ * Elements are abandoned, not deleted. The list returns to its initial state.
+ */
+template <DLMEL_TEMPDEF> void DList<DLMEL_TEMPUSE>::abandon()
+{
+	head = 0;
+	tail = 0;
+	listLen = 0;
+}
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
diff --git a/aapl/dlist.h b/aapl/dlist.h
new file mode 100644
index 00000000..eaf3e5d5
--- /dev/null
+++ b/aapl/dlist.h
@@ -0,0 +1,64 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_DLIST_H
+#define _AAPL_DLIST_H
+
+#define BASE_EL(name) name              /* link members are named directly */
+#define DLMEL_TEMPDEF class Element     /* template parameter list */
+#define DLMEL_TEMPUSE Element           /* matching template argument list */
+#define DList DList                     /* name of the list class to define */
+
+/**
+ * \addtogroup dlist
+ * @{
+ */
+
+/**
+ * \class DList
+ * \brief Basic doubly linked list.
+ *
+ * DList is the standard by-structure list type. This class requires the
+ * programmer to declare a list element type that has the necessary next and
+ * previous pointers in it. This can be achieved by inheriting from the
+ * DListEl class or by simply adding next and previous pointers directly into
+ * the list element class.
+ *
+ * DList does not assume ownership of elements in the list. If the elements
+ * are known to reside on the heap, the provided empty() routine can be used to
+ * delete all elements, however the destructor will not call this routine, it
+ * will simply abandon all the elements. It is up to the programmer to
+ * explicitly de-allocate items when necessary.
+ *
+ * \include ex_dlist.cpp
+ */
+
+/*@}*/
+
+#include "dlcommon.h"
+
+#undef BASE_EL
+#undef DLMEL_TEMPDEF
+#undef DLMEL_TEMPUSE
+#undef DList
+
+#endif /* _AAPL_DLIST_H */
+
diff --git a/aapl/dlistmel.h b/aapl/dlistmel.h
new file mode 100644
index 00000000..34331393
--- /dev/null
+++ b/aapl/dlistmel.h
@@ -0,0 +1,71 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_DLISTMEL_H
+#define _AAPL_DLISTMEL_H
+
+/**
+ * \addtogroup dlist
+ * @{
+ */
+
+/**
+ * \class DListMel
+ * \brief Doubly linked list for elements that may appear in multiple lists.
+ *
+ * This class is similar to DList, except that the user defined list element
+ * can inherit from multiple DListEl classes and consequently be an element in
+ * multiple lists. In other words, DListMel allows a single instance of a data
+ * structure to be an element in multiple lists without the lists interfering
+ * with one another.
+ *
+ * For each list that an element class is to appear in, the element must have
+ * unique next and previous pointers that can be unambiguously referred to with
+ * some base class name. This name is given to DListMel as a template argument
+ * so it can use the correct next and previous pointers in its list
+ * operations.
+ *
+ * DListMel does not assume ownership of elements in the list. If the elements
+ * are known to reside on the heap and are not contained in any other list or
+ * data structure, the provided empty() routine can be used to delete all
+ * elements, however the destructor will not call this routine, it will simply
+ * abandon all the elements. It is up to the programmer to explicitly
+ * de-allocate items when it is safe to do so.
+ *
+ * \include ex_dlistmel.cpp
+ */
+
+/*@}*/
+
+#define BASE_EL(name) BaseEl::name      /* qualify link members with BaseEl */
+#define DLMEL_TEMPDEF class Element, class BaseEl   /* template parameters */
+#define DLMEL_TEMPUSE Element, BaseEl   /* matching template arguments */
+#define DList DListMel                  /* name of the list class to define */
+/* The shared implementation is instantiated under the names set above. */
+#include "dlcommon.h"
+/* Remove the configuration so another list header can set its own. */
+#undef BASE_EL
+#undef DLMEL_TEMPDEF
+#undef DLMEL_TEMPUSE
+#undef DList
+
+#endif /* _AAPL_DLISTMEL_H */
+
diff --git a/aapl/dlistval.h b/aapl/dlistval.h
new file mode 100644
index 00000000..6f249995
--- /dev/null
+++ b/aapl/dlistval.h
@@ -0,0 +1,71 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_DLISTVAL_H
+#define _AAPL_DLISTVAL_H
+
+/**
+ * \addtogroup dlist
+ * @{
+ */
+
+/**
+ * \class DListVal
+ * \brief By-value doubly linked list.
+ *
+ * This class is a doubly linked list that does not require a list element
+ * type to be declared. The user instead gives a type that is to be stored in
+ * the list element. When inserting a new data item, the value is copied into
+ * a newly allocated element. This list is intended to behave and be utilized
+ * like the list template found in the STL.
+ *
+ * DListVal is different from the other lists in that it allocates elements
+ * itself. The raw element insert interface is still exposed for convenience,
+ * however, the list assumes all elements in the list are allocated on the
+ * heap and are to be managed by the list. The destructor WILL delete the
+ * contents of the list. If the list is ever copied in from another list, the
+ * existing contents are deleted first. This is in contrast to DList and
+ * DListMel, which will never delete their contents to allow for statically
+ * allocated elements.
+ *
+ * \include ex_dlistval.cpp
+ */
+
+/*@}*/
+
+#define BASE_EL(name) name              /* link members are named directly */
+#define DLMEL_TEMPDEF class T           /* template parameter: the value type */
+#define DLMEL_TEMPUSE T                 /* matching template argument */
+#define DList DListVal                  /* name of the list class to define */
+#define Element DListValEl<T>           /* element type used by the list code */
+#define DOUBLELIST_VALUE                /* NOTE(review): presumably selects the by-value code in dlcommon.h -- confirm */
+/* The shared implementation is instantiated under the names set above. */
+#include "dlcommon.h"
+/* Remove the configuration so another list header can set its own. */
+#undef BASE_EL
+#undef DLMEL_TEMPDEF
+#undef DLMEL_TEMPUSE
+#undef DList
+#undef Element
+#undef DOUBLELIST_VALUE
+
+#endif /* _AAPL_DLISTVAL_H */
+
diff --git a/aapl/insertsort.h b/aapl/insertsort.h
new file mode 100644
index 00000000..eb3e2649
--- /dev/null
+++ b/aapl/insertsort.h
@@ -0,0 +1,94 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_INSERTSORT_H
+#define _AAPL_INSERTSORT_H
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \addtogroup sort 
+ * @{
+ */
+
+/** 
+ * \class InsertSort
+ * \brief Insertion sort an array of data.
+ *
+ * InsertSort can be used to sort any array of objects of type T provided a
+ * compare class is given. InsertSort is in-place. It does not require any
+ * temporary storage.
+ *
+ * Objects are not made aware that they are being moved around in memory.
+ * Assignment operators, constructors and destructors are never invoked by the
+ * sort.
+ *
+ * InsertSort runs in O(n^2) time. It is most useful when sorting small arrays,
+ * where it can outperform the O(n*log(n)) sorters due to its simplicity.
+ * InsertSort is not a stable sort. Elements with the same key will not have
+ * their relative ordering preserved.
+ */
+
+/*@}*/
+
+/* InsertSort: in-place O(n^2) sorter; derives from Compare to use compare(). */
+template <class T, class Compare> class InsertSort
+	: public Compare
+{
+public:
+	/* Sort the len items starting at data into ascending compare() order. */
+	void sort(T *data, long len);
+};
+
+
+/**
+ * \brief Sort data[0..len) ascending by compare(), moving items with memcpy.
+ */
+template <class T, class Compare> 
+	void InsertSort<T,Compare>::sort(T *data, long len)
+{
+	/* Each pass fixes the slot at dest; the last slot needs no pass. */
+	for ( T *dest = data; dest < data+len-1; dest++ ) {
+		/* Find the smallest element in the unsorted tail [dest, data+len). */
+		T *smallest = dest;
+		for ( T *src = dest+1; src < data+len; src++ ) {
+			/* this-> defers lookup of compare to the dependent base class. */
+			if ( this->compare( *src, *smallest ) < 0 )
+				smallest = src;
+		}
+
+		if ( smallest != dest ) {
+			/* Byte-wise swap: no constructor or assignment is invoked. */
+			char tmp[sizeof(T)];
+			memcpy( tmp, dest, sizeof(T) );
+			memcpy( dest, smallest, sizeof(T) );
+			memcpy( smallest, tmp, sizeof(T) );
+		}
+	}
+}
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_INSERTSORT_H */
diff --git a/aapl/mergesort.h b/aapl/mergesort.h
new file mode 100644
index 00000000..d017511f
--- /dev/null
+++ b/aapl/mergesort.h
@@ -0,0 +1,140 @@
+/*
+ *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_MERGESORT_H
+#define _AAPL_MERGESORT_H
+
+#include "bubblesort.h"
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \addtogroup sort 
+ * @{
+ */
+
+/** 
+ * \class MergeSort
+ * \brief Merge sort an array of data.
+ *
+ * MergeSort can be used to sort any array of objects of type T provided a
+ * compare class is given. MergeSort is not in-place, it requires temporary
+ * storage equal to the size of the array. The temporary storage is allocated
+ * on the heap.
+ *
+ * Objects are not made aware that they are being moved around in memory.
+ * Assignment operators, constructors and destructors are never invoked by the
+ * sort. 
+ *
+ * MergeSort runs in worst case O(n*log(n)) time. In most cases it is slower
+ * than QuickSort because more copying is necessary. But on the other hand,
+ * it is a stable sort, meaning that objects with the same key have their
+ * relative ordering preserved. Also, its worst case is better. MergeSort
+ * switches to a BubbleSort when the size of the array being sorted is small.
+ * This happens when directly sorting a small array or when MergeSort calls
+ * itself recursively on a small portion of a larger array.
+ */
+
+/*@}*/
+
+
+/* MergeSort: derives from BubbleSort, which doSort uses for short runs. */
+template <class T, class Compare> class MergeSort 
+		: public BubbleSort<T, Compare>
+{
+public:
+	/* Sorting interface routine: allocates scratch space, sorts, frees it. */
+	void sort(T *data, long len);
+
+private:
+	/* Recursive worker; tmpStor is scratch space with room for len items. */
+	void doSort(T *tmpStor, T *data, long len);
+};
+
+#define _MS_BUBBLE_THRESH 16
+
+/* Recursive mergesort worker. Splits data in two, sorts each half (using the
+ * matching part of tmpStor as scratch), merges into tmpStor and copies back. */
+template< class T, class Compare> void MergeSort<T,Compare>::
+		doSort(T *tmpStor, T *data, long len)
+{
+	if ( len <= 1 )
+		return;
+
+	if ( len <= _MS_BUBBLE_THRESH ) {
+		BubbleSort<T, Compare>::sort( data, len );
+		return;
+	}
+
+	long mid = len / 2;
+
+	doSort( tmpStor, data, mid );
+	doSort( tmpStor + mid, data + mid, len - mid );
+	
+	/* Merge the two sorted halves into tmpStor. */
+	T *endLower = data + mid, *lower = data;
+	T *endUpper = data + len, *upper = data + mid;
+	T *dest = tmpStor;
+	while ( true ) {
+		if ( lower == endLower ) {
+			/* Lower half used up; whatever is left of upper goes last. */
+			if ( upper != endUpper )
+				memcpy( dest, upper, (endUpper - upper) * sizeof(T) );
+			break;
+		}
+		else if ( upper == endUpper ) {
+			/* Upper half used up; the rest of lower goes last. */
+			if ( lower != endLower )
+				memcpy( dest, lower, (endLower - lower) * sizeof(T) );
+			break;
+		}
+		else {
+			/* Lower wins ties. this-> finds compare in the dependent base. */
+			if ( this->compare(*lower, *upper) <= 0 )
+				memcpy( dest++, lower++, sizeof(T) );
+			else
+				memcpy( dest++, upper++, sizeof(T) );
+		}
+	}
+
+	/* Copy back from the tmpStor array. */
+	memcpy( data, tmpStor, sizeof( T ) * len );
+}
+
+/**
+ * \brief Merge sort the len items at data, using heap scratch space.
+ */
+template< class T, class Compare> 
+	void MergeSort<T,Compare>::sort(T *data, long len)
+{
+	/* Scratch space is raw bytes sized for len items; released afterwards. */
+	char *scratch = new char[sizeof(T) * len];
+	doSort( (T*) scratch, data, len );
+	delete[] scratch;
+}
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_MERGESORT_H */
diff --git a/aapl/quicksort.h b/aapl/quicksort.h
new file mode 100644
index 00000000..9bb96efd
--- /dev/null
+++ b/aapl/quicksort.h
@@ -0,0 +1,185 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_QUICKSORT_H
+#define _AAPL_QUICKSORT_H
+
+#include "insertsort.h"
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \addtogroup sort 
+ * @{
+ */
+
+/** 
+ * \class QuickSort
+ * \brief Quick sort an array of data.
+ *
+ * QuickSort can be used to sort any array of objects of type T provided a
+ * compare class is given. QuickSort is in-place. It does not require any
+ * temporary storage.
+ *
+ * Objects are not made aware that they are being moved around in memory.
+ * Assignment operators, constructors and destructors are never invoked by the
+ * sort.
+ *
+ * QuickSort runs in O(n*log(n)) time in the average case. It is faster than
+ * mergesort in the average case because it does less moving of data. The
+ * performance of quicksort depends mostly on the choice of pivot. This
+ * implementation picks the pivot as the median of first, middle, last. This
+ * choice of pivot avoids the O(n^2) worst case for input already sorted, but
+ * it is still possible to encounter the O(n^2) worst case. For example an
+ * array of identical elements will run in O(n^2).
+ *
+ * QuickSort is not a stable sort. Elements with the same key will not have
+ * their relative ordering preserved.  QuickSort switches to an InsertSort
+ * when the size of the array being sorted is small. This happens when
+ * directly sorting a small array or when QuickSort calls itself recursively
+ * on a small portion of a larger array.
+ */
+
+/*@}*/
+
+/* QuickSort: derives from InsertSort, which doSort uses for short ranges. */
+template <class T, class Compare> class QuickSort : 
+		public InsertSort<T, Compare>
+{
+public:
+	/* Sorting interface routine. */
+	void sort(T *data, long len);
+
+private:
+	/* Recursive worker; start and end are both inclusive. */
+	void doSort(T *start, T *end);
+	T *partition(T *start, T *end);      /* returns the pivot's final position */
+	inline T *median(T *start, T *end);  /* picks the pivot for partition */
+};
+
+#define _QS_INSERTION_THRESH 16
+
+/* Returns whichever of start, the midpoint and end holds the median value. */
+template <class T, class Compare> T *QuickSort<T,Compare>::
+		median(T *start, T *end)
+{
+	T *pivot, *mid = start + (end-start)/2;
+
+	/* Choose the pivot. this-> finds compare in the dependent base class. */
+	if ( this->compare(*start, *mid) < 0  ) {
+		if ( this->compare(*mid, *end) < 0 )
+			pivot = mid;
+		else if ( this->compare(*start, *end) < 0 )
+			pivot = end;
+		else
+			pivot = start;
+	}
+	else if ( this->compare(*start, *end) < 0 )
+		pivot = start;
+	else if ( this->compare(*mid, *end) < 0 )
+		pivot = end;
+	else
+		pivot = mid;
+
+	return pivot;
+}
+
+template <class T, class Compare> T *QuickSort<T,Compare>::
+		partition(T *start, T *end)
+{
+	/* Median-of-three pivot: save its bytes, then move the last element into
+	 * its slot. compare is called via this-> as it is in a dependent base. */
+	char pcPivot[sizeof(T)];
+	T *pivot = median(start, end);
+
+	memcpy( pcPivot, pivot, sizeof(T) );
+	if ( pivot != end )
+		memcpy( pivot, end, sizeof(T) );
+
+	T *first = start-1;
+	T *last = end;
+	pivot = (T*) pcPivot;
+
+	/* Shuffle elements to the correct side of the pivot, ending up with
+	 * the free spot where the pivot will go; that spot is returned. */
+	while ( true ) {
+		/* Throw one element ahead to the free spot at last. */
+		while ( true ) {
+			first += 1;
+			if ( first == last )
+				goto done;
+			if ( this->compare( *first, *pivot ) > 0 ) {
+				memcpy(last, first, sizeof(T));
+				break;
+			}
+		}
+
+		/* Throw one element back to the free spot at first. */
+		while ( true ) {
+			last -= 1;
+			if ( last == first )
+				goto done;
+			if ( this->compare( *last, *pivot ) < 0 ) {
+				memcpy(first, last, sizeof(T));
+				break;
+			}
+		}
+	}
+done:
+	/* Put the pivot into the middle spot for it. */
+	memcpy( first, pivot, sizeof(T) );
+	return first;
+}
+
+
+template< class T, class Compare> void QuickSort<T,Compare>::
+		doSort(T *start, T *end)
+{
+	const long count = end - start + 1;   /* both ends are inclusive */
+	if ( count <= 1 )
+		return;
+	if ( count <= _QS_INSERTION_THRESH ) {
+		InsertSort<T, Compare>::sort( start, count );
+		return;
+	}
+	/* Large range: quicksort. Small ranges above went to InsertSort. */
+	T *pivot = partition( start, end );
+	doSort(start, pivot-1);
+	doSort(pivot+1, end);
+}
+
+/** \brief Quick sort an array of len items in place, ordered by compare(). */
+template< class T, class Compare> 
+	void QuickSort<T,Compare>::sort(T *data, long len)
+{
+	/* Fewer than two items are already sorted. Returning here also avoids
+	 * forming the out-of-range pointer data-1 when len is zero. */
+	if ( len > 1 )
+		doSort(data, data+len-1);
+}
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_QUICKSORT_H */
diff --git a/aapl/resize.h b/aapl/resize.h
new file mode 100644
index 00000000..24edc16e
--- /dev/null
+++ b/aapl/resize.h
@@ -0,0 +1,344 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_RESIZE_H
+#define _AAPL_RESIZE_H
+
+#include <assert.h>
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/* This step is expressed in units of T. Changing this requires changes to
+ * docs in ResizeLin constructor.  */
+#define LIN_DEFAULT_STEP 256
+
+/*
+ * Resizing policies as parenthesized expressions. LIN_* read step from scope.
+ */
+
+/* If needed is greater than existing, give twice needed. */
+#define EXPN_UP( existing, needed ) \
+		( (needed) > (existing) ? ((needed)<<1) : (existing) )
+	
+/* If needed is less than 1 quarter existing, give twice needed. */
+#define EXPN_DOWN( existing, needed ) \
+		( (needed) < ((existing)>>2) ? ((needed)<<1) : (existing) )
+
+/* If needed is greater than existing, give needed plus step. */
+#define LIN_UP( existing, needed ) \
+	( (needed) > (existing) ? ((needed)+step) : (existing) )
+
+/* If needed is less than existing - 2 * step then give needed plus step. */
+#define LIN_DOWN( existing, needed ) \
+	( (needed) < ((existing)-(step<<1)) ? ((needed)+step) : (existing) )
+
+/* Return existing. */
+#define CONST_UP( existing, needed ) (existing)
+
+/* Return existing. */
+#define CONST_DOWN( existing, needed ) (existing)
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class ResizeLin
+ * \brief Linear table resizer.
+ *
+ * When an up resize or a down resize is needed, ResizeLin allocates the space
+ * needed plus some user defined step. The result is that when growing the
+ * vector in a linear fashion, the number of resizes is also linear.
+ *
+ * If only up resizing is done, then there will never be more than step unused
+ * spaces in the vector. If down resizing is done as well, there will never be
+ * more than 2*step unused spaces in the vector. The up resizing and down
+ * resizing policies are offset to improve performance when repeatedly
+ * inserting and removing a small number of elements relative to the step.
+ * This scheme guarantees that repetitive inserting and removing of a small
+ * number of elements will never result in repetitive reallocation.
+ *
+ * The vectors pass sizes to the resizer in units of T, so the step gets
+ * interpreted as units of T.
+ */
+
+/*@}*/
+
+/* Linear resizing with a step that can be changed at run time. */
+class ResizeLin
+{
+protected:
+	/**
+	 * \brief Default constructor.
+	 *
+	 * Initializes resize step to 256 units of the table type T.
+	 */
+	ResizeLin() : step(LIN_DEFAULT_STEP) { }
+
+	/**
+	 * \brief Determine the new table size when up resizing.
+	 *
+	 * If the existing size is insufficient for the space needed, then allocate
+	 * the space needed plus the step. The step is in units of T.
+	 */
+	inline long upResize( long existing, long needed )
+		{ return LIN_UP(existing, needed); }
+
+	/**
+	 * \brief Determine the new table size when down resizing.
+	 *
+	 * If space needed is less than the existing - 2*step, then allocate the
+	 * space needed plus the step. The step is in units of T.
+	 */
+	inline long downResize( long existing, long needed )
+		{ return LIN_DOWN(existing, needed); }
+
+public:
+	/**
+	 * \brief Step for linear resize.
+	 *
+	 * Amount of extra space in units of T added each time a resize must take
+	 * place. This may be changed at any time. The step should be >= 0.
+	 */
+	long step;
+};
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class ResizeCtLin
+ * \brief Linear table resizer with compile time step.
+ *
+ * When an up resize or a down resize is needed, ResizeCtLin allocates the
+ * space needed plus some compile time defined step. The result is that when
+ * growing the vector in a linear fashion, the number of resizes is also
+ * linear.
+ *
+ * If only up resizing is done, then there will never be more than step unused
+ * spaces in the vector. If down resizing is done as well, there will never be
+ * more than 2*step unused spaces in the vector. The up resizing and down
+ * resizing policies are offset to improve performance when repeatedly
+ * inserting and removing a small number of elements relative to the step.
+ * This scheme guarantees that repetitive inserting and removing of a small
+ * number of elements will never result in repetitive reallocation.
+ *
+ * The vectors pass sizes to the resizer in units of T, so the step gets
+ * interpreted as units of T.
+ */
+
+/*@}*/
+
+/* Linear resizing with the step fixed as a template argument. */
+template <long step> class ResizeCtLin
+{
+protected:
+	/**
+	 * \brief Determine the new table size when up resizing.
+	 *
+	 * If the existing size is insufficient for the space needed, then allocate
+	 * the space needed plus the step. The step is in units of T.
+	 */
+	inline long upResize( long existing, long needed )
+		{ return LIN_UP(existing, needed); }
+
+	/**
+	 * \brief Determine the new table size when down resizing.
+	 *
+	 * If space needed is less than the existing - 2*step, then allocate the
+	 * space needed plus the step. The step is in units of T.
+	 */
+	inline long downResize( long existing, long needed )
+		{ return LIN_DOWN(existing, needed); }
+};
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class ResizeConst
+ * \brief Constant table resizer.
+ *
+ * When an up resize is needed the existing size is always used. ResizeConst
+ * does not allow dynamic resizing. To use ResizeConst, the vector needs to be
+ * constructed with an initial allocation amount, otherwise it will be
+ * unusable.
+ */
+
+/*@}*/
+
+/* Constant table resizing: both routines hand back the existing size. */
+class ResizeConst
+{
+protected:
+	/* Asserts that no more than the existing size is needed, returns it. */
+	static inline long upResize( long existing, long needed );
+
+	/**
+	 * \brief Determine the new table size when down resizing.
+	 *
+	 * Always returns the existing table size.
+	 */
+	static inline long downResize( long existing, long needed )
+		{ return CONST_DOWN(existing, needed); }
+};
+
+/**
+ * \brief Determine the new table size when up resizing.
+ *
+ * Asserts that the existing size already covers the space needed, then
+ * returns the existing size unchanged.
+ */
+inline long ResizeConst::upResize( long existing, long needed )
+{	
+	assert( needed <= existing ); 
+	return CONST_UP(existing, needed); 
+}
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class ResizeRunTime
+ * \brief Run time settable table resizer.
+ *
+ * ResizeRunTime can have its up and down resizing policies set at run time.
+ * Both up and down policies can be set independently to one of Exponential,
+ * Linear, or Constant. See the documentation for ResizeExpn, ResizeLin, and
+ * ResizeConst for the details of the resizing policies. 
+ *
+ * The policies may be changed at any time. The default policies are
+ * both Exponential.
+ */
+
+/*@}*/
+
+/* Run time resizing: the policy for each direction is a data member. */
+class ResizeRunTime
+{
+protected:
+	/**
+	 * \brief Default constructor.
+	 *
+	 * The up and down resizing is initialized to Exponential. The step
+	 * defaults to 256 units of T.
+	 */
+	inline ResizeRunTime();
+
+	/**
+	 * \brief Resizing policies.
+	 */
+	enum ResizeType {
+		Exponential,  /*!< Exponential resizing. */
+		Linear,       /*!< Linear resizing. */
+		Constant      /*!< Constant table size. */
+	};
+
+	inline long upResize( long existing, long needed );
+	inline long downResize( long existing, long needed );
+
+public:
+	/**
+	 * \brief Step for linear resize.
+	 *
+	 * Amount of extra space in units of T added each time a resize must take
+	 * place. This may be changed at any time. The step should be >= 0.
+	 */
+	long step;
+
+	/**
+	 * \brief Up resizing policy.
+	 */
+	ResizeType upResizeType;
+
+	/**
+	 * \brief Down resizing policy.
+	 */
+	ResizeType downResizeType;
+};
+
+/* Default policy: exponential in both directions. The step is still set to
+ * LIN_DEFAULT_STEP so that it is defined if a Linear policy is chosen. */
+inline ResizeRunTime::ResizeRunTime()
+	: step( LIN_DEFAULT_STEP ),
+	  upResizeType( Exponential ),
+	  downResizeType( Exponential )
+{ }
+
+/**
+ * \brief Determine the new table size when up resizing.
+ *
+ * The policy is chosen by upResizeType: Exponential doubles the space needed,
+ * Linear adds step to it, Constant asserts that existing already suffices.
+ * \returns The table size to use; existing when no growth is required.
+ */
+inline long ResizeRunTime::upResize( long existing, long needed )
+{
+	switch ( upResizeType ) {
+	case Exponential:
+		return EXPN_UP(existing, needed);
+	case Linear:
+		return LIN_UP(existing, needed);
+	case Constant:
+		assert( needed <= existing ); 
+		return CONST_UP(existing, needed);
+	}
+	return 0;   /* only reached if upResizeType holds no listed policy */
+}
+
+/**
+ * \brief Determine the new table size when down resizing.
+ *
+ * The policy is selected by downResizeType. Exponential, Linear and Constant
+ * shrink the table the same way ResizeExpn, ResizeLin and ResizeConst do,
+ * respectively.
+ */
+inline long ResizeRunTime::downResize( long existing, long needed )
+{
+	long size = 0;
+	if ( downResizeType == Exponential )
+		size = EXPN_DOWN(existing, needed);
+	else if ( downResizeType == Linear )
+		size = LIN_DOWN(existing, needed);
+	else if ( downResizeType == Constant )
+		size = CONST_DOWN(existing, needed);
+	/* Any value outside the three policies leaves the size at zero. */
+	return size;
+}
+
+/* Don't need these anymore. */
+#undef EXPN_UP
+#undef EXPN_DOWN
+#undef LIN_UP
+#undef LIN_DOWN
+#undef CONST_UP
+#undef CONST_DOWN
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_RESIZE_H */
diff --git a/aapl/sbstmap.h b/aapl/sbstmap.h
new file mode 100644
index 00000000..9436a472
--- /dev/null
+++ b/aapl/sbstmap.h
@@ -0,0 +1,121 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_SBSTMAP_H
+#define _AAPL_SBSTMAP_H
+
+#include "compare.h"
+#include "svector.h"
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \brief Element for SBstMap.
+ *
+ * Stores the key and value pair. 
+ */
+template <class Key, class Value> struct SBstMapEl
+{
+	SBstMapEl() {}                                 /* key and value defaulted */
+	SBstMapEl(const Key &key) : key(key) {}        /* value defaulted */
+	SBstMapEl(const Key &key, const Value &val) : key(key), value(val) {}
+
+	/** \brief The key */
+	Key key;
+
+	/** \brief The value. */
+	Value value;
+};
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+/**
+ * \addtogroup bst 
+ * @{
+ */
+
+/** 
+ * \class SBstMap
+ * \brief Copy-on-write binary search table for key and value pairs.
+ *
+ * This is a map style binary search table that employs the copy-on-write
+ * mechanism for table data. SBstMap stores key and value pairs in each
+ * element. The key and value can be any type. A compare class for the key
+ * must be supplied.
+ */
+
+/*@}*/
+
+#define BST_TEMPL_DECLARE class Key, class Value, \
+		class Compare = CmpOrd<Key>, class Resize = ResizeExpn  /* with defaults */
+#define BST_TEMPL_DEF class Key, class Value, class Compare, class Resize  /* without defaults */
+#define BST_TEMPL_USE Key, Value, Compare, Resize  /* matching argument list */
+#define GET_KEY(el) ((el).key)          /* the key is a member of the element */
+#define BstTable SBstMap                /* name of the table class to define */
+#define Vector SVector                  /* vector name substituted into bstcommon.h */
+#define Table STable                    /* table name substituted into bstcommon.h */
+#define Element SBstMapEl<Key, Value>   /* element type stored in the table */
+#define BSTMAP                          /* NOTE(review): presumably selects map-specific code in bstcommon.h -- confirm */
+#define SHARED_BST                      /* NOTE(review): presumably selects shared-table code in bstcommon.h -- confirm */
+/* The shared implementation is instantiated under the names set above. */
+#include "bstcommon.h"
+/* Remove the configuration so another table header can set its own. */
+#undef BST_TEMPL_DECLARE
+#undef BST_TEMPL_DEF
+#undef BST_TEMPL_USE
+#undef GET_KEY
+#undef BstTable
+#undef Vector
+#undef Table
+#undef Element
+#undef BSTMAP
+#undef SHARED_BST
+
+/**
+ * \fn SBstMap::insert(const Key &key, SBstMapEl<Key, Value> **lastFound)
+ * \brief Insert the given key.
+ *
+ * If the given key does not already exist in the table then a new element
+ * having key is inserted. The key copy constructor and value default
+ * constructor are used to place the pair in the table. If lastFound is given,
+ * it is set to the new entry created. If the insert fails then lastFound is
+ * set to the existing pair of the same key.
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+
+/**
+ * \fn SBstMap::insertMulti(const Key &key)
+ * \brief Insert the given key even if it exists already.
+ *
+ * If the key exists already then the new element having key is placed next
+ * to some other pair of the same key. InsertMulti cannot fail. The key copy
+ * constructor and the value default constructor are used to place the pair in
+ * the table.
+ *
+ * \returns The new element created.
+ */
+
+#endif /* _AAPL_SBSTMAP_H */
diff --git a/aapl/sbstset.h b/aapl/sbstset.h
new file mode 100644
index 00000000..fe8ddf6c
--- /dev/null
+++ b/aapl/sbstset.h
@@ -0,0 +1,94 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_SBSTSET_H
+#define _AAPL_SBSTSET_H
+
+/**
+ * \addtogroup bst 
+ * @{
+ */
+
+/** 
+ * \class SBstSet
+ * \brief Copy-on-write binary search table for types that are the key.
+ *
+ * This is a set style binary search table that employs the copy-on-write
+ * mechanism for storing table data. SBstSet is suitable for types that
+ * comprise the entire key. Rather than look into the element to retrieve the
+ * key, the element is the key.  A class that contains a comparison routine
+ * for the key must be given.
+ */
+
+/*@}*/
+
+#include "compare.h"
+#include "svector.h"
+
+#define BST_TEMPL_DECLARE class Key, class Compare = CmpOrd<Key>, \
+		class Resize = ResizeExpn
+#define BST_TEMPL_DEF class Key, class Compare, class Resize
+#define BST_TEMPL_USE Key, Compare, Resize
+#define GET_KEY(el) (el)
+#define BstTable SBstSet
+#define Vector SVector
+#define Table STable
+#define Element Key
+#define BSTSET
+#define SHARED_BST
+
+#include "bstcommon.h"
+
+#undef BST_TEMPL_DECLARE
+#undef BST_TEMPL_DEF
+#undef BST_TEMPL_USE
+#undef GET_KEY
+#undef BstTable
+#undef Vector
+#undef Table
+#undef Element
+#undef BSTSET
+#undef SHARED_BST
+
+/**
+ * \fn SBstSet::insert(const Key &key, Key **lastFound)
+ * \brief Insert the given key.
+ *
+ * If the given key does not already exist in the table then it is inserted.
+ * The key's copy constructor is used to place the item in the table. If
+ * lastFound is given, it is set to the new entry created. If the insert fails
+ * then lastFound is set to the existing key of the same value.
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+
+/**
+ * \fn SBstSet::insertMulti(const Key &key)
+ * \brief Insert the given key even if it exists already.
+ *
+ * If the key exists already then it is placed next to some other key of the
+ * same value. InsertMulti cannot fail. The key's copy constructor is used to
+ * place the item in the table.
+ *
+ * \returns The new element created.
+ */
+
+#endif /* _AAPL_SBSTSET_H */
diff --git a/aapl/sbsttable.h b/aapl/sbsttable.h
new file mode 100644
index 00000000..100b87ec
--- /dev/null
+++ b/aapl/sbsttable.h
@@ -0,0 +1,93 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_SBSTTABLE_H
+#define _AAPL_SBSTTABLE_H
+
+#include "compare.h"
+#include "svector.h"
+
+/**
+ * \addtogroup bst 
+ * @{
+ */
+
+/** 
+ * \class SBstTable
+ * \brief Copy-on-write binary search table for structures that contain a key.
+ *
+ * This is a basic binary search table that employs a copy-on-write data
+ * storage mechanism. It can be used to contain a structure that has a key and
+ * possibly some data. The key should be a member of the element class and
+ * accessible with getKey(). A class containing the compare routine must be
+ * supplied.
+ */
+
+/*@}*/
+
+#define BST_TEMPL_DECLARE class Element, class Key, \
+		class Compare = CmpOrd<Key>, class Resize = ResizeExpn
+#define BST_TEMPL_DEF class Element, class Key, class Compare, class Resize
+#define BST_TEMPL_USE Element, Key, Compare, Resize
+#define GET_KEY(el) ((el).getKey())
+#define BstTable SBstTable
+#define Vector SVector
+#define Table STable
+#define BSTTABLE
+#define SHARED_BST
+
+#include "bstcommon.h"
+
+#undef BST_TEMPL_DECLARE
+#undef BST_TEMPL_DEF
+#undef BST_TEMPL_USE
+#undef GET_KEY
+#undef BstTable
+#undef Vector
+#undef Table
+#undef BSTTABLE
+#undef SHARED_BST
+
+/**
+ * \fn SBstTable::insert(const Key &key, Element **lastFound)
+ * \brief Insert a new element with the given key.
+ *
+ * If the given key does not already exist in the table a new element is
+ * inserted with the given key. A constructor taking only const Key& is used
+ * to initialize the new element. If lastFound is given, it is set to the new
+ * element created. If the insert fails then lastFound is set to the existing
+ * element with the same key. 
+ *
+ * \returns The new element created upon success, null upon failure.
+ */
+
+/**
+ * \fn SBstTable::insertMulti(const Key &key)
+ * \brief Insert a new element even if the key exists already.
+ *
+ * If the key exists already then the new element is placed next to some
+ * element with the same key. InsertMulti cannot fail. A constructor taking
+ * only const Key& is used to initialize the new element.
+ *
+ * \returns The new element created.
+ */
+
+#endif /* _AAPL_SBSTTABLE_H */
diff --git a/aapl/svector.h b/aapl/svector.h
new file mode 100644
index 00000000..db3a5656
--- /dev/null
+++ b/aapl/svector.h
@@ -0,0 +1,1350 @@
+/*
+ *  Copyright 2002, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_SVECTOR_H
+#define _AAPL_SVECTOR_H
+
+#include <new>
+#include <string.h>
+#include <stdlib.h>
+#include <assert.h>
+#include "table.h"
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class SVector
+ * \brief Copy-on-write dynamic array.
+ *
+ * SVector is a variant of Vector that employs copy-on-write behaviour. The
+ * SVector copy constructor and = operator make shallow copies. If a vector
+ * that references shared data is modified with insert, replace, append,
+ * prepend, setAs or remove, a new copy is made so as not to interfere with
+ * the shared data. However, shared individual elements may be modified by
+ * bypassing the SVector interface.
+ *
+ * SVector is a dynamic array that can be used to contain complex data
+ * structures that have constructors and destructors as well as simple types
+ * such as integers and pointers.
+ *
+ * SVector supports inserting, overwriting, and removing single or multiple
+ * elements at once. Constructors and destructors are called wherever
+ * appropriate.  For example, before an element is overwritten, its
+ * destructor is called.
+ *
+ * SVector provides automatic resizing of allocated memory as needed and
+ * offers different allocation schemes for controlling how the automatic
+ * allocation is done.  Two senses of the length of the data are
+ * maintained: the amount of raw memory allocated to the vector and the number
+ * of actual elements in the vector. The various allocation schemes control
+ * how the allocated space is changed in relation to the number of elements in
+ * the vector.
+ */
+
+/*@}*/
+
+/* SVector: dynamic array over STable<T> whose copies share one refcounted buffer. */
+template < class T, class Resize = ResizeExpn > class SVector :
+	public STable<T>, public Resize
+{
+private:
+	typedef STable<T> BaseTable;
+
+public:
+	/**
+	 * \brief Initialize an empty vector with no space allocated.
+	 *
+	 * If a linear resizer is used, the step defaults to 256 units of T. For a
+	 * runtime vector both up and down allocation schemes default to
+	 * Exponential.
+	 */
+	SVector() { }
+
+	/**
+	 * \brief Create a vector that contains an initial element.
+	 *
+	 * The vector becomes one element in length. The element's copy
+	 * constructor is used to place the value in the vector.
+	 */
+	SVector(const T &val)             { setAs(&val, 1); }
+
+	/**
+	 * \brief Create a vector that contains an array of elements.
+	 *
+	 * The vector becomes len elements in length.  Copy constructors are used
+	 * to place the new elements in the vector.
+	 */
+	SVector(const T *val, long len)   { setAs(val, len); }
+
+	/* Shallow copy: shares v's data and increments its reference count. */
+	SVector( const SVector &v );
+
+	/**
+	 * \brief Release the vector's reference to its data.
+	 *
+	 * Calls empty(): if no other vector shares the data, destructors are called
+	 * on all elements and the space allocated for the vector is freed.
+	 */
+	~SVector() { empty(); }
+
+	/* Drop this vector's reference; elements are destroyed only if it was the last. */
+	void empty();
+
+	/**
+	 * \brief Deep copy another vector into this vector.
+	 *
+	 * Copies the entire contents of the other vector into this vector. Any
+	 * existing contents are first deleted. Equivalent to setAs.
+	 */
+	void deepCopy( const SVector &v )     { setAs(v.data, v.length()); }
+
+	/* Perform a shallow copy of another vector. */
+	SVector &operator=( const SVector &v );
+
+
+	/*@{*/
+	/**
+	 * \brief Insert one element at position pos.
+	 *
+	 * Elements in the vector from pos onward are shifted one space to the
+	 * right. The copy constructor is used to place the element into this
+	 * vector. If pos is greater than the length of the vector then undefined
+	 * behaviour results. If pos is negative then it is treated as an offset
+	 * relative to the length of the vector.
+	 */
+	void insert(long pos, const T &val)     { insert(pos, &val, 1); }
+
+	/* Insert an array of values. */
+	void insert(long pos, const T *val, long len);
+
+	/**
+	 * \brief Insert all the elements from another vector at position pos.
+	 *
+	 * Elements in this vector from pos onward are shifted v.length() spaces
+	 * to the right. The element's copy constructor is used to copy the items
+	 * into this vector. The other vector is left unchanged. If pos is off the
+	 * end of the vector, then undefined behaviour results. If pos is negative
+	 * then it is treated as an offset relative to the length of the vector.
+	 * Equivalent to vector.insert(pos, other.data, other.length()).
+	 */
+	void insert(long pos, const SVector &v) { insert(pos, v.data, v.length()); }
+
+	/* Insert len copies of val into the vector. */
+	void insertDup(long pos, const T &val, long len);
+
+	/**
+	 * \brief Insert one new element using the default constructor.
+	 *
+	 * Elements in the vector from pos onward are shifted one space to the right.
+	 * The default constructor is used to init the new element. If pos is greater
+	 * than the length of the vector then undefined behaviour results. If pos is
+	 * negative then it is treated as an offset relative to the length of the
+	 * vector.
+	 */
+	void insertNew(long pos)                { insertNew(pos, 1); }
+
+	/* Insert len new items using default constructor. */
+	void insertNew(long pos, long len);
+	/*@}*/
+
+	/*@{*/
+	/**
+	 * \brief Remove one element at position pos.
+	 *
+	 * The element's destructor is called. Elements to the right of pos are
+	 * shifted one space to the left to take up the free space. If pos is greater
+	 * than or equal to the length of the vector then undefined behavior results.
+	 * If pos is negative then it is treated as an offset relative to the length
+	 * of the vector.
+	 */
+	void remove(long pos)                   { remove(pos, 1); }
+
+	/* Delete a number of elements. */
+	void remove(long pos, long len);
+	/*@}*/
+
+	/*@{*/
+	/**
+	 * \brief Replace one element at position pos.
+	 *
+	 * If there is an existing element at position pos (if pos is less than the
+	 * length of the vector) then its destructor is called before the space is
+	 * used. The copy constructor is used to place the element into the vector.
+	 * If pos is greater than the length of the vector then undefined behaviour
+	 * results.  If pos is negative then it is treated as an offset relative to
+	 * the length of the vector.
+	 */
+	void replace(long pos, const T &val)     { replace(pos, &val, 1); }
+
+	/* Replace with an array of values. */
+	void replace(long pos, const T *val, long len);
+
+	/**
+	 * \brief Replace at position pos with all the elements of another vector.
+	 *
+	 * Replace at position pos with all the elements of another vector. The other
+	 * vector is left unchanged. If there are existing elements at the positions
+	 * to be replaced, then destructors are called before the space is used. Copy
+	 * constructors are used to place the elements into this vector. It is
+	 * allowable for the pos and length of the other vector to specify a
+	 * replacement that overwrites existing elements and creates new ones.  If pos
+	 * is greater than the length of the vector then undefined behaviour results.
+	 * If pos is negative, then it is treated as an offset relative to the length
+	 * of the vector.
+	 */
+	void replace(long pos, const SVector &v) { replace(pos, v.data, v.length()); }
+
+	/* Replace len items with len copies of val. */
+	void replaceDup(long pos, const T &val, long len);
+
+	/**
+	 * \brief Replace at position pos with one new element.
+	 *
+	 * If there is an existing element at the position to be replaced (pos is
+	 * less than the length of the vector) then the element's destructor is
+	 * called before the space is used. The default constructor is used to
+	 * initialize the new element. If pos is greater than the length of the
+	 * vector then undefined behaviour results. If pos is negative, then it is
+	 * treated as an offset relative to the length of the vector.
+	 */
+	void replaceNew(long pos)                { replaceNew(pos, 1); }
+
+	/* Replace len items at pos with newly constructed objects. */
+	void replaceNew(long pos, long len);
+	/*@}*/
+
+	/*@{*/
+
+	/**
+	 * \brief Set the contents of the vector to be val exactly.
+	 *
+	 * The vector becomes one element in length. Destructors are called on any
+	 * existing elements in the vector. The element's copy constructor is used to
+	 * place the val in the vector.
+	 */
+	void setAs(const T &val)             { setAs(&val, 1); }
+
+	/* Set to the contents of an array. */
+	void setAs(const T *val, long len);
+
+	/**
+	 * \brief Set the vector to exactly the contents of another vector.
+	 *
+	 * The vector becomes v.length() elements in length. Destructors are called
+	 * on any existing elements. Copy constructors are used to place the new
+	 * elements in the vector.
+	 */
+	void setAs(const SVector &v)         { setAs(v.data, v.length()); }
+
+	/* Set as len copies of item. */
+	void setAsDup(const T &item, long len);
+
+	/**
+	 * \brief Set the vector to exactly one new item.
+	 *
+	 * The vector becomes one element in length. Destructors are called on any
+	 * existing elements in the vector. The default constructor is used to
+	 * init the new item.
+	 */
+	void setAsNew()                      { setAsNew(1); }
+
+	/* Set as newly constructed objects using the default constructor. */
+	void setAsNew(long len);
+	/*@}*/
+
+	/*@{*/
+	/**
+	 * \brief Append one element to the end of the vector.
+	 *
+	 * Copy constructor is used to place the element in the vector.
+	 */
+	void append(const T &val)                { replace(BaseTable::length(), &val, 1); }
+
+	/**
+	 * \brief Append len elements to the end of the vector.
+	 *
+	 * Copy constructors are used to place the elements in the vector.
+	 */
+	void append(const T *val, long len)       { replace(BaseTable::length(), val, len); }
+
+	/**
+	 * \brief Append the contents of another vector.
+	 *
+	 * The other vector is left unchanged. Copy constructors are used to place
+	 * the elements in the vector.
+	 */
+	void append(const SVector &v)            
+			{ replace(BaseTable::length(), v.data, v.length()); }
+
+	/**
+	 * \brief Append len copies of item.
+	 *
+	 * The copy constructor is used to place the item in the vector.
+	 */
+	void appendDup(const T &item, long len)   { replaceDup(BaseTable::length(), item, len); }
+
+	/**
+	 * \brief Append a single newly created item.
+	 *
+	 * The new element is initialized with the default constructor.
+	 */
+	void appendNew()                         { replaceNew(BaseTable::length(), 1); }
+
+	/**
+	 * \brief Append len newly created items.
+	 *
+	 * The new elements are initialized with the default constructor.
+	 */
+	void appendNew(long len)                  { replaceNew(BaseTable::length(), len); }
+	/*@}*/
+
+
+	/*@{*/
+	/**
+	 * \brief Prepend one element to the front of the vector.
+	 *
+	 * Copy constructor is used to place the element in the vector.
+	 */
+	void prepend(const T &val)               { insert(0, &val, 1); }
+
+	/**
+	 * \brief Prepend len elements to the front of the vector.
+	 *
+	 * Copy constructors are used to place the elements in the vector.
+	 */
+	void prepend(const T *val, long len)      { insert(0, val, len); }
+
+	/**
+	 * \brief Prepend the contents of another vector.
+	 *
+	 * The other vector is left unchanged. Copy constructors are used to place
+	 * the elements in the vector.
+	 */
+	void prepend(const SVector &v)           { insert(0, v.data, v.length()); }
+
+	/**
+	 * \brief Prepend len copies of item.
+	 *
+	 * The copy constructor is used to place the item in the vector.
+	 */
+	void prependDup(const T &item, long len)  { insertDup(0, item, len); }
+
+	/**
+	 * \brief Prepend a single newly created item.
+	 *
+	 * The new element is initialized with the default constructor.
+	 */
+	void prependNew()                        { insertNew(0, 1); }
+
+	/**
+	 * \brief Prepend len newly created items.
+	 *
+	 * The new elements are initialized with the default constructor.
+	 */
+	void prependNew(long len)                 { insertNew(0, len); }
+	/*@}*/
+
+	/* Convenience access: unchecked indexing into data, and length() under another name. */
+	T &operator[](int i) const { return BaseTable::data[i]; }
+	long size() const           { return BaseTable::length(); }
+
+	/* Tag classes used to construct or assign an Iter at a chosen position. */
+	struct Iter;
+	struct IterFirst { IterFirst( const SVector &v ) : v(v) { } const SVector &v; };
+	struct IterLast { IterLast( const SVector &v ) : v(v) { } const SVector &v; };
+	struct IterNext { IterNext( const Iter &i ) : i(i) { } const Iter &i; };
+	struct IterPrev { IterPrev( const Iter &i ) : i(i) { } const Iter &i; };
+
+	/**
+	 * \brief Shared Vector Iterator.
+	 * \ingroup iterators
+	 */
+	struct Iter
+	{
+		/* Default construct with all three pointers null. */
+		Iter() : ptr(0), ptrBeg(0), ptrEnd(0) { }
+
+		/* Construct. */
+		Iter( const SVector &v );
+		Iter( const IterFirst &vf );
+		Iter( const IterLast &vl );
+		inline Iter( const IterNext &vn );
+		inline Iter( const IterPrev &vp );
+
+		/* Assign. */
+		Iter &operator=( const SVector &v );
+		Iter &operator=( const IterFirst &vf );
+		Iter &operator=( const IterLast &vl );
+		inline Iter &operator=( const IterNext &vf );
+		inline Iter &operator=( const IterPrev &vl );
+
+		/** \brief Less than end? */
+		bool lte() const { return ptr != ptrEnd; }
+
+		/** \brief At end? */
+		bool end() const { return ptr == ptrEnd; }
+
+		/** \brief Greater than beginning? */
+		bool gtb() const { return ptr != ptrBeg; }
+
+		/** \brief At beginning? */
+		bool beg() const { return ptr == ptrBeg; }
+
+		/** \brief At first element? */
+		bool first() const { return ptr == ptrBeg+1; }
+
+		/** \brief At last element? */
+		bool last() const { return ptr == ptrEnd-1; }
+
+		/* Zero-based position (ptrBeg is one before the first element); indexing is relative to ptr. */
+		long pos() const { return ptr - ptrBeg - 1; }
+		T &operator[](int i) const { return ptr[i]; }
+
+		/** \brief Implicit cast to T*. */
+		operator T*() const   { return ptr; }
+
+		/** \brief Dereference operator returns T&. */
+		T &operator *() const { return *ptr; }
+
+		/** \brief Arrow operator returns T*. */
+		T *operator->() const { return ptr; }
+
+		/** \brief Move to next item. */
+		T *operator++()       { return ++ptr; }
+
+		/** \brief Move to next item. */
+		T *operator++(int)    { return ptr++; }
+
+		/** \brief Move to next item. */
+		T *increment()        { return ++ptr; }
+
+		/** \brief Move to previous item. */
+		T *operator--()       { return --ptr; }
+
+		/** \brief Move to previous item. */
+		T *operator--(int)    { return ptr--; }
+
+		/** \brief Move to previous item. */
+		T *decrement()        { return --ptr; }
+
+		/** \brief Return the next item. Does not modify this. */
+		inline IterNext next() const { return IterNext(*this); }
+
+		/** \brief Return the previous item. Does not modify this. */
+		inline IterPrev prev() const { return IterPrev(*this); }
+
+		/** \brief The iterator is simply a pointer. */
+		T *ptr;
+
+		/* Endpoints: one before the first and one past the last element (all null when empty). */
+		T *ptrBeg, *ptrEnd;
+	};
+
+	/** \brief Return a tag from which an Iter on the first element can be built. */
+	IterFirst first() { return IterFirst( *this ); }
+
+	/** \brief Return a tag from which an Iter on the last element can be built. */
+	IterLast last() { return IterLast( *this ); }
+
+protected:
+ 	void makeRawSpaceFor(long pos, long len);
+
+	void setAsCommon(long len);
+	long replaceCommon(long pos, long len);
+	long insertCommon(long pos, long len);
+	/* Allocation helpers. The Dup variants malloc a separate block instead of using realloc. */
+	void upResize(long len);
+	void upResizeDup(long len);
+	void upResizeFromEmpty(long len);
+	void downResize(long len);
+	void downResizeDup(long len);
+};
+
+/**
+ * \brief Construct a vector that shares the storage of another vector.
+ *
+ * No elements are copied; the other vector's refcount is incremented instead.
+ */
+template <class T, class Resize> SVector<T, Resize>::
+		SVector(const SVector<T, Resize> &v)
+{
+	/* Start out empty, which is also the result when v owns no storage. */
+	BaseTable::data = 0;
+	if ( v.data != 0 ) {
+		/* The header sits immediately before the element storage. */
+		STabHead *shared = ((STabHead*) v.data) - 1;
+		shared->refCount++;
+		/* Point at the same elements the source points at. */
+		BaseTable::data = (T*) (shared + 1);
+	}
+}
+
+/**
+ * \brief Shallow copy another vector into this vector.
+ *
+ * Takes a reference to the other vector. The contents of this vector are
+ * first emptied. Assigning a vector to itself leaves it unchanged.
+ *
+ * \returns A reference to this.
+ */
+template <class T, class Resize> SVector<T, Resize> &
+		SVector<T, Resize>:: operator=( const SVector &v )
+{
+	/* Assigning a vector to itself, or to one already sharing the same
+	 * storage, must be a no-op: emptying first could free the only copy. */
+	if ( BaseTable::data != v.data ) {
+		/* Release whatever this vector currently references (data becomes 0). */
+		empty();
+		if ( v.data != 0 ) {
+			/* Take a reference on the source header and share its data. */
+			STabHead *srcHead = ((STabHead*) v.data) - 1;
+			srcHead->refCount += 1;
+			BaseTable::data = (T*) (srcHead + 1);
+		}
+	}
+	return *this;
+}
+
+/* Build an iterator positioned on the first element of a vector. */
+template <class T, class Resize> SVector<T, Resize>::
+		Iter::Iter( const SVector &v )
+{
+	/* A missing table is treated the same as a table of length zero. */
+	long count = v.data != 0 ? (((STabHead*)v.data)-1)->tabLen : 0;
+	if ( count != 0 ) {
+		ptr = v.data;
+		ptrBeg = v.data - 1;
+		ptrEnd = v.data + count;
+	}
+	else ptr = ptrBeg = ptrEnd = 0;
+}
+
+/* Build an iterator on the first element of the tagged vector (all null if empty). */
+template <class T, class Resize> SVector<T, Resize>::
+		Iter::Iter( const IterFirst &vf )
+{
+	ptr = ptrBeg = ptrEnd = 0;
+	T *base = vf.v.data;
+	long count = base != 0 ? (((STabHead*)base)-1)->tabLen : 0;
+	if ( count != 0 ) {
+		ptr = base;
+		ptrBeg = base - 1;
+		ptrEnd = base + count;
+	}
+}
+
+/* Build an iterator on the last element of the tagged vector (all null if empty). */
+template <class T, class Resize> SVector<T, Resize>::
+		Iter::Iter( const IterLast &vl )
+{
+	long count = vl.v.data == 0 ? 0 : (((STabHead*)vl.v.data)-1)->tabLen;
+	if ( count == 0 ) {
+		ptr = ptrBeg = ptrEnd = 0;
+		return;
+	}
+	ptrBeg = vl.v.data - 1;
+	ptrEnd = vl.v.data + count;
+	ptr = ptrEnd - 1;
+}
+
+/* Build an iterator one element past the position of another iterator. */
+template <class T, class Resize> SVector<T, Resize>::
+		Iter::Iter( const IterNext &vn )
+{
+	/* Same endpoints as the source iterator, position advanced by one. */
+	ptrBeg = vn.i.ptrBeg;
+	ptrEnd = vn.i.ptrEnd;
+	ptr = vn.i.ptr + 1;
+}
+
+/* Build an iterator one element before the position of another iterator. */
+template <class T, class Resize> SVector<T, Resize>::
+		Iter::Iter( const IterPrev &vp )
+{
+	/* Same endpoints as the source iterator, position moved back by one. */
+	ptrBeg = vp.i.ptrBeg;
+	ptrEnd = vp.i.ptrEnd;
+	ptr = vp.i.ptr - 1;
+}
+
+/* Reposition this iterator on the first element of a vector (all null if empty). */
+template <class T, class Resize> typename SVector<T, Resize>::Iter &
+		SVector<T, Resize>::Iter::operator=( const SVector &v )
+{
+	long count = v.data != 0 ? (((STabHead*)v.data)-1)->tabLen : 0;
+	if ( count != 0 ) {
+		ptrBeg = v.data - 1;
+		ptrEnd = v.data + count;
+		ptr = v.data;
+	}
+	else
+		ptr = ptrBeg = ptrEnd = 0;
+	return *this;
+}
+
+/* Reposition this iterator on the first element of the tagged vector. */
+template <class T, class Resize> typename SVector<T, Resize>::Iter &
+		SVector<T, Resize>::Iter::operator=( const IterFirst &vf )
+{
+	T *base = vf.v.data;
+	if ( base == 0 || (((STabHead*)base)-1)->tabLen == 0 ) {
+		ptr = ptrBeg = ptrEnd = 0;
+		return *this;
+	}
+	ptr = base;
+	ptrBeg = base - 1;
+	ptrEnd = base + (((STabHead*)base)-1)->tabLen;
+	return *this;
+}
+
+/* Reposition this iterator on the last element of the tagged vector. */
+template <class T, class Resize> typename SVector<T, Resize>::Iter &
+		SVector<T, Resize>::Iter::operator=( const IterLast &vl )
+{
+	long count = vl.v.data == 0 ? 0 : (((STabHead*)vl.v.data)-1)->tabLen;
+	if ( count == 0 )
+		ptr = ptrBeg = ptrEnd = 0;
+	else {
+		ptrBeg = vl.v.data - 1;
+		ptrEnd = vl.v.data + count;
+		ptr = ptrEnd - 1;
+	}
+	return *this;
+}
+
+/* Reposition this iterator one element past another iterator. */
+template <class T, class Resize> typename SVector<T, Resize>::Iter &
+		SVector<T, Resize>::Iter::operator=( const IterNext &vn )
+{
+	ptrBeg = vn.i.ptrBeg;
+	ptrEnd = vn.i.ptrEnd;
+	ptr = vn.i.ptr + 1;
+	return *this;
+}
+
+/* Reposition this iterator one element before another iterator. */
+template <class T, class Resize> typename SVector<T, Resize>::Iter &
+		SVector<T, Resize>::Iter::operator=( const IterPrev &vp )
+{
+	ptrBeg = vp.i.ptrBeg;
+	ptrEnd = vp.i.ptrEnd;
+	ptr = vp.i.ptr - 1;
+	return *this;
+}
+
+/* Up resize the data for len elements using Resize::upResize to tell us the
+ * new length. Reads and writes allocLen. Does not read or write length.
+ * Assumes that there is some data allocated already. Throws std::bad_alloc. */
+template <class T, class Resize> void SVector<T, Resize>::
+		upResize(long len)
+{
+	/* Get the current header. */
+	STabHead *head = ((STabHead*)BaseTable::data) - 1;
+
+	/* Ask the resizer what the new length will be. */
+	long newLen = Resize::upResize(head->allocLen, len);
+
+	/* Did the data grow? */
+	if ( newLen > head->allocLen ) {
+		/* Grow the existing block. On failure realloc leaves the old block
+		 * intact, so the header must not be modified until it succeeds. */
+		head = (STabHead*) realloc( head, sizeof(STabHead) +
+				sizeof(T) * newLen );
+		if ( head == 0 )
+			throw std::bad_alloc();
+
+		/* Record the new capacity and save the (possibly moved) data pointer. */
+		head->allocLen = newLen;
+		BaseTable::data = (T*) (head + 1);
+	}
+}
+
+/* Allocates a new buffer for an up resize that requires a duplication of the
+ * data. Uses Resize::upResize to get the allocation length. Does not copy any
+ * elements. Drops one reference on the old data and writes refCount, allocLen
+ * and the new length in the new header. Assumes some data is allocated. */
+template <class T, class Resize> void SVector<T, Resize>::
+		upResizeDup(long len)
+{
+	/* Get the header of the shared data being detached from. */
+	STabHead *oldHead = ((STabHead*)BaseTable::data) - 1;
+
+	/* Ask the resizer what the new length will be. */
+	long newLen = Resize::upResize(oldHead->allocLen, len);
+
+	/* Allocate the private buffer before touching the shared header, so
+	 * that a failed allocation leaves this vector and its refcount intact. */
+	STabHead *head = (STabHead*) malloc( sizeof(STabHead) + sizeof(T) * newLen );
+	if ( head == 0 )
+		throw std::bad_alloc();
+
+	/* Nothing can fail now: detach from the old data, set up the new header. */
+	oldHead->refCount -= 1;
+	head->refCount = 1;
+	head->allocLen = newLen;
+	head->tabLen = len;
+
+	/* Save the data pointer. */
+	BaseTable::data = (T*) (head + 1);
+}
+
+/* Create the table for len elements, with Resize::upResize choosing the
+ * capacity. Writes refCount, allocLen and, unlike upResize, the length too.
+ * Assumes that no data is allocated. */
+template <class T, class Resize> void SVector<T, Resize>::
+		upResizeFromEmpty(long len)
+{
+	/* Nothing is allocated yet and a non-positive len needs no table. */
+	if ( len <= 0 )
+		return;
+
+	/* Let the resizer pick the capacity for a table growing from zero. */
+	long capacity = Resize::upResize(0, len);
+
+	/* Header and element storage live in one malloc'd block. */
+	size_t bytes = sizeof(STabHead) + sizeof(T) * capacity;
+	STabHead *fresh = (STabHead*) malloc( bytes );
+	if ( fresh == 0 )
+		throw std::bad_alloc();
+
+	/* Fill in the header, element count included. */
+	fresh->refCount = 1;
+	fresh->allocLen = capacity;
+	fresh->tabLen = len;
+	/* Publish the element storage that follows the header. */
+	BaseTable::data = (T*) (fresh + 1);
+}
+
+/* Shrink the allocation to suit len elements, with Resize::downResize choosing
+ * the new capacity. Reads and writes allocLen. Leaves the length untouched. */
+template <class T, class Resize> void SVector<T, Resize>::
+		downResize(long len)
+{
+	/* With no table allocated there is nothing to shrink. */
+	if ( BaseTable::data == 0 )
+		return;
+
+	/* The header sits directly in front of the elements. */
+	STabHead *hdr = ((STabHead*)BaseTable::data) - 1;
+
+	/* Let the resizer decide on the new capacity. */
+	long shrunk = Resize::downResize( hdr->allocLen, len );
+
+	/* Keep the current block unless the capacity really went down. */
+	if ( shrunk >= hdr->allocLen )
+		return;
+
+	if ( shrunk == 0 ) {
+		/* Nothing left to hold, release the whole block. */
+		free( hdr );
+		BaseTable::data = 0;
+		return;
+	}
+
+	/* Note the reduced capacity in the header first, then trim the block
+	 * with realloc, which carries the header along with the elements. */
+	hdr->allocLen = shrunk;
+	hdr = (STabHead*) realloc( hdr, sizeof(STabHead) + sizeof(T) * shrunk );
+	if ( hdr == 0 )
+		throw std::bad_alloc();
+
+	/* The block may have moved, so refresh the data pointer. */
+	BaseTable::data = (T*) (hdr + 1);
+}
+
+/* Allocate a new buffer for a down resize and duplication of the array.  The
+ * new array will be len long and allocation size will be determined using
+ * Resize::downResize with the old array's allocLen. Does not actually copy
+ * any data. Drops one reference on the old data; writes the new header. */
+template <class T, class Resize> void SVector<T, Resize>::
+		downResizeDup(long len)
+{
+	/* If there is already no length, then there is nothing we can do. */
+	if ( BaseTable::data != 0 ) {
+		/* Get the header of the shared data being detached from. */
+		STabHead *oldHead = ((STabHead*)BaseTable::data) - 1;
+
+		/* Ask the resizer what the new length will be. */
+		long newLen = Resize::downResize( oldHead->allocLen, len );
+
+		/* Allocate before detaching so a failure leaves the refcount intact. */
+		STabHead *head = (STabHead*) malloc( sizeof(STabHead) + sizeof(T) * newLen );
+		if ( head == 0 )
+			throw std::bad_alloc();
+
+		/* Detach from the old data now that nothing can fail. */
+		oldHead->refCount -= 1;
+
+		/* Set up the new header, including the new length. */
+		head->refCount = 1;
+		head->allocLen = newLen;
+		head->tabLen = len;
+
+		/* Save the data pointer. */
+		BaseTable::data = (T*) (head + 1);
+	}
+}
+
+/**
+ * \brief Free all memory used by the vector.
+ *
+ * The vector is reset to zero elements. If no other vector shares the data,
+ * destructors are called on all elements and the allocated space is freed.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		empty()
+{
+	/* An already empty vector owns nothing. */
+	if ( BaseTable::data == 0 )
+		return;
+
+	/* Give up this vector's reference on the buffer. */
+	STabHead *hdr = ((STabHead*) BaseTable::data) - 1;
+	hdr->refCount -= 1;
+
+	if ( hdr->refCount == 0 ) {
+		/* That was the last reference: destroy every element and release
+		 * the storage. */
+		T *item = BaseTable::data;
+		for ( long n = hdr->tabLen; n > 0; n--, item++ )
+			item->~T();
+
+		free( hdr );
+	}
+
+	/* Whether freed or still shared, the data is no longer ours. */
+	BaseTable::data = 0;
+}
+
+/* Get the vector ready to receive exactly len newly constructed elements.
+ * Reuses a privately owned buffer, detaches from a shared one, or allocates
+ * from nothing, as needed. Constructing the elements is left to the caller. */
+template <class T, class Resize> void SVector<T, Resize>::
+		setAsCommon(long len)
+{
+	/* The table is currently empty. Make enough space. This will set the
+	 * length. */
+	if ( BaseTable::data == 0 ) {
+		upResizeFromEmpty( len );
+		return;
+	}
+
+	/* The shared header sits immediately before the element data. */
+	STabHead *hdr = ((STabHead*)BaseTable::data) - 1;
+
+	/* Other vectors still reference the buffer: leave it to them and start
+	 * over with private storage. This will set the length. */
+	if ( hdr->refCount != 1 ) {
+		hdr->refCount -= 1;
+		BaseTable::data = 0;
+		upResizeFromEmpty( len );
+		return;
+	}
+
+	/* We are the only owner, so the space can be reused. Destroy the old
+	 * contents first. */
+	T *item = BaseTable::data;
+	for ( long i = 0; i < hdr->tabLen; item++, i++ )
+		item->~T();
+
+	/* Adjust the allocated length, in whichever direction the requested
+	 * length lies. */
+	if ( len < hdr->tabLen )
+		downResize( len );
+	else if ( len > hdr->tabLen )
+		upResize( len );
+
+	/* The resize may have moved the buffer or freed it entirely, so look
+	 * the header up again before recording the new length. */
+	if ( BaseTable::data != 0 ) {
+		hdr = ((STabHead*)BaseTable::data) - 1;
+		hdr->tabLen = len;
+	}
+}
+
+/**
+ * \brief Set the contents of the vector to be len elements exactly.
+ *
+ * The vector becomes len elements in length. If this vector is the sole owner
+ * of its data, destructors are called on the existing elements. The new
+ * elements are copy constructed from the array val.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		setAs(const T *val, long len)
+{
+	/* Drop the old contents and size the buffer for len elements. */
+	setAsCommon( len );
+
+	/* Copy construct each source element into its slot. The data pointer
+	 * is read only now, after setAsCommon has settled the buffer. */
+	T *const base = BaseTable::data;
+	for ( long i = 0; i < len; i++ )
+		new(base + i) T(val[i]);
+}
+
+
+/**
+ * \brief Set the vector to len copies of item.
+ *
+ * The vector becomes len elements in length. If this vector is the sole owner
+ * of its data, destructors are called on the existing elements. Each new
+ * element is copy constructed from item.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		setAsDup(const T &item, long len)
+{
+	/* Drop the old contents and size the buffer for len elements. */
+	setAsCommon( len );
+
+	/* Fill every slot with its own copy of item. */
+	T *slot = BaseTable::data;
+	for ( long left = len; left > 0; left--, slot++ )
+		new(slot) T(item);
+}
+
+/**
+ * \brief Set the vector to exactly len new items.
+ *
+ * The vector becomes len elements in length. If this vector is the sole owner
+ * of its data, destructors are called on the existing elements. Each new
+ * element is created with the default constructor.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		setAsNew(long len)
+{
+	/* Drop the old contents and size the buffer for len elements. */
+	setAsCommon( len );
+
+	/* Default construct the elements, front to back. */
+	T *slot = BaseTable::data;
+	for ( long made = 0; made < len; made++ )
+		new(slot++) T();
+}
+
+/* Prepare the vector for writing len items starting at pos. Reuses a
+ * privately owned buffer, detaches from a shared one, or grows from empty. */
+template <class T, class Resize> long SVector<T, Resize>::
+		replaceCommon(long pos, long len)
+{
+	if ( BaseTable::data != 0 ) {
+		/* The shared header sits immediately before the element data. */
+		STabHead *head = ((STabHead*)BaseTable::data) - 1;
+
+		/* A negative position counts back from the current length, and the
+		 * caller gets the resolved position back as the return value. This
+		 * is only done when there is existing data. */
+		if ( pos < 0 )
+			pos = head->tabLen + pos;
+
+		/* The end is the one past the last item that we want to write to. */
+		long i, endPos = pos + len;
+
+		if ( head->refCount == 1 ) {
+			/* Sole owner: the existing buffer can be reused in place. */
+			if ( endPos > head->tabLen ) {
+				upResize( endPos );
+
+				/* Get the header again, whose addr may have changed after
+				 * resizing. */
+				head = ((STabHead*)BaseTable::data) - 1;
+
+				/* Only [pos, tabLen) holds live objects; destroy those. */
+				T *item = BaseTable::data + pos;
+				for ( i = pos; i < head->tabLen; i++, item++ )
+					item->~T();
+		
+				/* We are extending the vector, set the new data length. */
+				head->tabLen = endPos;
+			}
+			else {
+				/* The range lies inside the vector; destroy all of it. */
+				T *item = BaseTable::data + pos;
+				for ( i = pos; i < endPos; i++, item++ )
+					item->~T();
+			}
+		}
+		else {
+			/* Shared buffer: the copy must hold max(endPos, old length). */
+			long newLen = endPos;
+			if ( newLen < head->tabLen )
+				newLen = head->tabLen;
+
+			/* Duplicate and grow up to newLen. This will set the length. */
+			upResizeDup( newLen );
+
+			/* head was not refetched, so it is the old header; copy [0, pos). */
+			const T *src = (T*) (head + 1);
+			T *dst = BaseTable::data;
+			for ( i = 0; i < pos; i++, dst++, src++)
+				new(dst) T(*src);
+
+			/* Skip the replaced range, then copy whatever follows it. */
+			for ( i += len, src += len, dst += len; 
+					i < head->tabLen; i++, dst++, src++ )
+				new(dst) T(*src);
+		}
+	}
+	else {
+		/* There is no data initially, must grow from zero. This will set the
+		 * new length. */
+		upResizeFromEmpty( len );
+	}
+
+	return pos;
+}
+
+
+/**
+ * \brief Replace len elements at position pos.
+ *
+ * If this vector is the sole owner of its data, existing elements in the
+ * replaced range are destroyed before the space is reused. Copy constructors
+ * are used to place the elements of val into the vector. The range may extend
+ * past the current end, overwriting existing elements and creating new ones.
+ * If pos is greater than the length of the vector then undefined behaviour
+ * results. If pos is negative, then it is treated as an offset relative to
+ * the length of the vector.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		replace(long pos, const T *val, long len)
+{
+	/* Clear out the target range and pick up the resolved position. */
+	pos = replaceCommon( pos, len );
+
+	/* Copy construct the incoming values over the raw slots. The data
+	 * pointer is read only now since replaceCommon may have moved it. */
+	T *const slot = BaseTable::data + pos;
+	for ( long i = 0; i < len; i++ )
+		new(slot + i) T(val[i]);
+}
+
+/**
+ * \brief Replace at position pos with len copies of an item.
+ *
+ * If this vector is the sole owner of its data, existing elements in the
+ * replaced range are destroyed before the space is reused. The copy
+ * constructor is used to place each copy of val into the vector. The range
+ * may extend past the current end, overwriting existing elements and creating
+ * new ones. If pos is greater than the length of the vector then undefined
+ * behaviour results. If pos is negative, then it is treated as an offset
+ * relative to the length of the vector.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		replaceDup(long pos, const T &val, long len)
+{
+	/* Clear out the target range and pick up the resolved position. */
+	pos = replaceCommon( pos, len );
+
+	/* Copy construct val into each slot of the range. */
+	T *slot = BaseTable::data + pos;
+	for ( long left = len; left > 0; left--, slot++ )
+		new(slot) T(val);
+}
+
+/**
+ * \brief Replace at position pos with len new elements.
+ *
+ * If this vector is the sole owner of its data, existing elements in the
+ * replaced range are destroyed before the space is reused. The default
+ * constructor is used to initialize the new elements. The range may extend
+ * past the current end, overwriting existing elements and creating new ones.
+ * If pos is greater than the length of the vector then undefined behaviour
+ * results. If pos is negative, then it is treated as an offset relative to
+ * the length of the vector.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		replaceNew(long pos, long len)
+{
+	/* Clear out the target range and pick up the resolved position. */
+	pos = replaceCommon( pos, len );
+
+	/* Default construct a new element in each slot of the range. */
+	T *slot = BaseTable::data + pos;
+	for ( long made = 0; made < len; made++ )
+		new(slot++) T();
+}
+
+/**
+ * \brief Remove len elements at position pos.
+ *
+ * Destructors are called on the removed elements when this vector is the sole
+ * owner of its data. Elements to the right of the removed range are shifted
+ * len spaces to the left. If pos is greater than or equal to the length of
+ * the vector then undefined behaviour results. If pos is negative then it is
+ * treated as an offset relative to the length of the vector.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		remove(long pos, long len)
+{
+	/* If there is no data, we can't delete anything anyways. */
+	if ( BaseTable::data == 0 )
+		return;
+
+	/* The shared header sits immediately before the element data. */
+	STabHead *hdr = ((STabHead*)BaseTable::data) - 1;
+
+	/* A negative position is taken as an offset from the current length,
+	 * e.g. -1 names the last element. */
+	if ( pos < 0 )
+		pos += hdr->tabLen;
+
+	/* endPos is one past the last removed item; newLen is the length once
+	 * those items are gone. */
+	const long endPos = pos + len;
+	const long newLen = hdr->tabLen - len;
+
+	if ( hdr->refCount != 1 ) {
+		/* The buffer is shared, so detach: get a private buffer sized for
+		 * newLen (this sets the length) and copy in only the survivors. */
+		downResizeDup( newLen );
+
+		/* hdr still refers to the old, shared buffer. */
+		const T *src = (T*) (hdr + 1);
+		T *dst = BaseTable::data;
+
+		/* Items in front of the removed range. */
+		long i = 0;
+		for ( ; i < pos; i++, dst++, src++ )
+			new(dst) T(*src);
+
+		/* Step over the removed range and copy the tail. */
+		src += len;
+		for ( i += len; i < hdr->tabLen; i++, src++, dst++ )
+			new(dst) T(*src);
+
+		/* The old buffer is left to its remaining owners. */
+		return;
+	}
+
+	/* Sole owner: edit the existing buffer in place. Start by destroying
+	 * the removed items. */
+	T *const gap = BaseTable::data + pos;
+	for ( long n = 0; n < len; n++ )
+		gap[n].~T();
+
+	/* Close the gap by sliding the tail down over it. The elements are
+	 * moved as raw bytes, without running constructors or destructors. */
+	const long tailLen = hdr->tabLen - endPos;
+	if ( len > 0 && tailLen > 0 )
+		memmove( gap, gap + len, sizeof(T) * tailLen );
+
+	/* Shrink the data if the resizer decides it is necessary. */
+	downResize( newLen );
+
+	/* The resize may have moved or freed the buffer; only record the new
+	 * length if there is still a header to hold it. */
+	if ( BaseTable::data != 0 ) {
+		hdr = ((STabHead*)BaseTable::data) - 1;
+		hdr->tabLen = newLen;
+	}
+}
+
+/* Open a gap of len raw slots at pos. Handles reusing existing space,
+ * detaching from shared space or growing from zero space. */
+template <class T, class Resize> long SVector<T, Resize>::
+		insertCommon(long pos, long len)
+{
+	/* There is no existing data. Start from zero. This will set the length. */
+	if ( BaseTable::data == 0 ) {
+		upResizeFromEmpty( len );
+		return pos;
+	}
+
+	/* The shared header sits immediately before the element data. */
+	STabHead *hdr = ((STabHead*)BaseTable::data) - 1;
+
+	/* A negative position is taken as an offset from the current length.
+	 * This only has meaning because there is existing data. */
+	if ( pos < 0 )
+		pos += hdr->tabLen;
+
+	/* The length once the gap has been added. */
+	const long newLen = hdr->tabLen + len;
+
+	if ( hdr->refCount != 1 ) {
+		/* The buffer is shared, so detach from it. This allocates private
+		 * storage and will set the length. */
+		upResizeDup( newLen );
+
+		/* hdr still names the old shared buffer; copy the items before pos. */
+		const T *src = (T*) (hdr + 1);
+		T *dst = BaseTable::data;
+		long i = 0;
+		for ( ; i < pos; i++, dst++, src++ )
+			new(dst) T(*src);
+
+		/* Leave the gap raw and copy the items that follow it. */
+		dst += len;
+		for ( ; i < hdr->tabLen; i++, src++, dst++ )
+			new(dst) T(*src);
+		return pos;
+	}
+
+	/* Sole owner: grow the existing buffer. */
+	upResize( newLen );
+
+	/* Get the header again, (the addr may have changed after resizing). */
+	hdr = ((STabHead*)BaseTable::data) - 1;
+
+	/* Slide the items at and after pos up by len to open the gap. They are
+	 * moved as raw bytes; no constructors or destructors run. */
+	if ( len > 0 && pos < hdr->tabLen ) {
+		memmove( BaseTable::data + pos + len, BaseTable::data + pos,
+				sizeof(T)*(hdr->tabLen - pos) );
+	}
+
+	/* Grow the length by the len inserted. */
+	hdr->tabLen += len;
+
+	return pos;
+}
+
+
+/**
+ * \brief Insert len elements at position pos.
+ *
+ * Elements in the vector from pos onward are shifted len spaces to the right
+ * and the elements of val are copy constructed into the gap. If pos is
+ * greater than the length of the vector then undefined behaviour results. If
+ * pos is negative then it is treated as an offset relative to the length of
+ * the vector.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		insert(long pos, const T *val, long len)
+{
+	/* Open a raw gap of len slots and pick up the resolved position. */
+	pos = insertCommon( pos, len );
+
+	/* Copy construct the incoming values into the gap. The data pointer is
+	 * read only now since insertCommon may have moved it. */
+	T *const gap = BaseTable::data + pos;
+	for ( long i = 0; i < len; i++ )
+		new(gap + i) T(val[i]);
+}
+
+/**
+ * \brief Insert len copies of item at position pos.
+ *
+ * Elements in the vector from pos onward are shifted len spaces to the right
+ * and each slot of the gap is copy constructed from item. If pos is greater
+ * than the length of the vector then undefined behaviour results. If pos is
+ * negative then it is treated as an offset relative to the length of the
+ * vector.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		insertDup(long pos, const T &item, long len)
+{
+	/* Open a raw gap of len slots and pick up the resolved position. */
+	pos = insertCommon( pos, len );
+
+	/* Fill every slot of the gap with its own copy of item. */
+	T *slot = BaseTable::data + pos;
+	for ( long left = len; left > 0; left--, slot++ )
+		new(slot) T(item);
+}
+
+
+/**
+ * \brief Insert len new elements using the default constructor.
+ *
+ * Elements in the vector from pos onward are shifted len spaces to the right
+ * and the gap is filled with default constructed elements. If pos is off the
+ * end of the vector then undefined behaviour results. If pos is negative then
+ * it is treated as an offset relative to the length of the vector.
+ */
+template <class T, class Resize> void SVector<T, Resize>::
+		insertNew(long pos, long len)
+{
+	/* Open a raw gap of len slots and pick up the resolved position. */
+	pos = insertCommon( pos, len );
+
+	/* Default construct an element in each slot of the gap. */
+	T *slot = BaseTable::data + pos;
+	for ( long made = 0; made < len; made++ )
+		new(slot++) T();
+}
+
+/* Makes raw space for len items at pos without initializing the new slots in
+ * any way. If pos is greater than the length of the vector then undefined
+ * behaviour results. Updates the length of the vector. */
+template <class T, class Resize> void SVector<T, Resize>::
+		makeRawSpaceFor(long pos, long len)
+{
+	/* There is no existing data. Start from zero. This will set the length. */
+	if ( BaseTable::data == 0 ) {
+		upResizeFromEmpty( len );
+		return;
+	}
+
+	/* The shared header sits immediately before the element data. */
+	STabHead *hdr = ((STabHead*)BaseTable::data) - 1;
+
+	/* The length once the raw space has been added. */
+	const long grownLen = hdr->tabLen + len;
+
+	if ( hdr->refCount == 1 ) {
+		/* Sole owner: grow the existing buffer. */
+		upResize( grownLen );
+
+		/* Get the header again, (the addr may have changed after resizing). */
+		hdr = ((STabHead*)BaseTable::data) - 1;
+
+		/* Slide the items at and after pos up by len. They are moved as raw
+		 * bytes; no constructors or destructors run. */
+		if ( len > 0 && pos < hdr->tabLen ) {
+			T *const from = BaseTable::data + pos;
+			memmove( from + len, from, sizeof(T)*(hdr->tabLen - pos) );
+		}
+
+		/* Grow the length by the len inserted. */
+		hdr->tabLen += len;
+	}
+	else {
+		/* Shared buffer: detach onto private storage. This sets the length. */
+		upResizeDup( grownLen );
+
+		/* hdr still names the old shared buffer; copy the leading items. */
+		const T *src = (T*) (hdr + 1);
+		T *dst = BaseTable::data;
+		long i = 0;
+		for ( ; i < pos; i++, dst++, src++ )
+			new(dst) T(*src);
+
+		/* Leave len slots raw, then copy the items that follow. */
+		dst += len;
+		for ( ; i < hdr->tabLen; i++, src++, dst++ )
+			new(dst) T(*src);
+	}
+}
+
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+
+#endif /* _AAPL_SVECTOR_H */
diff --git a/aapl/table.h b/aapl/table.h
new file mode 100644
index 00000000..c1f2b7bd
--- /dev/null
+++ b/aapl/table.h
@@ -0,0 +1,252 @@
+/*
+ *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_TABLE_H
+#define _AAPL_TABLE_H
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class Table
+ * \brief Base class for dynamic arrays.
+ *
+ * Table is used as the common data storage class for vectors. It does not
+ * provide any methods to operate on the data and as such it is not intended
+ * to be used directly. It exists so that algorithms that operate on dynamic
+ * arrays can be written without knowing about the various vector classes that
+ * may exist.
+ */
+
+/*@}*/
+
+/* Table class. Holds the data pointer and both lengths directly. */
+template <class T> class Table
+{
+public:
+	/* Default Constructor. Leaves the table empty. */
+	inline Table();
+
+	/**
+	 * \brief Get the length of the vector.
+	 *
+	 * \returns the number of elements, as recorded in tabLen.
+	 */
+	long length() const
+		{ return tabLen; }
+
+	/**
+	 * \brief Table data.
+	 *
+	 * The pointer to the elements in the vector. Modifying the vector may
+	 * cause this pointer to change.
+	 */
+	T *data;
+
+	/**
+	 * \brief Table length.
+	 *
+	 * The number of items of type T in the table.
+	 */
+	long tabLen;
+
+	/**
+	 * \brief Allocated length.
+	 *
+	 * The number of items for which there is room in the current allocation.
+	 */
+	long allocLen;
+};
+
+/**
+ * \brief Default constructor
+ *
+ * Initialize the table to empty: a null data pointer, zero length and zero
+ * allocated length.
+ */
+template <class T> inline Table<T>::Table()
+	: data(0), tabLen(0), allocLen(0)
+{
+	/* Nothing further to do: the initializers above describe an empty
+	 * table and no storage is allocated here. */
+}
+
+/* Default shared table header class. Sits directly in front of the data. */
+struct STabHead
+{
+	/**
+	 * \brief Table length.
+	 *
+	 * The number of items of type T in the table.
+	 */
+	long tabLen;
+
+	/**
+	 * \brief Allocated length.
+	 *
+	 * The number of items for which there is room in the current allocation.
+	 */
+	long allocLen;
+
+	/**
+	 * \brief Ref Count.
+	 *
+	 * The number of shared vectors currently referencing this data.
+	 */
+	long refCount;
+};
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class STable
+ * \brief Base class for implicitly shared dynamic arrays.
+ *
+ * STable is used as the common data storage class for shared vectors. It does
+ * not provide any methods to operate on the data and as such it is not
+ * intended to be used directly. It exists so that algorithms that operate
+ * on dynamic arrays can be written without knowing about the various shared
+ * vector classes that may exist.
+ */
+
+/*@}*/
+
+/* STable class. Stores only the data pointer; lengths live in the header. */
+template <class T> class STable
+{
+public:
+	/* Default Constructor. Leaves the table empty. */
+	inline STable();
+
+	/**
+	 * \brief Get the length of the shared vector.
+	 *
+	 * \returns the length recorded in the header, or zero if there is no data.
+	 */
+	long length() const
+		{ STabHead *head = header(); return head != 0 ? head->tabLen : 0; }
+	
+	/**
+	 * \brief Get header of the shared vector.
+	 *
+	 * \returns the header, found just before the data, or 0 if there is none.
+	 */
+	STabHead *header() const
+		{ if ( data == 0 ) return 0; return ((STabHead*)data) - 1; }
+
+	/**
+	 * \brief Table data.
+	 *
+	 * The pointer to the elements in the vector. The shared table header is
+	 * located just behind the data. Modifying the vector may cause this
+	 * pointer to change.
+	 */
+	T *data;
+};
+
+/**
+ * \brief Default constructor
+ *
+ * Initialize the shared table to empty, that is with a null data pointer.
+ */
+template <class T> inline STable<T>::STable()
+	: data(0)
+{
+	/* With a null data pointer there is no header either. */
+}
+
+/* If needed is greater than existing, give twice needed. */
+#define EXPN_UP( existing, needed ) \
+		( (needed) > (existing) ? ((needed)<<1) : (existing) )
+	
+/* If needed is less than 1 quarter existing, give twice needed. */
+#define EXPN_DOWN( existing, needed ) \
+		( (needed) < ((existing)>>2) ? ((needed)<<1) : (existing) )
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class ResizeExpn
+ * \brief Exponential table resizer. 
+ *
+ * ResizeExpn is the default table resizer. When an up resize is needed, space
+ * is doubled. When a down resize is needed, space is halved.  The result is
+ * that when growing the vector in a linear fashion, the number of resizes of
+ * the allocated space behaves logarithmically.
+ *
+ * If only up resizes are done, there will never be more than 2 times the
+ * needed space allocated. If down resizes are done as well, there will never
+ * be more than 4 times the needed space allocated.  ResizeExpn uses this 50%
+ * usage policy on up resizing and 25% usage policy on down resizing to
+ * improve performance when repeatedly inserting and removing a small number
+ * of elements relative to the size of the array.  This scheme guarantees that
+ * repetitive inserting and removing of a small number of elements will never
+ * result in repetitive reallocation.
+ *
+ * The sizes passed to the resizer from the vectors are in units of T.
+ */
+
+/*@}*/
+
+/* Exponential resizer. */
+class ResizeExpn
+{
+protected:
+	/**
+	 * \brief Determine the new table size when up resizing.
+	 *
+	 * If the existing size is insufficient for the space needed then allocate
+	 * twice the space needed. Otherwise use the existing size.
+	 *
+	 * \returns The new table size.
+	 */
+	static inline long upResize( long existing, long needed )
+		{ return EXPN_UP( existing, needed ); }
+
+	/**
+	 * \brief Determine the new table size when down resizing.
+	 *
+	 * If the space needed is less than one quarter of the existing size then
+	 * allocate twice the space needed. Otherwise use the existing size.
+	 *
+	 * \returns The new table size.
+	 */
+	static inline long downResize( long existing, long needed )
+		{ return EXPN_DOWN( existing, needed ); }
+};
+
+#undef EXPN_UP
+#undef EXPN_DOWN
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_TABLE_H */
diff --git a/aapl/vector.h b/aapl/vector.h
new file mode 100644
index 00000000..835607b1
--- /dev/null
+++ b/aapl/vector.h
@@ -0,0 +1,1189 @@
+/*
+ *  Copyright 2002, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Aapl.
+ *
+ *  Aapl is free software; you can redistribute it and/or modify it under the
+ *  terms of the GNU Lesser General Public License as published by the Free
+ *  Software Foundation; either version 2.1 of the License, or (at your option)
+ *  any later version.
+ *
+ *  Aapl is distributed in the hope that it will be useful, but WITHOUT ANY
+ *  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ *  FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License for
+ *  more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with Aapl; if not, write to the Free Software Foundation, Inc., 59
+ *  Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ */
+
+#ifndef _AAPL_VECTOR_H
+#define _AAPL_VECTOR_H
+
+#include <new>
+#include <string.h>
+#include <stdlib.h>
+#include <assert.h>
+#include "table.h"
+
+#ifdef AAPL_NAMESPACE
+namespace Aapl {
+#endif
+
+/**
+ * \addtogroup vector
+ * @{
+ */
+
+/** \class Vector
+ * \brief Dynamic array.
+ *
+ * This is a typical vector implementation. It is a dynamic array that can be
+ * used to contain complex data structures that have constructors and
+ * destructors as well as simple types such as integers and pointers.
+ *
+ * Vector supports inserting, overwriting, and removing single or multiple
+ * elements at once. Constructors and destructors are called wherever
+ * appropriate.  For example, before an element is overwritten, its
+ * destructor is called.
+ *
+ * Vector provides automatic resizing of allocated memory as needed and offers
+ * different allocation schemes for controlling how the automatic allocation
+ * is done.  Two senses of the length of the data are maintained: the
+ * amount of raw memory allocated to the vector and the number of actual
+ * elements in the vector. The various allocation schemes control how the
+ * allocated space is changed in relation to the number of elements in the
+ * vector.
+ *
+ * \include ex_vector.cpp
+ */
+
+/*@}*/
+
+template < class T, class Resize = ResizeExpn > class Vector
+	: public Table<T>, public Resize
+{
+private:
+	typedef Table<T> BaseTable;
+
+public:
+	/**
+	 * \brief Initialize an empty vector with no space allocated.  
+	 *
+	 * If a linear resizer is used, the step defaults to 256 units of T. For a
+	 * runtime vector both up and down allocation schemes default to
+	 * Exponential.
+	 */
+	Vector() { }
+
+	/**
+	 * \brief Create a vector that contains an initial element.
+	 *
+	 * The vector becomes one element in length. The element's copy
+	 * constructor is used to place the value in the vector.
+	 */
+	Vector(const T &val)             { setAs(&val, 1); }
+
+	/**
+	 * \brief Create a vector that contains an array of elements.
+	 *
+	 * The vector becomes len elements in length.  Copy constructors are used
+	 * to place the new elements in the vector. 
+	 */
+	Vector(const T *val, long len)   { setAs(val, len); }
+
+	/* Deep copy. */
+	Vector( const Vector &v );
+
+	/* Free all mem used by the vector. */
+	~Vector() { empty(); }
+
+	/* Delete all items. */
+	void empty();
+
+	/* Abandon the contents of the vector without deleting. */
+	void abandon();
+
+	/* Transfers the elements of another vector into this vector. First empties
+	 * the current vector. */
+	void transfer( Vector &v );
+
+	/* Perform a deep copy of another vector into this vector. */
+	Vector &operator=( const Vector &v );
+
+	/* Stack operations. */
+	void push( const T &t ) { append( t ); }
+	void pop() { remove( BaseTable::tabLen - 1 ); }
+	T &top() { return BaseTable::data[BaseTable::tabLen - 1]; }
+
+	/*@{*/
+	/**
+	 * \brief Insert one element at position pos.
+	 *
+	 * Elements in the vector from pos onward are shifted one space to the
+	 * right. The copy constructor is used to place the element into this
+	 * vector. If pos is greater than the length of the vector then undefined
+	 * behaviour results. If pos is negative then it is treated as an offset
+	 * relative to the length of the vector.
+	 */
+	void insert(long pos, const T &val)    { insert(pos, &val, 1); }
+
+	/* Insert an array of values. */
+	void insert(long pos, const T *val, long len);
+
+	/**
+	 * \brief Insert all the elements from another vector at position pos.
+	 *
+	 * Elements in this vector from pos onward are shifted v.tabLen spaces to
+	 * the right. The element's copy constructor is used to copy the items
+	 * into this vector. The other vector is left unchanged. If pos is off the
+	 * end of the vector, then undefined behaviour results. If pos is negative
+	 * then it is treated as an offset relative to the length of the vector.
+	 * Equivalent to vector.insert(pos, other.data, other.tabLen).
+	 */
+	void insert(long pos, const Vector &v) { insert(pos, v.data, v.tabLen); }
+
+	/* Insert len copies of val into the vector. */
+	void insertDup(long pos, const T &val, long len);
+
+	/**
+	 * \brief Insert one new element using the default constructor.
+	 *
+	 * Elements in the vector from pos onward are shifted one space to the
+	 * right.  The default constructor is used to init the new element. If pos
+	 * is greater than the length of the vector then undefined behaviour
+	 * results. If pos is negative then it is treated as an offset relative to
+	 * the length of the vector.
+	 */
+	void insertNew(long pos)               { insertNew(pos, 1); }
+
+	/* Insert len new items using default constructor. */
+	void insertNew(long pos, long len);
+	/*@}*/
+
+	/*@{*/
+	/**
+	 * \brief Remove one element at position pos.
+	 *
+	 * The element's destructor is called. Elements to the right of pos are
+	 * shifted one space to the left to take up the free space. If pos is greater
+	 * than or equal to the length of the vector then undefined behavior results.
+	 * If pos is negative then it is treated as an offset relative to the length
+	 * of the vector.
+	 */
+	void remove(long pos)                 { remove(pos, 1); }
+
+	/* Delete a number of elements. */
+	void remove(long pos, long len);
+	/*@}*/
+
+	/*@{*/
+	/**
+	 * \brief Replace one element at position pos.
+	 *
+	 * If there is an existing element at position pos (if pos is less than
+	 * the length of the vector) then its destructor is called before the
+	 * space is used. The copy constructor is used to place the element into
+	 * the vector.  If pos is greater than the length of the vector then
+	 * undefined behaviour results.  If pos is negative then it is treated as
+	 * an offset relative to the length of the vector.
+	 */
+	void replace(long pos, const T &val)    { replace(pos, &val, 1); }
+
+	/* Replace with an array of values. */
+	void replace(long pos, const T *val, long len);
+
+	/**
+	 * \brief Replace at position pos with all the elements of another vector.
+	 *
+	 * Replace at position pos with all the elements of another vector. The
+	 * other vector is left unchanged. If there are existing elements at the
+	 * positions to be replaced, then destructors are called before the space
+	 * is used. Copy constructors are used to place the elements into this
+	 * vector. It is allowable for the pos and length of the other vector to
+	 * specify a replacement that overwrites existing elements and creates new
+	 * ones.  If pos is greater than the length of the vector then undefined
+	 * behaviour results.  If pos is negative, then it is treated as an offset
+	 * relative to the length of the vector.
+	 */
+	void replace(long pos, const Vector &v) { replace(pos, v.data, v.tabLen); }
+
+	/* Replace len items with len copies of val. */
+	void replaceDup(long pos, const T &val, long len);
+
+	/**
+	 * \brief Replace at position pos with one new element.
+	 *
+	 * If there is an existing element at the position to be replaced (pos is
+	 * less than the length of the vector) then the element's destructor is
+	 * called before the space is used. The default constructor is used to
+	 * initialize the new element. If pos is greater than the length of the
+	 * vector then undefined behaviour results. If pos is negative, then it is
+	 * treated as an offset relative to the length of the vector.
+	 */
+	void replaceNew(long pos)               { replaceNew(pos, 1); }
+
+	/* Replace len items at pos with newly constructed objects. */
+	void replaceNew(long pos, long len);
+	/*@}*/
+
+	/*@{*/
+	/**
+	 * \brief Set the contents of the vector to be val exactly.
+	 *
+	 * The vector becomes one element in length. Destructors are called on any
+	 * existing elements in the vector. The element's copy constructor is used
+	 * to place val in the vector.
+	 */
+	void setAs(const T &val)             { setAs(&val, 1); }
+
+	/* Set to copies of the len elements of the array val. */
+	void setAs(const T *val, long len);
+
+	/**
+	 * \brief Set the vector to exactly the contents of another vector.
+	 *
+	 * The vector becomes v.tabLen elements in length. Destructors are called
+	 * on any existing elements. Copy constructors are used to place the new
+	 * elements in the vector.
+	 */
+	void setAs(const Vector &v)          { setAs(v.data, v.tabLen); }
+
+	/* Set to len copies of item. */
+	void setAsDup(const T &item, long len);
+
+	/**
+	 * \brief Set the vector to exactly one new item.
+	 *
+	 * The vector becomes one element in length. Destructors are called on any
+	 * existing elements in the vector. The default constructor is used to
+	 * init the new item.
+	 */
+	void setAsNew()                      { setAsNew(1); }
+
+	/* Set to len elements created with the default constructor. */
+	void setAsNew(long len);
+	/*@}*/
+
+	/*@{*/
+	/**
+	 * \brief Append one element to the end of the vector.
+	 *
+	 * Copy constructor is used to place the element in the vector.
+	 */
+	void append(const T &val)                { replace(BaseTable::tabLen, &val, 1); }
+
+	/**
+	 * \brief Append len elements to the end of the vector.
+	 *
+	 * Copy constructors are used to place the elements in the vector.
+	 */
+	void append(const T *val, long len)       { replace(BaseTable::tabLen, val, len); }
+
+	/**
+	 * \brief Append the contents of another vector.
+	 *
+	 * The other vector is left unchanged. Copy constructors are used to place the
+	 * elements in the vector.
+	 */
+	void append(const Vector &v)             { replace(BaseTable::tabLen, v.data, v.tabLen); }
+
+	/**
+	 * \brief Append len copies of item.
+	 *
+	 * The copy constructor is used to place the item in the vector.
+	 */
+	void appendDup(const T &item, long len)   { replaceDup(BaseTable::tabLen, item, len); }
+
+	/**
+	 * \brief Append a single newly created item.
+	 *
+	 * The new element is initialized with the default constructor.
+	 */
+	void appendNew()                         { replaceNew(BaseTable::tabLen, 1); }
+
+	/**
+	 * \brief Append len newly created items.
+	 *
+	 * The new elements are initialized with the default constructor.
+	 */
+	void appendNew(long len)                  { replaceNew(BaseTable::tabLen, len); }
+	/*@}*/
+	
+	/*@{*/
+	/**
+	 * \brief Prepend one element to the front of the vector.
+	 *
+	 * Copy constructor is used to place the element in the vector.
+	 */
+	void prepend(const T &val)               { insert(0, &val, 1); }
+
+	/**
+	 * \brief Prepend len elements to the front of the vector.
+	 *
+	 * Copy constructors are used to place the elements in the vector.
+	 */
+	void prepend(const T *val, long len)      { insert(0, val, len); }
+
+	/**
+	 * \brief Prepend the contents of another vector.
+	 *
+	 * The other vector is left unchanged. Copy constructors are used to place the
+	 * elements in the vector.
+	 */
+	void prepend(const Vector &v)            { insert(0, v.data, v.tabLen); }
+
+	/**
+	 * \brief Prepend len copies of item.
+	 *
+	 * The copy constructor is used to place the item in the vector.
+	 */
+	void prependDup(const T &item, long len)  { insertDup(0, item, len); }
+
+	/**
+	 * \brief Prepend a single newly created item.
+	 *
+	 * The new element is initialized with the default constructor.
+	 */
+	void prependNew()                        { insertNew(0, 1); }
+
+	/**
+	 * \brief Prepend len newly created items.
+	 *
+	 * The new elements are initialized with the default constructor.
+	 */
+	void prependNew(long len)                 { insertNew(0, len); }
+	/*@}*/
+
+	/* Convenience access: unchecked element reference and element count. */
+	T &operator[](int i) const { return BaseTable::data[i]; }
+	long size() const           { return BaseTable::tabLen; }
+
+	/* Forward declare Iter so IterNext and IterPrev can hold a reference. */
+	struct Iter;
+
+	/* Tag types that wrap the vector or iterator an Iter is set from. */
+	struct IterFirst { IterFirst( const Vector &v ) : v(v) { } const Vector &v; };
+	struct IterLast { IterLast( const Vector &v ) : v(v) { } const Vector &v; };
+	struct IterNext { IterNext( const Iter &i ) : i(i) { } const Iter &i; };
+	struct IterPrev { IterPrev( const Iter &i ) : i(i) { } const Iter &i; };
+
+	/**
+	 * \brief Vector Iterator.
+	 * \ingroup iterators
+	 */
+	struct Iter
+	{
+		/* Default construct with all three pointers null. */
+		Iter() : ptr(0), ptrBeg(0), ptrEnd(0) { }
+
+		/* Construct from a vector, a first/last tag or a next/prev tag. */
+		Iter( const Vector &v );
+		Iter( const IterFirst &vf );
+		Iter( const IterLast &vl );
+		inline Iter( const IterNext &vn );
+		inline Iter( const IterPrev &vp );
+
+		/* Assign from a vector, a first/last tag or a next/prev tag. */
+		Iter &operator=( const Vector &v );
+		Iter &operator=( const IterFirst &vf );
+		Iter &operator=( const IterLast &vl );
+		inline Iter &operator=( const IterNext &vf );
+		inline Iter &operator=( const IterPrev &vl );
+
+		/** \brief Less than end? */
+		bool lte() const { return ptr != ptrEnd; }
+
+		/** \brief At end? */
+		bool end() const { return ptr == ptrEnd; }
+
+		/** \brief Greater than beginning? */
+		bool gtb() const { return ptr != ptrBeg; }
+
+		/** \brief At beginning? */
+		bool beg() const { return ptr == ptrBeg; }
+
+		/** \brief At first element? */
+		bool first() const { return ptr == ptrBeg+1; }
+
+		/** \brief At last element? */
+		bool last() const { return ptr == ptrEnd-1; }
+
+		/* Zero-based position of ptr; operator[] indexes relative to ptr. */
+		long pos() const { return ptr - ptrBeg - 1; }
+		T &operator[](int i) const { return ptr[i]; }
+
+		/** \brief Implicit cast to T*. */
+		operator T*() const   { return ptr; }
+
+		/** \brief Dereference operator returns T&. */
+		T &operator *() const { return *ptr; }
+
+		/** \brief Arrow operator returns T*. */
+		T *operator->() const { return ptr; }
+
+		/** \brief Move to next item. Returns the new pointer. */
+		T *operator++()       { return ++ptr; }
+
+		/** \brief Move to next item. Returns the pointer from before the move. */
+		T *operator++(int)    { return ptr++; }
+
+		/** \brief Move to next item. Returns the new pointer. */
+		T *increment()        { return ++ptr; }
+
+		/** \brief Move n items forward. */
+		T *operator+=(long n)       { return ptr+=n; }
+
+		/** \brief Move to previous item. Returns the new pointer. */
+		T *operator--()       { return --ptr; }
+
+		/** \brief Move to previous item. Returns the pointer from before the move. */
+		T *operator--(int)    { return ptr--; }
+
+		/** \brief Move to previous item. Returns the new pointer. */
+		T *decrement()        { return --ptr; }
+		
+		/** \brief Move n items back. */
+		T *operator-=(long n)       { return ptr-=n; }
+
+		/** \brief Return the next item. Does not modify this. */
+		inline IterNext next() const { return IterNext(*this); }
+
+		/** \brief Return the previous item. Does not modify this. */
+		inline IterPrev prev() const { return IterPrev(*this); }
+
+		/** \brief The iterator is simply a pointer. */
+		T *ptr;
+
+		/* One before the first element and one past the last, for end tests. */
+		T *ptrBeg, *ptrEnd;
+	};
+
+	/** \brief Return a tag that sets an Iter to the first element. */
+	IterFirst first() { return IterFirst( *this ); }
+
+	/** \brief Return a tag that sets an Iter to the last element. */
+	IterLast last() { return IterLast( *this ); }
+
+protected:
+ 	void makeRawSpaceFor(long pos, long len); /* Open an uninitialized gap. */
+
+	void upResize(long len);   /* Resize the allocation up via Resize::upResize. */
+	void downResize(long len); /* Resize it down via Resize::downResize. */
+};
+
+/* Start an iterator on the first element of v; all null when v is empty. */
+template <class T, class Resize> Vector<T, Resize>::Iter::Iter( const Vector &v )
+{
+	if ( v.tabLen != 0 ) {
+		ptrBeg = v.data - 1;
+		ptrEnd = v.data + v.tabLen;
+		ptr = v.data;
+	}
+	else
+		ptr = ptrBeg = ptrEnd = 0;
+}
+
+/* Start an iterator on the first element of the vector wrapped by vf. */
+template <class T, class Resize> Vector<T, Resize>::Iter::Iter( const IterFirst &vf )
+{
+	const Vector &src = vf.v;
+	if ( src.tabLen != 0 ) {
+		ptrBeg = src.data - 1;
+		ptrEnd = src.data + src.tabLen;
+		ptr = src.data;
+	}
+	else
+		ptr = ptrBeg = ptrEnd = 0;
+}
+
+/* Start an iterator on the last element of the vector wrapped by vl. */
+template <class T, class Resize> Vector<T, Resize>::Iter::Iter( const IterLast &vl )
+{
+	const Vector &src = vl.v;
+	if ( src.tabLen != 0 ) {
+		ptrBeg = src.data - 1;
+		ptrEnd = src.data + src.tabLen;
+		ptr = ptrEnd - 1;
+	}
+	else
+		ptr = ptrBeg = ptrEnd = 0;
+}
+
+/* Start an iterator one element past the iterator wrapped by vn. */
+template <class T, class Resize> Vector<T, Resize>::Iter::Iter(
+		const IterNext &vn )
+{
+	const Iter &from = vn.i;
+	ptr = from.ptr + 1;
+	ptrBeg = from.ptrBeg;
+	ptrEnd = from.ptrEnd;
+}
+
+/* Start an iterator one element before the iterator wrapped by vp. */
+template <class T, class Resize> Vector<T, Resize>::Iter::Iter(
+		const IterPrev &vp )
+{
+	const Iter &from = vp.i;
+	ptr = from.ptr - 1;
+	ptrBeg = from.ptrBeg;
+	ptrEnd = from.ptrEnd;
+}
+
+/* Reposition on the first element of v; all null when v is empty. */
+template <class T, class Resize> typename Vector<T, Resize>::Iter &
+		Vector<T, Resize>::Iter::operator=( const Vector &v )
+{
+	if ( v.tabLen != 0 ) {
+		ptrBeg = v.data - 1;
+		ptrEnd = v.data + v.tabLen;
+		ptr = v.data;
+	}
+	else
+		ptr = ptrBeg = ptrEnd = 0;
+	return *this;
+}
+
+/* Reposition on the first element of the vector wrapped by vf, or null all
+ * three pointers when that vector is empty. */
+template <class T, class Resize> typename Vector<T, Resize>::Iter &
+		Vector<T, Resize>::Iter::operator=( const IterFirst &vf )
+{
+	ptr = ptrBeg = ptrEnd = 0;
+	if ( vf.v.tabLen != 0 ) {
+		ptr = vf.v.data;
+		ptrBeg = ptr - 1;
+		ptrEnd = ptr + vf.v.tabLen;
+	}
+	return *this;
+}
+
+/* Reposition on the last element of the vector wrapped by vl, or null all
+ * three pointers when that vector is empty. */
+template <class T, class Resize> typename Vector<T, Resize>::Iter &
+		Vector<T, Resize>::Iter::operator=( const IterLast &vl )
+{
+	ptr = ptrBeg = ptrEnd = 0;
+	if ( vl.v.tabLen != 0 ) {
+		ptrBeg = vl.v.data - 1;
+		ptrEnd = vl.v.data + vl.v.tabLen;
+		ptr = ptrEnd - 1;
+	}
+	return *this;
+}
+
+/* Reposition one element past the iterator wrapped by vn. */
+template <class T, class Resize> typename Vector<T, Resize>::Iter &
+		Vector<T, Resize>::Iter::operator=( const IterNext &vn )
+{
+	ptrEnd = vn.i.ptrEnd;
+	ptrBeg = vn.i.ptrBeg;
+	ptr = vn.i.ptr + 1;
+	return *this;
+}
+
+/* Reposition one element before the iterator wrapped by vp. */
+template <class T, class Resize> typename Vector<T, Resize>::Iter &
+		Vector<T, Resize>::Iter::operator=( const IterPrev &vp )
+{
+	ptrEnd = vp.i.ptrEnd;
+	ptrBeg = vp.i.ptrBeg;
+	ptr = vp.i.ptr - 1;
+	return *this;
+}
+
+/**
+ * \brief Forget all elements in the vector.
+ *
+ * The data pointer and both lengths are reset to zero. No destructor is
+ * called and the space is not freed.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		abandon()
+{
+	/* Drop the storage without destructing or freeing anything. */
+	BaseTable::allocLen = BaseTable::tabLen = 0;
+	BaseTable::data = 0;
+}
+
+/**
+ * \brief Transfer the contents of another vector into this vector.
+ *
+ * This vector is emptied first, then takes over the other vector's array by
+ * pointer, without copying any element. The other vector ends up empty.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		transfer( Vector &v )
+{
+	/* Destruct and free whatever this vector holds. */
+	empty();
+	/* Take over the other vector's array and both of its lengths. */
+	BaseTable::allocLen = v.allocLen;
+	BaseTable::tabLen = v.tabLen;
+	BaseTable::data = v.data;
+	/* The array has a new owner, make the other vector forget it. */
+	v.abandon();
+}
+
+/**
+ * \brief Deep copy another vector into this vector.
+ *
+ * Existing contents are destructed and replaced with copies of v's elements.
+ * Self assignment is a no-op, since setAs destructs before it copies.
+ * \returns A reference to this.
+ */
+template<class T, class Resize> Vector<T, Resize> &Vector<T, Resize>::
+		operator=( const Vector &v )
+{
+	if ( this != &v )
+		setAs(v.data, v.tabLen);
+	return *this;
+}
+
+/* Grow the allocation to hold len elements, asking Resize::upResize for the
+ * new allocLen. Reads and writes allocLen. Does not read or write tabLen.
+ * Throws std::bad_alloc when the allocation fails, in which case the vector
+ * is left exactly as it was. */
+template<class T, class Resize> void Vector<T, Resize>::
+		upResize(long len)
+{
+	/* Ask the resizer what the new allocLen will be. */
+	long newLen = Resize::upResize(BaseTable::allocLen, len);
+
+	/* Nothing to do unless the allocation has to grow. */
+	if ( newLen <= BaseTable::allocLen )
+		return;
+
+	/* With a null pointer realloc behaves like malloc, so one call covers
+	 * both the first allocation and a later growth. The result goes into a
+	 * temporary so that a failure leaves data and allocLen untouched and
+	 * the old block still owned by the vector. */
+	T *newData = (T*) realloc( BaseTable::data, sizeof(T) * newLen );
+	if ( newData == 0 )
+		throw std::bad_alloc();
+
+	BaseTable::data = newData;
+	BaseTable::allocLen = newLen;
+}
+
+/* Shrink the allocation for len elements, asking Resize::downResize for the
+ * new allocLen. Reads and writes allocLen. Does not read or write tabLen. */
+template<class T, class Resize> void Vector<T, Resize>::
+		downResize(long len)
+{
+	/* Ask the resizer what the new allocLen will be. */
+	long newLen = Resize::downResize( BaseTable::allocLen, len );
+	if ( newLen >= BaseTable::allocLen )
+		return;
+
+	if ( newLen == 0 ) {
+		/* Shrinking to nothing, simply free the data. */
+		free( BaseTable::data );
+		BaseTable::data = 0;
+	}
+	else {
+		/* Use a temporary: a failed realloc must not lose the old block. */
+		T *newData = (T*) realloc( BaseTable::data, sizeof(T) * newLen );
+		if ( newData == 0 )
+			throw std::bad_alloc();
+		BaseTable::data = newData;
+	}
+	BaseTable::allocLen = newLen;
+}
+
+/**
+ * \brief Perform a deep copy of the vector.
+ *
+ * This vector takes on the length and the allocation size of the other
+ * vector. Each element of the other vector is copied into the new storage
+ * with the element's copy constructor.
+ */
+template<class T, class Resize> Vector<T, Resize>::
+		Vector(const Vector<T, Resize> &v)
+{
+	/* Mirror the source's lengths. The data pointer stays null unless
+	 * there is an allocation to reproduce. */
+	BaseTable::tabLen = v.tabLen;
+	BaseTable::allocLen = v.allocLen;
+	BaseTable::data = 0;
+	if ( BaseTable::allocLen <= 0 )
+		return;
+
+	/* Take a block as large as the source's allocation. */
+	BaseTable::data = (T*) malloc( sizeof(T) * BaseTable::allocLen );
+	if ( BaseTable::data == 0 )
+		throw std::bad_alloc();
+
+	/* Copy construct each source element into the matching slot. */
+	T *slot = BaseTable::data;
+	const long count = BaseTable::tabLen;
+	for ( long i = 0; i < count; i++ )
+		new(slot + i) T(v.data[i]);
+}
+
+/** \fn Vector::~Vector()
+ * \brief Free all memory used by the vector. 
+ *
+ * The vector is reset to zero elements. Destructors are called on all
+ * elements in the vector. The space allocated for the vector is freed.
+ */
+
+
+/**
+ * \brief Free all memory used by the vector.
+ *
+ * Destructors are called on all elements in the vector, the allocated space
+ * is freed and the vector is reset to zero elements.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		empty()
+{
+	if ( BaseTable::data == 0 )
+		return;
+
+	/* Destruct every element, front to back. */
+	T *base = BaseTable::data;
+	for ( long i = 0; i < BaseTable::tabLen; i++ )
+		base[i].~T();
+	/* Release the storage and go back to the zero length state. */
+	free( BaseTable::data );
+	BaseTable::data = 0;
+	BaseTable::allocLen = BaseTable::tabLen = 0;
+}
+
+/**
+ * \brief Set the contents of the vector to be len elements exactly.
+ *
+ * Existing elements are destructed, then val[0..len-1] are copy constructed
+ * into the vector. Passing the vector's own array and length is a no-op;
+ * any other overlap between val and the vector's storage is unsupported.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		setAs(const T *val, long len)
+{
+	/* Setting the vector to its own contents must be a no-op: the code below
+	 * would destruct every element before copy constructing from it. */
+	if ( val == BaseTable::data && len == BaseTable::tabLen )
+		return;
+
+	/* Call all destructors. */
+	T *pos = BaseTable::data;
+	for ( long i = 0; i < BaseTable::tabLen; pos++, i++ )
+		pos->~T();
+
+	/* Adjust the allocated length, then set the data length to exactly len. */
+	if ( len < BaseTable::tabLen )
+		downResize( len );
+	else if ( len > BaseTable::tabLen )
+		upResize( len );
+	BaseTable::tabLen = len;
+
+	/* Copy data in. */
+	for ( long i = 0; i < len; i++ )
+		new(BaseTable::data + i) T(val[i]);
+}
+
+/**
+ * \brief Set the vector to len copies of item.
+ *
+ * Destructors are called on any existing elements in the vector, after
+ * which the vector becomes len elements in length. Every element is made
+ * from item with the element's copy constructor.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		setAsDup(const T &item, long len)
+{
+	/* Destruct everything the vector currently holds. */
+	T *old = BaseTable::data;
+	for ( long i = 0; i < BaseTable::tabLen; i++ )
+		old[i].~T();
+
+	/* Resize the allocation for the new length. An unchanged length
+	 * leaves the allocation alone. */
+	if ( len > BaseTable::tabLen )
+		upResize( len );
+	else if ( len < BaseTable::tabLen )
+		downResize( len );
+
+	/* The vector is now exactly len elements long. */
+	BaseTable::tabLen = len;
+
+	/* Copy construct item into every slot. */
+	for ( long i = 0; i < len; i++ )
+		new(BaseTable::data + i) T(item);
+}
+
+/**
+ * \brief Set the vector to exactly len new items.
+ *
+ * Destructors are called on any existing elements in the vector, after
+ * which the vector becomes len elements in length. Every element is
+ * initialized with the default constructor.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		setAsNew(long len)
+{
+	/* Destruct everything the vector currently holds. */
+	T *old = BaseTable::data;
+	for ( long i = 0; i < BaseTable::tabLen; i++ )
+		old[i].~T();
+
+	/* Resize the allocation for the new length. An unchanged length
+	 * leaves the allocation alone. */
+	if ( len > BaseTable::tabLen )
+		upResize( len );
+	else if ( len < BaseTable::tabLen )
+		downResize( len );
+
+	/* The vector is now exactly len elements long. */
+	BaseTable::tabLen = len;
+
+	/* Default construct an element in every slot. */
+	for ( long i = 0; i < len; i++ )
+		new(BaseTable::data + i) T();
+}
+
+
+/**
+ * \brief Replace len elements at position pos.
+ *
+ * If there are existing elements at the positions to be replaced, then
+ * destructors are called before the space is used. Copy constructors are used
+ * to place the elements into the vector. It is allowable for the pos and
+ * length to specify a replacement that overwrites existing elements and
+ * creates new ones, in which case the vector grows to end at pos + len.
+ *
+ * If pos is greater than the length of the vector then undefined behaviour
+ * results. If pos is negative, then it is treated as an offset relative to
+ * the length of the vector.
+ *
+ * The array val is read only after the overwritten elements have been
+ * destructed and after any reallocation, so it should not point into this
+ * vector's own storage.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		replace(long pos, const T *val, long len)
+{
+	/* A negative position counts back from the end of the vector. */
+	if ( pos < 0 )
+		pos += BaseTable::tabLen;
+
+	/* One past the last slot that will be written. */
+	const long endPos = pos + len;
+
+	/* When the write runs off the end of the vector the allocation has to
+	 * grow first. That may move the data, so it is done before any element
+	 * is addressed. */
+	const bool extends = endPos > BaseTable::tabLen;
+	if ( extends )
+		upResize( endPos );
+
+	/* Destruct the existing elements that are about to be overwritten.
+	 * They run from pos to the end of the write or the end of the vector,
+	 * whichever comes first. */
+	const long liveEnd = extends ? BaseTable::tabLen : endPos;
+	for ( long i = pos; i < liveEnd; i++ )
+		BaseTable::data[i].~T();
+
+	/* We are extending the vector, set the new data length. */
+	if ( extends )
+		BaseTable::tabLen = endPos;
+
+	/* Copy construct the new values into place. */
+	T *dst = BaseTable::data + pos;
+	const T *src = val;
+	for ( long i = 0; i < len; i++ )
+		new(dst + i) T(src[i]);
+}
+
+/**
+ * \brief Replace at position pos with len copies of an item.
+ *
+ * If there are existing elements at the positions to be replaced, then
+ * destructors are called before the space is used. The copy constructor is
+ * used to place the element into this vector. It is allowable for the pos
+ * and length to specify a replacement that overwrites existing elements and
+ * creates new ones, in which case the vector grows to end at pos + len.
+ *
+ * If pos is greater than the length of the vector then undefined behaviour
+ * results. If pos is negative, then it is treated as an offset relative to
+ * the length of the vector.
+ *
+ * The item val is read only after the overwritten elements have been
+ * destructed and after any reallocation, so it should not refer to an
+ * element of this vector.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		replaceDup(long pos, const T &val, long len)
+{
+	/* A negative position counts back from the end of the vector. */
+	if ( pos < 0 )
+		pos += BaseTable::tabLen;
+
+	/* One past the last slot that will be written. */
+	const long endPos = pos + len;
+
+	/* When the write runs off the end of the vector the allocation has to
+	 * grow first. That may move the data, so it is done before any element
+	 * is addressed. */
+	const bool extends = endPos > BaseTable::tabLen;
+	if ( extends )
+		upResize( endPos );
+
+	/* Destruct the existing elements that are about to be overwritten.
+	 * They run from pos to the end of the write or the end of the vector,
+	 * whichever comes first. */
+	const long liveEnd = extends ? BaseTable::tabLen : endPos;
+	for ( long i = pos; i < liveEnd; i++ )
+		BaseTable::data[i].~T();
+
+	/* We are extending the vector, set the new data length. */
+	if ( extends )
+		BaseTable::tabLen = endPos;
+
+	/* Copy construct val into every slot of the range. */
+	T *dst = BaseTable::data + pos;
+	for ( long i = 0; i < len; i++ )
+		new(dst + i) T(val);
+}
+
+/**
+ * \brief Replace at position pos with len new elements.
+ *
+ * If there are existing elements at the positions to be replaced, then
+ * destructors are called before the space is used. The default constructor
+ * is used to initialize the new elements. It is allowable for the pos and
+ * length to specify a replacement that overwrites existing elements and
+ * creates new ones.
+ *
+ * If pos is greater than the length of the vector then undefined behaviour
+ * results. If pos is negative, then it is treated as an offset relative to
+ * the length of the vector.
+ *
+ * When the range runs past the current end of the vector, the allocation is
+ * grown through upResize and the length of the vector becomes pos + len.
+ * Otherwise neither the allocation nor the length changes.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		replaceNew(long pos, long len)
+{
+	/* A negative position counts back from the end of the vector. */
+	if ( pos < 0 )
+		pos += BaseTable::tabLen;
+
+	/* One past the last slot that will be written. */
+	const long endPos = pos + len;
+
+	/* When the write runs off the end of the vector the allocation has to
+	 * grow first. That may move the data, so it is done before any element
+	 * is addressed. */
+	const bool extends = endPos > BaseTable::tabLen;
+	if ( extends )
+		upResize( endPos );
+
+	/* Destruct the existing elements that are about to be overwritten.
+	 * They run from pos to the end of the write or the end of the vector,
+	 * whichever comes first. */
+	const long liveEnd = extends ? BaseTable::tabLen : endPos;
+	for ( long i = pos; i < liveEnd; i++ )
+		BaseTable::data[i].~T();
+
+	/* We are extending the vector, set the new data length. */
+	if ( extends )
+		BaseTable::tabLen = endPos;
+
+	/* Default construct an element in every slot of the range. */
+	T *dst = BaseTable::data + pos;
+	for ( long i = 0; i < len; i++ )
+		new(dst + i) T();
+}
+
+/**
+ * \brief Remove len elements at position pos.
+ *
+ * Destructors are called on all elements removed. Elements to the right of
+ * the removed range are shifted len spaces to the left to take up the free
+ * space, after which the resizer gets the chance to shrink the allocation.
+ *
+ * If pos is greater than or equal to the length of the vector then
+ * undefined behavior results. If pos is negative then it is treated as an
+ * offset relative to the length of the vector.
+ *
+ * The shifted elements are moved with memmove, so no constructor or
+ * destructor runs on them. Nothing checks that pos + len stays within the
+ * vector.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		remove(long pos, long len)
+{
+	/* A negative position counts back from the end of the vector. */
+	if ( pos < 0 )
+		pos += BaseTable::tabLen;
+
+	/* Lengths before and after the removal. */
+	const long oldLen = BaseTable::tabLen;
+	const long newLen = oldLen - len;
+
+	/* Destruct the elements being removed. */
+	T *gap = BaseTable::data + pos;
+	for ( long i = 0; i < len; i++ )
+		gap[i].~T();
+
+	/* Close the gap by sliding the tail of the vector down over it. The
+	 * surviving elements are relocated bitwise. Nothing to slide when the
+	 * removal reaches the end of the vector. */
+	const long tail = oldLen - ( pos + len );
+	if ( len > 0 && tail > 0 )
+		memmove( gap, gap + len, sizeof(T) * tail );
+
+	/* Let the resizer shrink the allocation now that fewer elements
+	 * need to fit. */
+	downResize( newLen );
+
+	/* Set the new data length. */
+	BaseTable::tabLen = newLen;
+}
+
+/**
+ * \brief Insert len elements at position pos.
+ *
+ * The elements from pos onward move len places to the right and the gap is
+ * filled with copy constructed copies of val[0..len-1]. A negative pos is
+ * taken as an offset from the length of the vector. If pos is greater than
+ * the length of the vector then undefined behaviour results. Existing
+ * elements are moved bitwise, without running constructors.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		insert(long pos, const T *val, long len)
+{
+	/* A negative position counts back from the end of the vector. */
+	if ( pos < 0 )
+		pos += BaseTable::tabLen;
+
+	/* Lengths before and after the insertion. */
+	const long oldLen = BaseTable::tabLen;
+	const long newLen = oldLen + len;
+
+	/* Grow the allocation first, this may move the data. */
+	upResize( newLen );
+
+	/* Open a gap of len slots at pos by sliding the tail up. The elements
+	 * are relocated bitwise, no constructor runs. */
+	T *dst = BaseTable::data + pos;
+	const long tail = oldLen - pos;
+	if ( len > 0 && tail > 0 )
+		memmove( dst + len, dst, sizeof(T) * tail );
+
+	/* Copy construct the new elements into the gap. */
+	const T *src = val;
+	for ( long i = 0; i < len; i++ )
+		new(dst + i) T(src[i]);
+
+	/* Set the new length. */
+	BaseTable::tabLen = newLen;
+}
+
+/**
+ * \brief Insert len copies of item at position pos.
+ *
+ * The elements from pos onward move len places to the right and the gap is
+ * filled with copies of item made by the copy constructor. A negative pos
+ * is taken as an offset from the length of the vector. If pos is greater
+ * than the length of the vector then undefined behaviour results. Existing
+ * elements are moved bitwise, without running constructors.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		insertDup(long pos, const T &item, long len)
+{
+	/* A negative position counts back from the end of the vector. */
+	if ( pos < 0 )
+		pos += BaseTable::tabLen;
+
+	/* Lengths before and after the insertion. */
+	const long oldLen = BaseTable::tabLen;
+	const long newLen = oldLen + len;
+
+	/* Grow the allocation first, this may move the data. */
+	upResize( newLen );
+
+	/* Open a gap of len slots at pos by sliding the tail up. The elements
+	 * are relocated bitwise, no constructor runs. */
+	T *dst = BaseTable::data + pos;
+	const long tail = oldLen - pos;
+	if ( len > 0 && tail > 0 )
+		memmove( dst + len, dst, sizeof(T) * tail );
+
+	/* Copy construct item into every slot of the gap. */
+	for ( long i = 0; i < len; i++ )
+		new(dst + i) T(item);
+
+	/* Set the new length. */
+	BaseTable::tabLen = newLen;
+}
+
+/**
+ * \brief Insert len new elements using the default constructor.
+ *
+ * The elements from pos onward move len places to the right and the gap is
+ * filled with default constructed elements. A negative pos is taken as an
+ * offset from the length of the vector. If pos is off the end of the vector
+ * then undefined behaviour results.
+ */
+template<class T, class Resize> void Vector<T, Resize>::
+		insertNew(long pos, long len)
+{
+	/* A negative position counts back from the end of the vector. */
+	if ( pos < 0 )
+		pos += BaseTable::tabLen;
+
+	/* Lengths before and after the insertion. */
+	const long oldLen = BaseTable::tabLen;
+	const long newLen = oldLen + len;
+
+	/* Grow the allocation first, this may move the data. */
+	upResize( newLen );
+
+	/* Open a gap of len slots at pos by sliding the tail up. The elements
+	 * are relocated bitwise, no constructor runs. */
+	T *dst = BaseTable::data + pos;
+	const long tail = oldLen - pos;
+	if ( len > 0 && tail > 0 )
+		memmove( dst + len, dst, sizeof(T) * tail );
+
+	/* Default construct an element in every slot of the gap. */
+	for ( long i = 0; i < len; i++ )
+		new(dst + i) T();
+
+	/* Set the new length. */
+	BaseTable::tabLen = newLen;
+}
+
+/* Opens a gap of len slots at pos and updates the length of the vector. The
+ * slots in the gap are not initialized in any way. If pos is greater than
+ * the length of the vector then undefined behaviour results. */
+template<class T, class Resize> void Vector<T, Resize>::
+		makeRawSpaceFor(long pos, long len)
+{
+	/* Lengths before and after the gap is opened. */
+	const long oldLen = BaseTable::tabLen;
+	const long newLen = oldLen + len;
+
+	/* Grow the allocation first, this may move the data. */
+	upResize( newLen );
+
+	/* Slide everything from pos onward up by len slots, bitwise. */
+	const long tail = oldLen - pos;
+	if ( len > 0 && tail > 0 ) {
+		T *from = BaseTable::data + pos;
+		memmove( from + len, from, sizeof(T) * tail );
+	}
+	BaseTable::tabLen = newLen;
+}
+
+#ifdef AAPL_NAMESPACE
+}
+#endif
+
+#endif /* _AAPL_VECTOR_H */
diff --git a/colm.vim b/colm.vim
new file mode 100644
index 00000000..b32441a5
--- /dev/null
+++ b/colm.vim
@@ -0,0 +1,89 @@
+" Vim syntax file
+"
+" Language: Colm
+" Author: Adrian Thurston
+
+syntax clear
+
+"
+" Regular Language Types
+"
+
+" Identifiers
+syntax match rlId "[a-zA-Z_][a-zA-Z_0-9]*" contained
+
+" Literals
+syntax match rlLiteral "'\(\\.\|[^'\\]\)*'[i]*" contained
+syntax match rlLiteral "\"\(\\.\|[^\"\\]\)*\"[i]*" contained
+syntax match rlLiteral "\[\(\\.\|[^\]\\]\)*\]" contained
+
+" Numbers
+syntax match rlNumber "[0-9][0-9]*" contained
+syntax match rlNumber "0x[0-9a-fA-F][0-9a-fA-F]*" contained
+
+" Operators
+syntax match rlOtherOps ":>" contained
+syntax match rlOtherOps ":>>" contained
+syntax match rlOtherOps "<:" contained
+
+syntax cluster rlTypes contains=rlId,rlLiteral,rlNumber,rlOtherOps
+syntax region rlTypeRegion matchgroup=regionDelimiter start="/" end="/"
+	\ contains=@rlTypes
+
+syntax region cflTypeRegion matchgroup=regionDelimiter start="\[" end="\]"
+	\ contains=cflTypeRegion,patRegion,otLit,typeKeywords
+syntax region patRegion matchgroup=String start="\"" end="\"" end="\n"
+	\ contains=char,cflTypeRegion
+
+syntax match char "[^\"\[]" contained
+syntax match char "\\." contained
+
+syntax match otLit "\~.*$"
+syntax match otLit "'\(\\.\|[^'\\]\)*'[i]*"
+
+"
+" Other stuff
+"
+
+syntax match tlComment "#.*$"
+syntax match tlIdentifier "[a-zA-Z_][a-zA-Z_0-9]*"
+syntax match tlNumber "[0-9][0-9]*"
+syntax match tlNumber "\<nil\>"
+syntax match tlNumber "\<true\>"
+syntax match tlNumber "\<false\>"
+
+syntax keyword Type
+	\ commit include literal iter
+	\ namespace lex reducefirst global
+	\ construct parse parse_stop match require
+	\ preeof
+
+syntax keyword typeKeywords
+	\ int str bool any ref vector map list ptr
+
+syntax keyword Keyword
+	\ reject else elsif return yield for while if
+	\ typeid in break 
+	\ new deref
+
+syntax match tokenName "[a-zA-Z_][a-zA-Z_0-9]*" contained
+
+syntax region defTypes matchgroup=defKeywords
+	\ start="\<rl\>" start="\<def\>" start="\<token\>" start="\<ignore\>"
+	\ matchgroup=Function end="[a-zA-Z_][a-zA-Z0-9_]*" end="/"me=e-1
+
+"
+" Specifying Groups
+"
+hi link tlComment Comment
+hi link tlNumber Number
+hi link otLit String
+hi link rlNumber Number
+hi link rlLiteral String
+hi link defKeywords Type
+hi link typeKeywords Type
+hi link regionDelimiter Type
+hi link char String
+hi link tokenName Function
+ 
+let b:current_syntax = "colm"
diff --git a/colm/Makefile.in b/colm/Makefile.in
new file mode 100644
index 00000000..61b57867
--- /dev/null
+++ b/colm/Makefile.in
@@ -0,0 +1,123 @@
+#
+#   Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Colm.
+#
+#   Colm is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Colm is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Colm; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+INCS += -I../common -I../aapl
+DEFS +=
+
+CFLAGS += -g -Wall -Wwrite-strings
+LDFLAGS +=
+
+# Frequently changed ones first.
+CC_SRCS = \
+	compile.cpp \
+	bytecode.cpp \
+	fsmrun.cpp \
+	pdarun.cpp \
+	input.cpp \
+	lmparse.cpp \
+	lmscan.cpp \
+	parsetree.cpp \
+	parsedata.cpp \
+	fsmstate.cpp \
+	fsmbase.cpp \
+	fsmattach.cpp \
+	fsmmin.cpp \
+	fsmgraph.cpp \
+	pdagraph.cpp \
+	pdabuild.cpp \
+	pdacodegen.cpp \
+	fsmcodegen.cpp \
+	redfsm.cpp \
+	fsmexec.cpp \
+	main.cpp \
+	list.cpp \
+	map.cpp \
+	string.cpp \
+	redbuild.cpp \
+	closure.cpp \
+	fsmap.cpp \
+	dotgen.cpp \
+	tree.cpp
+
+RUNTIME_SRC = fsmrun.cpp pdarun.cpp bytecode.cpp list.cpp \
+	map.cpp string.cpp input.cpp tree.cpp
+GEN_SRC = lmscan.cpp lmparse.h lmparse.cpp 
+
+RUNTIME = runtime.a
+
+LIBS = ../common/common.a
+
+#*************************************
+
+PREFIX = @prefix@
+
+BUILD_PARSERS = @BUILD_PARSERS@
+
+# Programs
+CXX = @CXX@
+
+# Get objects and dependencies from sources.
+OBJS = $(CC_SRCS:%.cpp=%.o)
+DEPS = $(CC_SRCS:%.cpp=.%.d)
+RUNTIME_OBJS = $(RUNTIME_SRC:%.cpp=%.o)
+
+# Rules.
+all: colm $(RUNTIME)
+
+colm: $(GEN_SRC) $(OBJS) $(LIBS)
+	$(CXX) $(LDFLAGS) -o $@ $(OBJS) $(LIBS)
+
+$(RUNTIME): $(RUNTIME_OBJS)
+	ar -cr $@ $(RUNTIME_OBJS)
+
+ifeq ($(BUILD_PARSERS),true)
+
+lmparse.h: lmparse.kh
+	kelbt -o $@ $<
+
+lmparse.cpp: lmparse.kl lmparse.kh
+	kelbt -o $@ $<
+
+lmscan.cpp: lmparse.h
+
+lmscan.cpp: lmscan.rl
+	ragel -G2 -o $@ $<
+
+endif
+
+# Compile one source file. The first (silent) command writes the compiler's
+# -M dependency listing for the source to a hidden .<name>.d file; those are
+# the DEPS files pulled in by the -include at the end of this makefile. The
+# second command produces the object file.
+%.o: %.cpp
+	@$(CXX) -M $(DEFS) $(INCS) $< > .$*.d
+	$(CXX) -c $(CFLAGS) $(DEFS) $(INCS) -o $@ $<
+
+# These targets name actions, not files. Declaring them phony keeps a stray
+# file called "clean" or "install" from silently disabling the rule.
+.PHONY: all clean distclean install
+
+# Remove everything clean removes, plus the configure-generated Makefile.
+distclean: clean
+	rm -f Makefile
+
+# Generated parser sources are only removed when this build can recreate them.
+ifeq ($(BUILD_PARSERS),true)
+EXTRA_CLEAN = $(GEN_SRC)
+endif
+
+clean:
+	rm -f tags .*.d *.o colm $(EXTRA_CLEAN) $(RUNTIME)
+
+# DESTDIR is empty by default, so a plain "make install" behaves as before.
+# Packagers can set it to stage the install under a scratch root.
+install: all
+	install -d $(DESTDIR)$(PREFIX)/bin
+	install -s colm $(DESTDIR)$(PREFIX)/bin/colm
+
+-include $(DEPS)
diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
new file mode 100644
index 00000000..30a76deb
--- /dev/null
+++ b/colm/bytecode.cpp
@@ -0,0 +1,4092 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "bytecode.h"
+#include "astring.h"
+#include "pdarun.h"
+#include "dlistval.h"
+#include "fsmrun.h"
+#include "pdarun.h"
+#include <iostream>
+#include <sstream>
+#include <alloca.h>
+#include <sys/mman.h>
+
+using std::cout;
+using std::cerr;
+using std::endl;
+
+/*
+ * Stack helpers. They expand in place and operate on a variable named 'sp'
+ * that must be in scope where they are used. push() pre-decrements and pop()
+ * post-increments, so the stack grows toward lower addresses and 'sp' always
+ * addresses the top element. popn()/pushn() move 'sp' by n slots without
+ * touching the contents.
+ */
+#define push(i) (*(--sp) = (i))
+#define pop() (*sp++)
+#define top() (*sp)
+#define ptop() (sp)
+#define popn(n) (sp += (n))
+#define pushn(n) (sp -= (n))
+/* Frame helpers: index off a variable named 'frame' (or 'iframe') that must
+ * be in scope where they are used. */
+#define local(o) (frame[o])
+#define plocal(o) (&frame[o])
+#define local_iframe(o) (iframe[o])
+#define plocal_iframe(o) (&iframe[o])
+
+/*
+ * Operand readers. Each consumes bytes through a cursor named 'instr', which
+ * must be in scope, and leaves the cursor just past what was read.
+ */
+
+/* Read a one-byte operand into i. */
+#define read_byte( i ) do { \
+	i = ((uchar) *instr++); \
+} while(0)
+
+/* Read a four-byte operand into i, least significant byte first. */
+#define read_word( i ) do { \
+	i = ((Word) *instr++); \
+	i |= ((Word) *instr++) << 8; \
+	i |= ((Word) *instr++) << 16; \
+	i |= ((Word) *instr++) << 24; \
+} while(0)
+
+/* Read a four-byte operand, least significant byte first, and reinterpret it
+ * as a Tree pointer.
+ * NOTE(review): only 32 bits are assembled, so this presumably assumes a
+ * pointer fits in four bytes -- confirm before building for 64-bit targets. */
+#define read_tree( i ) do { \
+	Word w; \
+	w = ((Word) *instr++); \
+	w |= ((Word) *instr++) << 8; \
+	w |= ((Word) *instr++) << 16; \
+	w |= ((Word) *instr++) << 24; \
+	i = (Tree*) w; \
+} while(0)
+
+/* Read a two-byte operand into i, least significant byte first. */
+#define read_half( i ) do { \
+	i = ((Word) *instr++); \
+	i |= ((Word) *instr++) << 8; \
+} while(0)
+
+static Tree **vm_stack;
+
+/* Build a singly linked chain of 'length' kids taken from the program's kid
+ * pool. Every new kid is linked in front of the chain built so far. Returns
+ * the front of the chain, or 0 when length is not positive. */
+Kid *alloc_attrs( Program *prg, long length )
+{
+	Kid *front = 0;
+	for ( long left = length; left > 0; left-- ) {
+		Kid *fresh = prg->kidPool.allocate();
+		fresh->next = front;
+		front = fresh;
+	}
+	return front;
+}
+
+/* Hand every kid of the chain starting at 'attrs' back to the kid pool. The
+ * trees the kids point at are not touched. */
+void free_attrs( Program *prg, Kid *attrs )
+{
+	for ( Kid *kid = attrs, *after = 0; kid != 0; kid = after ) {
+		/* Grab the link before the kid goes back to the pool. */
+		after = kid->next;
+		prg->kidPool.free( kid );
+	}
+}
+
+/* Store 'val' in the kid found 'pos' links along tree's child list. No
+ * reference counts are adjusted and the list is assumed to be long enough. */
+void set_attr( Tree *tree, long pos, Tree *val )
+{
+	Kid *slot = tree->child;
+	for ( long left = pos; left > 0; left-- )
+		slot = slot->next;
+	slot->tree = val;
+}
+
+/* Fetch the tree held by the kid found 'pos' links along tree's child list.
+ * The list is assumed to be long enough. */
+Tree *get_attr( Tree *tree, long pos )
+{
+	Kid *slot = tree->child;
+	for ( long left = pos; left > 0; left-- )
+		slot = slot->next;
+	return slot->tree;
+}
+
+/* Make a fresh chain of 'length' kids and copy the tree pointers of the first
+ * 'length' kids of 'src' into it, in order. Reference counts are left alone.
+ * 'src' must have at least 'length' kids. */
+Kid *copy_obj_data( Program *prg, long length, Kid *src )
+{
+	Kid *copy = alloc_attrs( prg, length );
+
+	Kid *to = copy;
+	for ( long left = length; left > 0; left-- ) {
+		to->tree = src->tree;
+		to = to->next;
+		src = src->next;
+	}
+	return copy;
+}
+
+/* Join two kid lists by hooking list2 onto the last kid of list1. Returns the
+ * head of the joined list; an empty side simply yields the other one. */
+Kid *kid_list_concat( Kid *list1, Kid *list2 )
+{
+	if ( list1 == 0 )
+		return list2;
+	if ( list2 == 0 )
+		return list1;
+
+	/* Walk to the final kid of the first list. */
+	Kid *tail = list1;
+	for ( ; tail->next != 0; tail = tail->next ) {}
+
+	tail->next = list2;
+	return list1;
+}
+
+/* Type conversions. */
+/* View a generic tree pointer as a List. No checking is done. */
+List *list( Tree *tree )
+{
+	return (List*) tree;
+}
+
+/* View a generic tree pointer as a Map. No checking is done. */
+Map *map( Tree *tree )
+{
+	return (Map*) tree;
+}
+
+/* View a generic tree pointer as a Str. No checking is done. */
+Str *str( Tree *tree )
+{
+	return (Str*) tree;
+}
+
+void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter );
+Tree *split_tree( Program *prg, Tree *t );
+Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
+
+/* Wrap an open FILE in a Stream: the object comes from the map element pool,
+ * gets a file-backed input source and a scanner built from the program's fsm
+ * tables, and the scanner is attached to that input. */
+Stream *open_stream_file( Program *prg, FILE *file )
+{
+	Stream *stream = (Stream*)prg->mapElPool.allocate();
+
+	stream->id = LEL_ID_STREAM;
+	stream->file = file;
+
+	stream->in = new InputStreamFile( file );
+	stream->scanner = new FsmRun( prg->rtd->fsmTables );
+	stream->scanner->attachInputStream( stream->in );
+
+	return stream;
+}
+
+/* Wrap a file descriptor in a Stream: the object comes from the map element
+ * pool, gets a descriptor-backed input source and a scanner built from the
+ * program's fsm tables. The 'file' member is not assigned here. */
+Stream *open_stream_fd( Program *prg, long fd )
+{
+	Stream *stream = (Stream*)prg->mapElPool.allocate();
+
+	stream->id = LEL_ID_STREAM;
+
+	stream->in = new InputStreamFD( fd );
+	stream->scanner = new FsmRun( prg->rtd->fsmTables );
+	stream->scanner->attachInputStream( stream->in );
+
+	return stream;
+}
+
+/* Open the file named by the string tree 'name' for binary reading and wrap
+ * it in a stream. Returns the stream as a Tree, or 0 if the file could not be
+ * opened.
+ *
+ * The stream returned is the one built by open_stream_file, complete with its
+ * input source and scanner. It must not be replaced by a bare tree-pool
+ * object: that would leak the input and scanner, hand back a stream with
+ * neither, and later be released into the wrong pool by stream_free. */
+Tree *open_file( Program *prg, Tree *name )
+{
+	Head *head = ((Str*)name)->value;
+	FILE *file = fopen( string_data(head), "rb" );
+
+	if ( file == 0 )
+		return 0;
+
+	return (Tree*) open_stream_file( prg, file );
+}
+
+/* Debugging aid: walk a tree and report on stderr every node whose reference
+ * count is not exactly one.
+ *
+ * Child lists can carry kids with no tree (copy_real_tree notes that a child
+ * "may be an attribute" and checks for 0), so empty slots are skipped rather
+ * than dereferenced. */
+void check_parse_tree( Tree *tree )
+{
+	if ( tree == 0 )
+		return;
+
+	if ( tree->refs != 1 )
+		cerr << "tree->refs: " << tree->refs << endl;
+
+	for ( Kid *child = tree->child; child != 0; child = child->next )
+		check_parse_tree( child->tree );
+}
+
+/* Queue 'tree' on the parser as an artificial token, optionally flagged as
+ * ignore. A tree that already carries alg data is copied first so that the
+ * queued tree starts with fresh alg data. Nonterminal ids are swapped for
+ * their terminal duplicate id. */
+void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
+{
+	if ( tree->alg != 0 ) {
+		/* Already parsed once: work on a copy. */
+		#ifdef COLM_LOG_BYTECODE
+		cerr << "copying tree in send because alg is set" << endl;
+		#endif
+		Kid *nextDownIgnored = 0;
+		tree = copy_real_tree( prg, tree, 0, nextDownIgnored );
+		tree_upref( tree );
+	}
+
+	assert( tree->alg == 0 );
+	tree->alg = prg->algPool.allocate();
+
+	if ( tree->id >= prg->rtd->firstNonTermId )
+		tree->id = prg->rtd->lelInfo[tree->id].termDupId;
+
+	tree->alg->flags |= AF_ARTIFICIAL;
+	if ( ignore )
+		tree->alg->flags |= AF_IGNORE;
+
+	/* FIXME: Do we need to remove the ignore tokens 
+	 * at this point? Will it cause a leak? */
+
+	/* Append to the tail of the parser's pending queue. */
+	Kid *entry = prg->kidPool.allocate();
+	entry->tree = tree;
+
+	if ( parser->queue != 0 )
+		parser->queueLast->next = entry;
+	else
+		parser->queue = entry;
+	parser->queueLast = entry;
+}
+
+/* Build a token tree from 'nargs' arguments sitting on the stack at 'root'.
+ * The argument just below root + nargs is the token id (an Int), the one
+ * below that is the token text (a Str) and any remaining ones fill the
+ * token's attributes in order. Ignore tokens get no attributes. The new tree
+ * has a reference count of one and holds its own copy of the text. */
+Tree *make_token( Tree **root, Program *prg, PdaRun *parser, long nargs )
+{
+	Tree **base = root + nargs;
+
+	Int *idArg = (Int*)base[-1];
+	Str *textArg = (Str*)base[-2];
+
+	long id = idArg->value;
+	Head *tokdata = string_copy( prg, textArg->value );
+
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+
+	if ( lelInfo[id].ignore ) {
+		Tree *ign = prg->treePool.allocate();
+		ign->refs = 1;
+		ign->id = id;
+		ign->tokdata = tokdata;
+		return ign;
+	}
+
+	long objectLength = lelInfo[id].objectLength;
+	Kid *attrs = alloc_attrs( prg, objectLength );
+
+	Tree *tok = prg->treePool.allocate();
+	tok->id = id;
+	tok->refs = 1;
+	tok->tokdata = tokdata;
+	tok->child = attrs;
+
+	/* Whatever follows the id and the text goes into the attributes. */
+	long nattrs = nargs-2;
+	assert( nattrs <= objectLength );
+	for ( long a = 0; a < nattrs; a++ ) {
+		set_attr( tok, a, base[-3-a] );
+		tree_upref( get_attr( tok, a ) );
+	}
+	return tok;
+}
+
+/* Build a tree from 'nargs' arguments sitting on the stack at 'root'. The
+ * argument just below root + nargs is the language element id (an Int); the
+ * remaining ones become the children, in order, each gaining a reference.
+ * The child list of the result is the element's attribute slots followed by
+ * those children. The new tree has a reference count of one. */
+Tree *make_tree( Tree **root, Program *prg, PdaRun *parser, int nargs )
+{
+	Tree **base = root + nargs;
+
+	long id = ((Int*)base[-1])->value;
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+
+	Tree *made = prg->treePool.allocate();
+	made->id = id;
+	made->refs = 1;
+
+	Kid *attrs = alloc_attrs( prg, lelInfo[id].objectLength );
+
+	/* String the children together through a pointer to the link that the
+	 * next kid has to be stored in. */
+	Kid *children = 0;
+	Kid **link = &children;
+	for ( long c = 0; c < nargs-1; c++ ) {
+		Kid *kid = prg->kidPool.allocate();
+		kid->tree = base[-2-c];
+		tree_upref( kid->tree );
+
+		*link = kid;
+		link = &kid->next;
+	}
+
+	made->child = kid_list_concat( attrs, children );
+	return made;
+}
+
+/* Run the parser selected by 'parserId' over the stream's scanner, commit,
+ * and return the parsed root with one reference added. The reverse code the
+ * parser collected is moved into a newly allocated CodeVect handed back
+ * through 'cv'. */
+Tree *parse( Tree **&sp, Program *prg, Stream *stream, 
+		long parserId, long stopId, CodeVect *&cv )
+{
+	PdaRun parser( sp, prg, prg->rtd->parsers[parserId], 
+			stream->scanner, stopId );
+
+	parser.run();
+	parser.commit();
+
+	bool haveStop = stopId > 0;
+	Tree *result = parser.getParsedRoot( haveStop );
+	tree_upref( result );
+	parser.clean();
+
+	CodeVect *reverse = new CodeVect;
+	reverse->transfer( parser.allReverseCode );
+	cv = reverse;
+
+	return result;
+}
+
+/* Undo an earlier parse of 'tree' by replaying the reverse code 'rev' on a
+ * parser set up for the same tables and scanner. Always returns 0. */
+Tree *undo_parse( Tree **&sp, Program *prg, Stream *stream, 
+		long parserId, Tree *tree, CodeVect *rev )
+{
+	PdaRun undoer( sp, prg, prg->rtd->parsers[parserId], stream->scanner, 0 );
+	undoer.undoParse( tree, rev );
+	return 0;
+}
+
+/* Take 'length' (an Int tree) worth of data from the stream's scanner and
+ * return it as a new Str tree. The reference count of the result is not set
+ * here. */
+Tree *stream_pull( Program *prg, Stream *stream, Tree *length )
+{
+	Head *pulled = stream->scanner->extractToken( ((Int*)length)->value );
+
+	Str *result = (Str*) prg->treePool.allocate();
+	result->id = LEL_ID_STR;
+	result->value = pulled;
+	return (Tree*)result;
+}
+
+/* Reverse a stream_pull: hand the text of the Str tree 'str' back to the
+ * stream's scanner. */
+void undo_pull( Program *prg, Stream *stream, Tree *str )
+{
+	Head *head = ( (Str*)str )->value;
+	const char *text = string_data( head );
+	long textLen = string_length( head );
+	stream->scanner->sendBackText( text, textLen );
+}
+
+/* Print the tree 'any' into a string and push that text onto the stream's
+ * scanner. Returns the number of characters pushed so the push can be undone
+ * later. */
+Word stream_push( Tree **&sp, Program *prg, Stream *stream, Tree *any )
+{
+	std::stringstream printed;
+	print_tree( printed, sp, prg, any );
+
+	/* Take the text out once and use it for both the push and the count. */
+	const std::string text = printed.str();
+	stream->scanner->streamPush( text.c_str(), text.size() );
+	return text.size();
+}
+
+/* Reverse a stream_push of 'len' characters by forwarding the length to the
+ * scanner's own undo. */
+void undo_stream_push( Tree **&sp, Program *prg, Stream *stream, Word len )
+{
+	FsmRun *scanner = stream->scanner;
+	scanner->undoStreamPush( len );
+}
+
+
+/* Write the bytes of a string head to standard output, exactly as stored. */
+void print_str( Head *str )
+{
+	const char *bytes = (char*)(str->data);
+	cout.write( bytes, str->length );
+}
+
+/* Print the ignore tokens attached to 'tree' on standard output. The kids
+ * are pushed on the stack in list order and printed while popping, so they
+ * come out in the opposite order to the list. The stack is back at its
+ * starting height on return. */
+void print_ignore_list( Tree **&sp, Program *prg, Tree *tree )
+{
+	Tree **mark = ptop();
+
+	/* Push every leading ignore kid. */
+	for ( Kid *ign = tree_ignore( prg, tree ); 
+			tree_is_ignore( prg, ign ); ign = ign->next )
+	{
+		push( (SW)ign );
+	}
+
+	/* Unwind back to the mark, printing as we go. */
+	while ( ptop() != mark ) {
+		Kid *ign = (Kid*) pop();
+		print_tree( sp, prg, ign->tree );
+	}
+}
+
+/* Print the text of the tree under 'kid' to 'out'.
+ *
+ * Terminals print their value or token text; nonterminals print their
+ * children in order. Ignore tokens attached to a tree are printed ahead of
+ * it when 'printIgnore' is set; the flag is switched on after every terminal
+ * and off after an ignore list has been printed.
+ *
+ * The recursion is simulated with gotos: parent kids are kept on the VM stack
+ * and the walk is over once the stack is back at the height it had on entry.
+ *
+ * All output, including string values and ignore tokens, goes to 'out'.
+ * Sending those to standard output would leave holes in the text captured by
+ * callers that print into a string stream. */
+void print_kid( ostream &out, Tree **&sp, Program *prg, Kid *kid, bool printIgnore )
+{
+	Tree **root = ptop();
+	Kid *child;
+
+rec_call:
+	/* If not currently skipping ignore data, then print it. Ignore data can
+	 * be associated with terminals and nonterminals. */
+	if ( printIgnore && tree_ignore( prg, kid->tree ) != 0 ) {
+		/* Ignorelists are reversed. Stack the kids up and print them while
+		 * popping back to where the stack was. */
+		Tree **ignoreRoot = ptop();
+		Kid *ignore = tree_ignore( prg, kid->tree );
+		while ( tree_is_ignore( prg, ignore ) ) {
+			push( (SW)ignore );
+			ignore = ignore->next;
+		}
+		while ( ptop() != ignoreRoot ) {
+			ignore = (Kid*) pop();
+			print_tree( out, sp, prg, ignore->tree );
+		}
+		printIgnore = false;
+	}
+
+	if ( kid->tree->id < prg->rtd->firstNonTermId ) {
+		/* Always turn on ignore printing when we get to a token. */
+		printIgnore = true;
+
+		if ( kid->tree->id == LEL_ID_INT )
+			out << ((Int*)kid->tree)->value;
+		else if ( kid->tree->id == LEL_ID_BOOL ) {
+			if ( ((Int*)kid->tree)->value )
+				out << "true";
+			else
+				out << "false";
+		}
+		else if ( kid->tree->id == LEL_ID_PTR )
+			out << '#' << (void*) ((Pointer*)kid->tree)->value;
+		else if ( kid->tree->id == LEL_ID_STR ) {
+			/* Write the string to the requested stream, not to cout. */
+			out.write( string_data( ((Str*)kid->tree)->value ), 
+					string_length( ((Str*)kid->tree)->value ) );
+		}
+		else if ( kid->tree->id == LEL_ID_STREAM )
+			out << '#' << (void*) ((Stream*)kid->tree)->file;
+		else if ( kid->tree->tokdata != 0 && 
+				string_length( kid->tree->tokdata ) > 0 )
+		{
+			out.write( string_data( kid->tree->tokdata ), 
+					string_length( kid->tree->tokdata ) );
+		}
+	}
+	else {
+		/* Non-terminal. */
+		child = tree_child( prg, kid->tree );
+		if ( child != 0 ) {
+			/* Remember the parent, then visit each child in turn. */
+			push( (SW)kid );
+			kid = child;
+			while ( kid != 0 ) {
+				goto rec_call;
+				rec_return:
+				kid = kid->next;
+			}
+			kid = (Kid*)pop();
+		}
+	}
+
+	/* Anything still on the stack means we are inside a simulated call. */
+	if ( ptop() != root )
+		goto rec_return;
+}
+
+/* Print a tree on standard output; a null tree prints as "NIL". */
+void print_tree( Tree **&sp, Program *prg, Tree *tree )
+{
+	if ( tree == 0 ) {
+		cout << "NIL";
+		return;
+	}
+
+	/* Wrap the tree in a throwaway kid so the kid printer can walk it. */
+	Kid wrapper;
+	wrapper.next = 0;
+	wrapper.tree = tree;
+	print_kid( cout, sp, prg, &wrapper, false );
+}
+
+/* Print a tree to 'out'; a null tree prints as "NIL". The marker goes to
+ * 'out' like everything else, so callers capturing the text into their own
+ * stream see it there and nothing leaks to standard output. */
+void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree )
+{
+	if ( tree == 0 )
+		out << "NIL";
+	else {
+		/* Wrap the tree in a throwaway kid so the kid printer can walk it. */
+		Kid kid;
+		kid.tree = tree;
+		kid.next = 0;
+		print_kid( out, sp, prg, &kid, false );
+	}
+}
+
+/* Write 'len' bytes of 'data' on standard output as XML character data.
+ *
+ * The markup characters '<', '>' and '&' are written as entities so the data
+ * cannot be mistaken for tags. Other printable ASCII is written as is.
+ * Everything else becomes a numeric character reference. Each byte is taken
+ * as unsigned first: with a signed char, a byte of 0x80 or above would
+ * otherwise be sign-extended and printed as a number in the billions. */
+void xml_escape_data( const char *data, long len )
+{
+	for ( long i = 0; i < len; i++ ) {
+		unsigned char c = (unsigned char) data[i];
+		if ( c == '<' )
+			cout << "&lt;";
+		else if ( c == '>' )
+			cout << "&gt;";
+		else if ( c == '&' )
+			cout << "&amp;";
+		else if ( 32 <= c && c <= 126 )
+			cout << (char) c;
+		else
+			cout << "&#" << ((unsigned) c) << ';';
+	}
+}
+
+/* Print the tree under 'kid' on standard output as indented XML, one element
+ * per line, starting at nesting level 'depth' (two spaces per level). A kid
+ * with no tree prints as "NIL". Element names come from the language element
+ * info table.
+ *
+ * The recursion is simulated with gotos: parent kids are kept on the VM stack
+ * and the walk is over once the stack is back at the height it had on entry.
+ * Note that the child list is walked as stored in the tree (kid->tree->child
+ * directly). */
+void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth )
+{
+	Tree **root = ptop();
+	int i = 0;
+
+rec_call:
+	/* Indent to the current nesting level. */
+	for ( i = 0; i < depth; i++ )
+		cout << "  ";
+
+	if ( kid->tree == 0 )
+		cout << "NIL" << endl;
+	else {
+		cout << '<' << prg->rtd->lelInfo[kid->tree->id].name;
+		if ( kid->tree->child != 0 ) {
+			/* Has children: close the open tag, remember the parent on the
+			 * stack and visit each child one level deeper. */
+			cout << '>' << endl;
+			push( (SW) kid );
+			kid = kid->tree->child;
+			while ( kid != 0 ) {
+				depth++;
+				goto rec_call;
+				rec_return:
+				depth--;
+				kid = kid->next;
+
+				/* If the parent kid is a repeat then skip this node and go
+				 * right to the first child (repeated item). */
+				/* NOTE(review): kid is dereferenced here without a null
+				 * check; this presumably relies on a repeat item always
+				 * being followed by a sibling -- confirm. */
+				if ( prg->rtd->lelInfo[((Kid*)top())->tree->id].repeat )
+					kid = kid->tree->child;
+			}
+			kid = (Kid*) pop();
+
+			/* Back at the parent: print its closing tag at its own level. */
+			for ( i = 0; i < depth; i++ )
+				cout << "  ";
+			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_PTR ) {
+			cout << '>' << (void*)((Pointer*)kid->tree)->value << 
+					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_BOOL ) {
+			if ( ((Int*)kid->tree)->value )
+				cout << ">true</";
+			else
+				cout << ">false</";
+			cout << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_INT ) {
+			cout << '>' << ((Int*)kid->tree)->value << 
+					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_STR ) {
+			Head *head = (Head*) ((Str*)kid->tree)->value;
+
+			cout << '>';
+			xml_escape_data( (char*)(head->data), head->length );
+			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		/* A terminal with non-empty token text that is not a literal: print
+		 * the text as the element content. */
+		else if ( 0 < kid->tree->id && kid->tree->id < prg->rtd->firstNonTermId &&
+				kid->tree->tokdata != 0 && 
+				string_length( kid->tree->tokdata ) > 0 && 
+				!prg->rtd->lelInfo[kid->tree->id].literal )
+		{
+			cout << '>';
+			xml_escape_data( string_data( kid->tree->tokdata ), 
+					string_length( kid->tree->tokdata ) );
+			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else
+			/* Nothing to show inside: emit an empty element. */
+			cout << "/>" << endl;
+	}
+
+	/* Anything still on the stack means we are inside a simulated call. */
+	if ( ptop() != root )
+		goto rec_return;
+}
+
+/* Print a tree as XML on standard output, starting at nesting level zero. */
+void xml_print_tree( Tree **&sp, Program *prg, Tree *tree )
+{
+	/* Wrap the tree in a throwaway kid so the kid printer can walk it. */
+	Kid wrapper;
+	wrapper.next = 0;
+	wrapper.tree = tree;
+	xml_print_kid( sp, prg, &wrapper, 0 );
+}
+
+/* Return the tree 'position' links along the list that tree_child() gives
+ * for 'lhs'. The list is assumed to be long enough. */
+Tree *get_rhs_el( Program *prg, Tree *lhs, long position )
+{
+	Kid *at = tree_child( prg, lhs );
+	for ( ; position > 0; position -= 1 )
+		at = at->next;
+	return at->tree;
+}
+
+/* Allocate an array of 'length' tree pointers with every byte cleared.
+ * Returns 0 when length is not positive. The array comes from new[]. */
+Tree **alloc_obj_data( long length )
+{
+	if ( length <= 0 )
+		return 0;
+
+	Tree **slots = new Tree*[length];
+	memset( slots, 0, sizeof(Tree*)*length );
+	return slots;
+}
+
+/* Store 'value' in attribute 'field' of 'tree'. The tree must be unshared
+ * (one reference) and a non-null value must itself be referenced; both are
+ * checked with asserts. No reference counts change here. */
+void set_field( Program *prg, Tree *tree, long field, Tree *value )
+{
+	assert( tree->refs == 1 );
+	assert( value == 0 || value->refs >= 1 );
+	set_attr( tree, field, value );
+}
+
+/* Read attribute 'field' of 'tree'. */
+Tree *get_field( Tree *tree, Word field )
+{
+	Tree *value = get_attr( tree, field );
+	return value;
+}
+
+/* Read attribute 'field' of 'tree' for writing: the value is run through
+ * split_tree, the result is stored back in the attribute and returned. */
+Tree *get_field_split( Program *prg, Tree *tree, Word field )
+{
+	Tree *own = split_tree( prg, get_attr( tree, field ) );
+	set_attr( tree, field, own );
+	return own;
+}
+
+/* Store 'tree' in slot 'field' of the frame. A non-null tree must already be
+ * referenced (asserted). No reference counts change here. */
+void set_local( Tree **frame, long field, Tree *tree )
+{
+	assert( tree == 0 || tree->refs >= 1 );
+	local(field) = tree;
+}
+
+/* Read frame slot 'field' for writing: the value is run through split_tree,
+ * the result is stored back in the slot and returned. */
+Tree *get_local_split( Program *prg, Tree **frame, long field )
+{
+	Tree *own = split_tree( prg, local(field) );
+	local(field) = own;
+	return own;
+}
+
+/* Return the tree held by the kid a pointer refers to. */
+Tree *get_ptr_val( Pointer *ptr )
+{
+	Kid *target = ptr->value;
+	return target->tree;
+}
+
+/* Read the tree behind a pointer for writing: the value is run through
+ * split_tree, the result is stored back in the kid and returned. */
+Tree *get_ptr_val_split( Program *prg, Pointer *ptr )
+{
+	Tree *own = split_tree( prg, ptr->value->tree );
+	ptr->value->tree = own;
+	return own;
+}
+
+/* Release a list: drop a reference on every value, return each element to
+ * the list element pool and finally return the list object itself to the map
+ * element pool. */
+void list_free( Program *prg, List *list )
+{
+	for ( ListEl *el = list->head, *after = 0; el != 0; el = after ) {
+		/* Grab the link before the element goes back to the pool. */
+		after = el->next;
+		tree_downref( prg, el->value );
+		prg->listElPool.free( el );
+	}
+	prg->mapElPool.free( (MapEl*)list );
+}
+
+
+/* Release a map: drop a reference on every key and value, return each
+ * element to the map element pool and finally return the map object itself
+ * to the same pool. */
+void map_free( Program *prg, Map *map )
+{
+	for ( MapEl *el = map->head, *after = 0; el != 0; el = after ) {
+		/* Grab the link before the element goes back to the pool. */
+		after = el->next;
+		tree_downref( prg, el->key );
+		tree_downref( prg, el->tree );
+		prg->mapElPool.free( el );
+	}
+	prg->mapElPool.free( (MapEl*)map );
+}
+
+/* Release a stream: delete its scanner and input source, close the FILE if
+ * there is one and return the stream object to the map element pool. */
+void stream_free( Program *prg, Stream *s )
+{
+	delete s->scanner;
+	delete s->in;
+
+	FILE *file = s->file;
+	if ( file != 0 )
+		fclose( file );
+
+	prg->mapElPool.free( (MapEl*)s );
+}
+
+/* Drop a reference on every frame slot named in 'trees', an array of
+ * 'treesLen' frame offsets. */
+void downref_local_trees( Program *prg, Tree **frame, char *trees, long treesLen )
+{
+	long at = 0;
+	while ( at < treesLen ) {
+		#ifdef COLM_LOG_BYTECODE
+		cerr << "local tree downref: " << (long)trees[at] << endl;
+		#endif
+
+		tree_downref( prg, local(trees[at]) );
+		at += 1;
+	}
+}
+
+/* Add a reference to each of the 'nargs' frame slots starting at IFR_AA. */
+void upref_uiter_args( Tree **frame, long nargs )
+{
+	const long stop = IFR_AA + nargs;
+	long slot = IFR_AA;
+	while ( slot < stop ) {
+		#ifdef COLM_LOG_BYTECODE
+		cerr << "upref local " << slot << endl;
+		#endif
+		tree_upref( local(slot) );
+		slot += 1;
+	}
+}
+
+/* Replace the tree in the kid the iterator currently refers to. */
+void set_triter_cur( TreeIter *iter, Tree *tree )
+{
+	Kid *current = iter->ref.kid;
+	current->tree = tree;
+}
+
+/* Reserve room for a UserIter on the VM stack and construct it in place.
+ * The iterator is handed the stack position right after the reservation,
+ * the function's argument size and the search id. */
+UserIter *uiter_create( Tree **&sp, Program *prg, FunctionInfo *fi, long searchId )
+{
+	pushn( sizeof(UserIter) / sizeof(Word) );
+
+	/* The reserved slots start at the new top of stack. */
+	void *place = ptop();
+	return new(place) UserIter( ptop(), fi->argSize, searchId );
+}
+
+/* Depth-first search step for a tree iterator. Moves iter->ref on to the
+ * next kid whose tree id equals iter->searchId, or to the very next kid when
+ * the search id is the program's 'any' id. 'tryFirst' says whether the kid
+ * currently referenced is itself a candidate. When nothing more is found
+ * iter->ref.kid is set to 0.
+ *
+ * The recursion is simulated with gotos. On the way down a (next, kid) pair
+ * is pushed on the VM stack for each parent and iter->ref.next is pointed at
+ * it, so the pushed pairs serve as the chain of parent refs. Returning on a
+ * match leaves those pairs on the stack. */
+void iter_find( Program *prg, Tree **&sp, TreeIter *iter, bool tryFirst )
+{
+	bool anyTree = iter->searchId == prg->rtd->anyId;
+	Tree **top = iter->stackRoot;
+
+rec_call:
+	if ( tryFirst && ( iter->ref.kid->tree->id == iter->searchId || anyTree ) )
+		return;
+	else if ( iter->ref.kid->tree->child != 0 ) {
+		/* Descend: save the current ref on the stack and make it the parent
+		 * link of the ref that now walks the children. */
+		push( (SW) iter->ref.next );
+		push( (SW) iter->ref.kid );
+		iter->ref.kid = iter->ref.kid->tree->child;
+		iter->ref.next = (Ref*)ptop();
+		while ( iter->ref.kid != 0 ) {
+			/* Every kid reached by descending is a candidate. */
+			tryFirst = true;
+			goto rec_call;
+			rec_return:
+			iter->ref.kid = iter->ref.kid->next;
+		}
+		/* Children exhausted: restore the parent ref. */
+		iter->ref.kid = (Kid*)pop();
+		iter->ref.next = (Ref*)pop();
+	}
+
+	/* Not back at the iterator's stack root yet: resume in the parent. */
+	if ( top != ptop() )
+		goto rec_return;
+	
+	iter->ref.kid = 0;
+}
+
+/* Move a tree iterator to its next match. A null current kid means the
+ * search starts at the root, which is itself a candidate; otherwise the
+ * search resumes after the current item. Records the stack space in use and
+ * returns the program's true value if an item was found, false otherwise. */
+Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter )
+{
+	assert( iter->stackSize == iter->stackRoot - ptop() );
+
+	const bool fromRoot = ( iter->ref.kid == 0 );
+	if ( fromRoot )
+		iter->ref = iter->rootRef;
+	iter_find( prg, sp, iter, fromRoot );
+
+	iter->stackSize = iter->stackRoot - ptop();
+
+	if ( iter->ref.kid )
+		return prg->trueVal;
+	return prg->falseVal;
+}
+
+/* Move a child iterator forward. A null current kid starts at the root's
+ * first child (pushing the root ref on the stack as the parent link);
+ * otherwise the iterator steps to the next sibling. Unless the search id is
+ * the 'any' id, siblings with a different id are then skipped. Records the
+ * stack space in use and returns the program's true value if the iterator
+ * rests on a kid, false otherwise. */
+Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter )
+{
+	assert( iter->stackSize == iter->stackRoot - ptop() );
+
+	if ( iter->ref.kid != 0 ) {
+		/* Have a previous item, step past it. */
+		iter->ref.kid = iter->ref.kid->next;
+	}
+	else if ( iter->rootRef.kid->tree->child == 0 ) {
+		/* Root has no children at all. */
+		iter->ref.kid = 0;
+		iter->ref.next = 0;
+	}
+	else {
+		/* First call: enter the root's child list. */
+		push( (SW) iter->rootRef.next );
+		push( (SW) iter->rootRef.kid );
+		iter->ref.kid = iter->rootRef.kid->tree->child;
+		iter->ref.next = (Ref*)ptop();
+	}
+
+	if ( iter->searchId != prg->rtd->anyId ) {
+		/* Skip ahead to the first sibling with the wanted id. */
+		for ( ; iter->ref.kid != 0 && 
+				iter->ref.kid->tree->id != iter->searchId;
+				iter->ref.kid = iter->ref.kid->next ) {}
+	}
+
+	iter->stackSize = iter->stackRoot - ptop();
+
+	if ( iter->ref.kid )
+		return prg->trueVal;
+	return prg->falseVal;
+}
+
+/* Find the sibling that comes before 'kid' in the child list of 'parent'.
+ * Passing a kid of 0 yields the last child. Returns 0 when 'kid' is the
+ * first child. 'kid' must be 0 or a member of the list. */
+static Kid *tree_iter_kid_before( Kid *parent, Kid *kid )
+{
+	Kid *before = 0, *walk = parent->tree->child;
+	while ( walk != kid ) {
+		before = walk;
+		walk = walk->next;
+	}
+	return before;
+}
+
+/* Move a child iterator backward. A null current kid starts at the root's
+ * last child (pushing the root ref on the stack as the parent link);
+ * otherwise the iterator steps to the previous sibling. Unless the search id
+ * is the 'any' id, siblings with a different id are then skipped, still
+ * moving backward. Records the stack space in use and returns the program's
+ * true value if the iterator rests on a kid, false otherwise.
+ *
+ * The skipping must go in the direction of travel. Stepping forward with
+ * ->next from a non-matching predecessor lands on the kid the iterator just
+ * left, so a reverse walk with a search id would never make progress. */
+Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter )
+{
+	assert( iter->stackSize == iter->stackRoot - ptop() );
+
+	if ( iter->ref.kid == 0 ) {
+		/* Kid is zero, start from the last child. */
+		if ( iter->rootRef.kid->tree->child == 0 ) {
+			iter->ref.kid = 0;
+			iter->ref.next = 0;
+		}
+		else {
+			push( (SW) iter->rootRef.next );
+			push( (SW) iter->rootRef.kid );
+
+			iter->ref.kid = tree_iter_kid_before( iter->rootRef.kid, 0 );
+			iter->ref.next = (Ref*)ptop();
+		}
+	}
+	else {
+		/* Have a previous item, go to the prev sibling. The parent kid is
+		 * on top of the stack. */
+		iter->ref.kid = tree_iter_kid_before( (Kid*) top(), iter->ref.kid );
+	}
+
+	bool anyTree = iter->searchId == prg->rtd->anyId;
+	if ( ! anyTree ) {
+		/* Keep going backward until the id matches or we run out. Whenever
+		 * the current kid is non-null the parent kid is on top of the stack. */
+		while ( iter->ref.kid != 0 && iter->ref.kid->tree->id != iter->searchId ) {
+			iter->ref.kid = tree_iter_kid_before( (Kid*) top(), iter->ref.kid );
+		}
+	}
+
+	iter->stackSize = iter->stackRoot - ptop();
+
+	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
+}
+
+/* Give back the stack space a tree iterator is holding. The recorded size
+ * must match what is actually on the stack (asserted). */
+void tree_iter_destroy( Tree **&sp, TreeIter *iter )
+{
+	long inUse = iter->stackRoot - ptop();
+	assert( iter->stackSize == inUse );
+	popn( iter->stackSize );
+}
+
+/* Tear down a user iterator: pop whatever sits between the top of stack and
+ * the iterator's stack root, then the iterator object itself, then its
+ * arguments. */
+void user_iter_destroy( Tree **&sp, UserIter *uiter )
+{
+	/* We should always be coming from a yield. The current stack size will be
+	 * nonzero and the stack size in the iterator will be correct. */
+	long inUse = uiter->stackRoot - ptop();
+	assert( uiter->stackSize == inUse );
+
+	/* Read what is needed from the iterator before its slots are released. */
+	long argSize = uiter->argSize;
+	Tree **iterRoot = uiter->stackRoot;
+
+	popn( iterRoot - ptop() );
+	popn( sizeof(UserIter) / sizeof(Word) );
+	popn( argSize );
+}
+
+/* Return the tree the iterator currently rests on, or 0 if it rests on
+ * nothing. */
+Tree *tree_iter_deref_cur( TreeIter *iter )
+{
+	Kid *current = iter->ref.kid;
+	if ( current == 0 )
+		return 0;
+	return current->tree;
+}
+
+/* Search a kid list, and everything below it, for the first tree with the
+ * given id. Order is pre-order: a kid's own tree, then its subtree, then the
+ * following siblings. Returns 0 when nothing matches.
+ *
+ * Siblings are walked with a loop so that stack depth follows the depth of
+ * the tree, not the length of its child lists. Kids without a tree are
+ * skipped: child lists can carry empty slots (copy_real_tree notes that a
+ * child "may be an attribute" and checks for 0). */
+Tree *tree_search( Kid *kid, long id )
+{
+	for ( ; kid != 0; kid = kid->next ) {
+		Tree *tree = kid->tree;
+		if ( tree == 0 )
+			continue;
+
+		if ( tree->id == id )
+			return tree;
+
+		if ( tree->child != 0 ) {
+			Tree *found = tree_search( tree->child, id );
+			if ( found != 0 )
+				return found;
+		}
+	}
+	return 0;
+}
+
+/* Search a tree for the first node with the given id: the tree itself, or
+ * failing that whatever the kid-list search finds among its children.
+ * Returns 0 when nothing matches. */
+Tree *tree_search( Tree *tree, long id )
+{
+	if ( tree->id == id )
+		return tree;
+	if ( tree->child != 0 )
+		return tree_search( tree->child, id );
+	return 0;
+}
+
+/* Make a one-level copy of a shared tree. The copy gets the same id, its
+ * own copy of the token data and a fresh list of kids pointing at the same
+ * child trees, each of which gains a reference. The original gives up one
+ * reference. The reference count of the copy is not set here.
+ *
+ * If one of the original's kids is 'oldNextDown', the kid that replaces it
+ * in the copy is reported through 'newNextDown'. */
+Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
+{
+	assert( tree->refs >= 2 );
+
+	Tree *dup = prg->treePool.allocate();
+	dup->id = tree->id;
+	dup->tokdata = string_copy( prg, tree->tokdata );
+//	dup->pos = tree->pos;
+
+	tree->refs -= 1;
+
+	/* The child list holds attributes, ignores and the real children; they
+	 * are all copied the same way. */
+	Kid *tail = 0;
+	for ( Kid *from = tree->child; from != 0; from = from->next ) {
+		Kid *to = prg->kidPool.allocate();
+
+		/* The first kid made becomes the head of the new list. */
+		if ( dup->child == 0 )
+			dup->child = to;
+
+		/* Report the replacement for the kid the caller is tracking. */
+		if ( from == oldNextDown )
+			newNextDown = to;
+
+		to->tree = from->tree;
+		to->next = 0;
+
+		/* Attribute slots may be empty. */
+		if ( to->tree != 0 )
+			to->tree->refs += 1;
+
+		if ( tail != 0 )
+			tail->next = to;
+		tail = to;
+	}
+
+	return dup;
+}
+
+/* Copy a list if it is shared. An unshared list (at most one reference) is
+ * returned as is. Otherwise a new list is built whose elements point at the
+ * same values, each value gaining a reference, and the original gives up one
+ * reference. The reference count of the new list is not set here.
+ *
+ * If one of the original's elements is 'oldNextDown', the element that
+ * replaces it in the copy is reported through 'newNextDown'. */
+List *copy_list( Program *prg, List *list, Kid *oldNextDown, Kid *&newNextDown )
+{
+	if ( list->refs <= 1 )
+		return list;
+
+	#ifdef COLM_LOG_BYTECODE
+	cerr << "splitting list: " << list << " refs: " << 
+			list->refs << endl;
+	#endif
+
+	/* Shared, so a copy is needed. */
+	List *dup = (List*)prg->mapElPool.allocate();
+	dup->id = list->genericInfo->langElId;
+	dup->genericInfo = list->genericInfo;
+
+	list->refs -= 1;
+
+	for ( ListEl *from = list->head; from != 0; from = from->next ) {
+		ListEl *to = prg->listElPool.allocate();
+		to->value = from->value;
+		tree_upref( to->value );
+
+		dup->append( to );
+
+		/* Report the replacement for the element the caller is tracking. */
+		if ( (Kid*)from == oldNextDown )
+			newNextDown = (Kid*)to;
+	}
+
+	return dup;
+}
+
+	
+/* Copy a map if it is shared. An unshared map (at most one reference) is
+ * returned as is. Otherwise a new map is built by copying the element tree
+ * from the root, the original gives up one reference and every value in the
+ * copy gains one. The reference count of the new map is not set here.
+ * 'oldNextDown' and 'newNextDown' are passed through to the branch copy. */
+Map *copy_map( Program *prg, Map *map, Kid *oldNextDown, Kid *&newNextDown )
+{
+	if ( map->refs <= 1 )
+		return map;
+
+	#ifdef COLM_LOG_BYTECODE
+	cerr << "splitting map: " << map << " refs: " << 
+			map->refs << endl;
+	#endif
+
+	Map *dup = (Map*)prg->mapElPool.allocate();
+	dup->id = map->genericInfo->langElId;
+	dup->genericInfo = map->genericInfo;
+	dup->treeSize = map->treeSize;
+	dup->root = 0;
+
+	/* Only a non-empty map has a branch to copy. */
+	if ( map->root != 0 ) {
+		dup->root = dup->copyBranch( prg, map->root, 
+				oldNextDown, newNextDown );
+	}
+
+	map->refs -= 1;
+
+	MapEl *el = dup->head;
+	while ( el != 0 ) {
+		assert( map->genericInfo->typeArg == TYPE_TREE );
+		tree_upref( el->tree );
+		el = el->next;
+	}
+
+	return dup;
+}
+
+/* Copy a tree using the copier that fits its kind: lists and maps go to
+ * their own copiers, pointers, bools, ints and strings are not expected here
+ * (asserted), and everything else is copied as a regular tree. The result
+ * is asserted to carry no references yet. */
+Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	long genericId = lelInfo[tree->id].genericId;
+
+	if ( genericId > 0 ) {
+		GenericInfo *generic = &prg->rtd->genericInfo[genericId];
+		switch ( generic->type ) {
+			case GEN_LIST:
+				tree = (Tree*) copy_list( prg, (List*) tree, 
+						oldNextDown, newNextDown );
+				break;
+			case GEN_MAP:
+				tree = (Tree*) copy_map( prg, (Map*) tree, 
+						oldNextDown, newNextDown );
+				break;
+			default:
+				assert(false);
+				break;
+		}
+	}
+	else if ( tree->id == LEL_ID_PTR || tree->id == LEL_ID_BOOL ||
+			tree->id == LEL_ID_INT || tree->id == LEL_ID_STR )
+	{
+		/* Built-in value types never come through here. */
+		assert(false);
+	}
+	else {
+		tree = copy_real_tree( prg, tree, oldNextDown, newNextDown );
+	}
+
+	assert( tree->refs == 0 );
+	return tree;
+}
+
+/* Make sure the caller holds an unshared tree. A null tree is returned as
+ * is. A tree with more than one reference is copied and the copy given one
+ * reference. The tree returned always has exactly one reference (asserted). */
+Tree *split_tree( Program *prg, Tree *tree )
+{
+	if ( tree == 0 )
+		return tree;
+
+	assert( tree->refs >= 1 );
+
+	if ( tree->refs > 1 ) {
+		#ifdef COLM_LOG_BYTECODE
+		cerr << "splitting tree: " << tree << " refs: " << 
+				tree->refs << endl;
+		#endif
+
+		/* No kid is being tracked across this copy. */
+		Kid *noOldDown = 0, *noNewDown = 0;
+		tree = copy_tree( prg, tree, noOldDown, noNewDown );
+		tree_upref( tree );
+	}
+
+	assert( tree->refs == 1 );
+	return tree;
+}
+
+/* Create an empty map or list for the generic described by 'genericId'. The
+ * object comes from the map element pool and is tagged with the generic's
+ * language element id and info. Any other generic type trips an assert and
+ * yields 0. */
+Tree *create_generic( Program *prg, Word genericId )
+{
+	GenericInfo *genericInfo = &prg->rtd->genericInfo[genericId];
+
+	if ( genericInfo->type == GEN_MAP ) {
+		Map *made = (Map*)prg->mapElPool.allocate();
+		made->id = genericInfo->langElId;
+		made->genericInfo = genericInfo;
+		return (Tree*) made;
+	}
+
+	if ( genericInfo->type == GEN_LIST ) {
+		List *made = (List*)prg->mapElPool.allocate();
+		made->id = genericInfo->langElId;
+		made->genericInfo = genericInfo;
+		return (Tree*) made;
+	}
+
+	assert(false);
+	return 0;
+}
+
+/* Insert 'element' under 'key'. Returns true when the map's insert produced
+ * a new element and the value was stored in it, false otherwise, in which
+ * case the map is left as the insert left it. */
+bool map_insert( Program *prg, Map *map, Tree *key, Tree *element )
+{
+	MapEl *fresh = map->insert( prg, key );
+	if ( fresh == 0 )
+		return false;
+
+	fresh->tree = element;
+	return true;
+}
+
+/* Reverse a removal: put 'element' back under 'key'. The insert is expected
+ * to succeed (asserted). */
+void map_unremove( Program *prg, Map *map, Tree *key, Tree *element )
+{
+	MapEl *restored = map->insert( prg, key );
+	assert( restored != 0 );
+	restored->tree = element;
+}
+
+/* Reverse an insert: detach the element stored under 'key', return it to
+ * the pool and hand back the value it held. The key is expected to be
+ * present. */
+Tree *map_uninsert( Program *prg, Map *map, Tree *key )
+{
+	MapEl *gone = map->detach( key );
+	Tree *held = gone->tree;
+	prg->mapElPool.free( gone );
+	return held;
+}
+
+/* Store 'element' under 'key', overwriting any value already there.
+ * Returns the value that was replaced, or 0 when the key was new. */
+Tree *map_store( Program *prg, Map *map, Tree *key, Tree *element )
+{
+	MapEl *present = 0;
+	MapEl *fresh = map->insert( prg, key, &present );
+
+	if ( fresh != 0 ) {
+		/* Key was not in the map. */
+		fresh->tree = element;
+		return 0;
+	}
+
+	/* Element with key exists. Overwriting the value. */
+	Tree *replaced = present->tree;
+	present->tree = element;
+	return replaced;
+}
+
+/* Reverse a store. With no 'existing' value the element under 'key' is
+ * detached and returned to the pool; otherwise 'existing' is put back in its
+ * place. Either way the value that the store had written is returned. The
+ * key is expected to be present. */
+Tree *map_unstore( Program *prg, Map *map, Tree *key, Tree *existing )
+{
+	if ( existing != 0 ) {
+		/* The store overwrote something: swap the old value back in. */
+		MapEl *el = map->find( key );
+		Tree *written = el->tree;
+		el->tree = existing;
+		return written;
+	}
+
+	/* The store created the element: take it out again. */
+	MapEl *el = map->detach( key );
+	Tree *written = el->tree;
+	prg->mapElPool.free( el );
+	return written;
+}
+
+/* Look up 'key' and return the value stored under it, or 0 if the key is
+ * not in the map. */
+Tree *map_find( Map *map, Tree *key )
+{
+	MapEl *hit = map->find( key );
+	if ( hit == 0 )
+		return 0;
+	return hit->tree;
+}
+
+/* Report what the map's own length() gives. */
+long map_length( Map *map )
+{
+	long count = map->length();
+	return count;
+}
+
+/* Report what the list's own length() gives. */
+long list_length( List *list )
+{
+	long count = list->length();
+	return count;
+}
+
+/* Append 'val' to the end of an unshared list. The list must have exactly
+ * one reference and a non-null value must already be referenced; both are
+ * checked with asserts. No reference counts change here. */
+void list_append( Program *prg, List *list, Tree *val )
+{
+	assert( list->refs == 1 );
+	assert( val == 0 || val->refs >= 1 );
+
+	ListEl *fresh = prg->listElPool.allocate();
+	fresh->value = val;
+	list->append( fresh );
+}
+
+/* Take the last element off the list, return it to the pool and hand back
+ * the value it held. The list is expected to be non-empty. */
+Tree *list_remove_end( Program *prg, List *list )
+{
+	Tree *held = list->tail->value;
+	ListEl *gone = list->detachLast();
+	prg->listElPool.free( gone );
+	return held;
+}
+
+/* Read a list member by field number: 0 is the value at the head, 1 the
+ * value at the tail. Any other field trips an assert and yields 0. */
+Tree *get_list_mem( List *list, Word field )
+{
+	if ( field == 0 )
+		return list->head->value;
+	if ( field == 1 )
+		return list->tail->value;
+
+	assert( false );
+	return 0;
+}
+
+/* Read a list member for writing. Field 0 is the value at the head, field 1
+ * the value at the tail. The value is run through split_tree, the result is
+ * stored back in the element and returned. Any other field trips an assert
+ * and yields 0. */
+Tree *get_list_mem_split( Program *prg, List *list, Word field )
+{
+	ListEl *el = 0;
+	if ( field == 0 )
+		el = list->head;
+	else if ( field == 1 )
+		el = list->tail;
+	else {
+		assert( false );
+		return 0;
+	}
+
+	Tree *own = split_tree( prg, el->value );
+	el->value = own;
+	return own;
+}
+
+/* Write a list member by field number: 0 is the value at the head, 1 the
+ * value at the tail. Returns the value that was replaced. The list must be
+ * unshared and a non-null value must already be referenced; both are checked
+ * with asserts. Any other field trips an assert and yields 0. */
+Tree *set_list_mem( List *list, Half field, Tree *value )
+{
+	assert( list->refs == 1 );
+	assert( value == 0 || value->refs >= 1 );
+
+	ListEl *el = 0;
+	if ( field == 0 )
+		el = list->head;
+	else if ( field == 1 )
+		el = list->tail;
+	else {
+		assert( false );
+		return 0;
+	}
+
+	Tree *replaced = el->value;
+	el->value = value;
+	return replaced;
+}
+
+struct TreePair
+{
+	TreePair() : key(0), val(0) {} /* both pointers start out null */
+
+	Tree *key;
+	Tree *val;
+};
+
+TreePair map_remove( Program *prg, Map *map, Tree *key )
+{
+	/* Left as (0, 0) when the key has no element. */
+	TreePair removed;
+	MapEl *el = map->find( key );
+	if ( el == 0 )
+		return removed;
+	map->detach( el );
+	removed.key = el->key;
+	removed.val = el->tree;
+	prg->mapElPool.free( el ); /* only the element node is released here */
+	return removed;
+}
+
+void split_ref( Tree **&sp, Program *prg, Ref *fromRef )
+{ /* Give every tree along fromRef's chain that has refs > 1 its own copy. */
+	/* Go up the chain of kids, turning the pointers down. (sp is not used.) */
+	Ref *last = 0, *ref = fromRef, *next = 0;
+	while ( ref->next != 0 ) {
+		next = ref->next;
+		ref->next = last;
+		last = ref;
+		ref = next;
+	}
+	ref->next = last;
+
+	/* Now traverse the list, which goes down. */
+	while ( ref != 0 ) {
+		if ( ref->kid->tree->refs > 1 ) {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "splitting tree: " << ref->kid << " refs: " << 
+					ref->kid->tree->refs << endl;
+			#endif
+			/* Find the first ref further down that names a different kid. */
+			Ref *nextDown = ref->next;
+			while ( nextDown != 0 && nextDown->kid == ref->kid )
+				nextDown = nextDown->next;
+
+			Kid *oldNextKidDown = nextDown != 0 ? nextDown->kid : 0;
+			Kid *newNextKidDown = 0;
+			/* NOTE(review): presumably copy_tree sets newNextKidDown to the copy's counterpart of oldNextKidDown -- confirm. */
+			Tree *newTree = copy_tree( prg, ref->kid->tree, 
+					oldNextKidDown, newNextKidDown );
+			tree_upref( newTree ); /* the original tree's count is not touched here */
+			/* Store the copy in the kid of each ref in this run, resetting next as we go. */
+			while ( ref != 0 && ref != nextDown ) {
+				next = ref->next;
+				ref->next = 0;
+
+				ref->kid->tree = newTree;
+				ref = next;
+			}
+
+			/* Correct kid pointers down from ref. */
+			while ( nextDown != 0 && nextDown->kid == oldNextKidDown ) {
+				nextDown->kid = newNextKidDown;
+				nextDown = nextDown->next;
+			}
+		}
+		else {
+			/* Reset the list as we go down. */
+			next = ref->next;
+			ref->next = 0;
+			ref = next;
+		}
+	}
+}
+
+void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter )
+{
+	/* An iterator whose ref has no kid has nothing to split; otherwise split
+	 * along the iterator's own ref. */
+	if ( iter->ref.kid != 0 )
+		split_ref( sp, prg, &iter->ref );
+}
+
+void set_ref_value( Ref *ref, Tree *v )
+{
+	/* Store v through ref and through each following ref in the chain, for as
+	 * long as they keep naming the same kid as the first. */
+	Kid *target = ref->kid;
+	for ( ; ref != 0 && ref->kid == target; ref = ref->next )
+		ref->kid->tree = v;
+}
+
+/* Three-way comparison of two trees. The result is negative, zero or positive
+ * as tree1 orders before, the same as, or after tree2:
+ *   - a null tree orders before any non-null tree;
+ *   - otherwise the lower id orders first;
+ *   - with equal ids the payload decides: the Pointer, Int or Str value for
+ *     those ids, the token data for anything else (absent before present);
+ *   - with equal payloads the children are compared pairwise in order, and
+ *     a child list that runs out first orders first. */
+long cmp_tree( const Tree *tree1, const Tree *tree2 )
+{
+	if ( tree1 == 0 )
+		return tree2 == 0 ? 0 : -1;
+	if ( tree2 == 0 )
+		return 1;
+
+	if ( tree1->id < tree2->id )
+		return -1;
+	if ( tree1->id > tree2->id )
+		return 1;
+
+	/* Same id from here on: compare the payload. An equal payload does not
+	 * return, it falls through to the children. */
+	if ( tree1->id == LEL_ID_PTR ) {
+		if ( ((Pointer*)tree1)->value < ((Pointer*)tree2)->value )
+			return -1;
+		if ( ((Pointer*)tree1)->value > ((Pointer*)tree2)->value )
+			return 1;
+	}
+	else if ( tree1->id == LEL_ID_INT ) {
+		if ( ((Int*)tree1)->value < ((Int*)tree2)->value )
+			return -1;
+		if ( ((Int*)tree1)->value > ((Int*)tree2)->value )
+			return 1;
+	}
+	else if ( tree1->id == LEL_ID_STR ) {
+		long strDiff = cmp_string( ((Str*)tree1)->value, ((Str*)tree2)->value );
+		if ( strDiff != 0 )
+			return strDiff;
+	}
+	else if ( tree1->tokdata == 0 || tree2->tokdata == 0 ) {
+		/* At least one side has no token data. */
+		if ( tree1->tokdata != tree2->tokdata )
+			return tree1->tokdata == 0 ? -1 : 1;
+	}
+	else {
+		long tokDiff = cmp_string( tree1->tokdata, tree2->tokdata );
+		if ( tokDiff != 0 )
+			return tokDiff;
+	}
+
+	/* Walk both child lists in step until one of them ends. */
+	Kid *kid1 = tree1->child, *kid2 = tree2->child;
+	for ( ; kid1 != 0 && kid2 != 0; kid1 = kid1->next, kid2 = kid2->next ) {
+		long childDiff = cmp_tree( kid1->tree, kid2->tree );
+		if ( childDiff != 0 )
+			return childDiff;
+	}
+
+	/* Both ended: equal. Otherwise the list that ended orders first. */
+	if ( kid1 != 0 )
+		return 1;
+	return kid2 != 0 ? -1 : 0;
+}
+
+/* Match pattern node pat (and, if checkNext, its siblings) against kid. Must
+ * traverse in the same order that the bindId assignments are done in. */
+bool match_pattern( Tree **bindings, Program *prg, int pat, Kid *kid, bool checkNext )
+{
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+
+	#ifdef COLM_LOG_MATCH
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	cerr << "match_pattern " << ( pat == -1 ? "NULL" : lelInfo[nodes[pat].id].name ) <<
+			" vs " << ( kid == 0 ? "NULL" : lelInfo[kid->tree->id].name ) << endl;
+	#endif
+
+	/* match node, recurse on children. A pat of -1 means "no pattern node". */
+	if ( pat != -1 && kid != 0 ) {
+		if ( nodes[pat].id == kid->tree->id ) {
+			/* If the pattern node has data, then this means we need to match
+			 * the data against the token data. */
+			if ( nodes[pat].data != 0 ) {
+				/* Check the length of token text. */
+				if ( nodes[pat].length != string_length( kid->tree->tokdata ) )
+					return false;
+
+				/* Check the token text data. */
+				if ( nodes[pat].length > 0 && memcmp( nodes[pat].data, 
+						string_data( kid->tree->tokdata ), nodes[pat].length ) != 0 )
+					return false;
+			}
+
+			/* Node matched: record the binding (kept even if a later check fails). */
+			if ( nodes[pat].bindId > 0 ) {
+				#ifdef COLM_LOG_MATCH
+				cerr << "bindId: " << nodes[pat].bindId << endl;
+				#endif
+				bindings[nodes[pat].bindId] = kid->tree;
+			}
+
+			/* If we didn't match a terminal duplicate of a nonterm then check
+			 * down the children. */
+			if ( !nodes[pat].stop ) {
+				/* Check for failure down child branch. */
+				bool childCheck = match_pattern( bindings, prg, 
+						nodes[pat].child, tree_child( prg, kid->tree ), true );
+				if ( ! childCheck )
+					return false;
+			}
+
+			/* If checking next, then look for failure there. */
+			if ( checkNext ) {
+				bool nextCheck = match_pattern( bindings, prg, 
+						nodes[pat].next, kid->next, true );
+				if ( ! nextCheck )
+					return false;
+			}
+
+			return true;
+		}
+	}
+	else if ( pat == -1 && kid == 0 ) {
+		/* Both null is a match. */
+		return 1; /* i.e. true */
+	}
+
+	return false; /* ids differ, or only one of pattern and kid ran out */
+}
+
+Tree *construct_integer( Program *prg, long i )
+{
+	/* An Int is laid over a tree-pool node; only id and value are set here. */
+	Int *node = (Int*) prg->treePool.allocate();
+	node->id = LEL_ID_INT;
+	node->value = i;
+	return (Tree*)node;
+}
+
+Tree *construct_string( Program *prg, Head *s )
+{
+	/* A Str is laid over a tree-pool node; only id and value are set here. */
+	Str *node = (Str*) prg->treePool.allocate();
+	node->id = LEL_ID_STR;
+	node->value = s;
+	return (Tree*)node;
+}
+
+Tree *construct_pointer( Program *prg, Tree *tree )
+{
+	/* Wrap tree in a fresh kid, pushed on the front of the program's heap list. */
+	Kid *cell = prg->kidPool.allocate();
+	cell->tree = tree;
+	cell->next = prg->heap;
+	prg->heap = cell;
+	/* The pointer value is that kid, not the tree itself. */
+	Pointer *ptr = (Pointer*) prg->treePool.allocate();
+	ptr->id = LEL_ID_PTR;
+	ptr->value = cell;
+	return (Tree*)ptr;
+}
+
+Tree *construct_term( Program *prg, Word id, Head *tokdata )
+{
+	/* The new tree starts with no references and carries the token data. */
+	Tree *term = prg->treePool.allocate();
+	term->id = id;
+	term->refs = 0;
+	term->tokdata = tokdata;
+
+	/* Its child list is whatever alloc_attrs builds for the objectLength
+	 * recorded for this language element. */
+	int attrCount = prg->rtd->lelInfo[term->id].objectLength;
+	term->child = alloc_attrs( prg, attrCount );
+	return term;
+}
+
+Kid *construct_replacement_kid( Tree **bindings, Program *prg, Kid *prev, int pat );
+
+/* Build the kid list for the ignore nodes attached to pattern node pat. The
+ * chain starts at nodes[pat].ignore and follows next until a negative index.
+ * Each entry becomes a tree with refs = 1, the node's id and a string made
+ * from the node's data. Returns the first kid, or 0 when there are none. */
+Kid *construct_ignore_list( Program *prg, long pat )
+{
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+
+	/* link always addresses the pointer the next kid must be stored in. */
+	Kid *first = 0;
+	Kid **link = &first;
+	for ( long ign = nodes[pat].ignore; ign >= 0; ign = nodes[ign].next ) {
+		Head *text = string_alloc_const( prg, nodes[ign].data, nodes[ign].length );
+
+		Tree *ignTree = prg->treePool.allocate();
+		ignTree->refs = 1;
+		ignTree->id = nodes[ign].id;
+		ignTree->tokdata = text;
+
+		Kid *ignKid = prg->kidPool.allocate();
+		ignKid->tree = ignTree;
+		ignKid->next = 0;
+
+		*link = ignKid;
+		link = &ignKid->next;
+	}
+
+	return first;
+}
+
+/* Build the tree for replacement node pat. The result already carries a
+ * reference: a bound tree is reused (the bindings were uprefed beforehand),
+ * a constructed tree is created with refs = 1. */
+Tree *construct_replacement_tree( Tree **bindings, Program *prg, int pat )
+{
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+
+	if ( nodes[pat].bindId > 0 ) {
+		/* A binding: reuse the bound tree. All bindings have been uprefed. */
+		Tree *bound = bindings[nodes[pat].bindId];
+
+		/* With ignore nodes present, split first, then make the ignore list
+		 * the child list of the result. */
+		if ( nodes[pat].ignore >= 0 ) {
+			bound = split_tree( prg, bound );
+			bound->child = construct_ignore_list( prg, pat );
+		}
+		return bound;
+	}
+
+	/* Not a binding: make a new tree from the node's id and data. */
+	Tree *made = prg->treePool.allocate();
+	made->id = nodes[pat].id;
+	made->refs = 1;
+	made->tokdata = nodes[pat].length == 0 ? 0 :
+			string_alloc_const( prg, nodes[pat].data, nodes[pat].length );
+
+	/* Children are, in order: attributes, ignore tokens, constructed kids. */
+	int objectLength = prg->rtd->lelInfo[made->id].objectLength;
+	Kid *attrs = alloc_attrs( prg, objectLength );
+	Kid *ignore = construct_ignore_list( prg, pat );
+	Kid *child = construct_replacement_kid( bindings, prg,
+			0, nodes[pat].child );
+
+	made->child = kid_list_concat( attrs,
+			kid_list_concat( ignore, child ) );
+
+	return made;
+}
+
+/* Build the kid list for replacement node pat and the nodes that follow it via
+ * next. A pat of -1 ends the list and yields 0. The prev argument is only
+ * passed along to the recursive call, never read. */
+Kid *construct_replacement_kid( Tree **bindings, Program *prg, Kid *prev, int pat )
+{
+	if ( pat == -1 )
+		return 0;
+
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+
+	/* This node's tree is built before the rest of the list. */
+	Kid *kid = prg->kidPool.allocate();
+	kid->tree = construct_replacement_tree( bindings, prg, pat );
+	kid->next = construct_replacement_kid( bindings, prg,
+			kid, nodes[pat].next );
+
+	return kid;
+}
+
+bool test_false( Program *prg, Tree *tree )
+{
+	/* False values: nil, the program's false constant, and an Int tree whose
+	 * value is zero. Everything else counts as true. */
+	if ( tree == 0 || tree == prg->falseVal )
+		return true;
+	return tree->id == LEL_ID_INT && ((Int*)tree)->value == 0;
+}
+
+/*
+ * Execution environment
+ */
+
+Program::Program( bool ctxDepParsing, RuntimeData *rtd )
+:
+	ctxDepParsing(ctxDepParsing),
+	rtd(rtd),
+	global(0),
+	heap(0),
+	stdinVal(0),
+	stdoutVal(0),
+	stderrVal(0)
+{
+	/* trueVal and falseVal: Int-shaped pool trees, id LEL_ID_BOOL, refs 1. */
+	Int *yes = (Int*) treePool.allocate();
+	yes->id = LEL_ID_BOOL;
+	yes->refs = 1;
+	yes->value = 1;
+	trueVal = (Tree*)yes;
+
+	Int *no = (Int*) treePool.allocate();
+	no->id = LEL_ID_BOOL;
+	no->refs = 1;
+	no->value = 0;
+	falseVal = (Tree*)no;
+}
+
+void Program::clearGlobal()
+{
+	/* Drop the reference held on each field of the global object. */
+	for ( int g = 0; g < rtd->globalSize; g++ )
+		tree_downref( this, get_attr( global, g ) );
+
+	/* Free the attribute kids (only when there are fields), then the object. */
+	if ( rtd->globalSize > 0 )
+		free_attrs( this, global->child );
+	treePool.free( global );
+
+	global = 0; /* do not leave a dangling pointer for freshGlobal() to clear again */
+}
+
+void Program::freshGlobal()
+{
+	/* Clear any current global object, then install a fresh one (refs = 1). */
+	if ( global != 0 )
+		clearGlobal();
+	Tree *fresh = treePool.allocate();
+	fresh->child = alloc_attrs( this, rtd->globalSize );
+	fresh->refs = 1;
+	global = fresh;
+}
+
+/* Release everything the program still holds, report pool entries that were
+ * never freed, empty the pools and zero the vm stack. */
+void Program::clear()
+{
+	#ifdef COLM_LOG_BYTECODE
+	cerr << "clearing the prg" << endl;
+	#endif
+
+	clearGlobal();
+
+	/* Downref each tree on the heap list and free its kid. */
+	for ( Kid *cell = heap; cell != 0; ) {
+		Kid *after = cell->next;
+		tree_downref( this, cell->tree );
+		kidPool.free( cell );
+		cell = after;
+	}
+
+	/* Give up the references on the constants and the stdin/stdout/stderr values. */
+	tree_downref( this, trueVal );
+	tree_downref( this, falseVal );
+	tree_downref( this, (Tree*)stdinVal );
+	tree_downref( this, (Tree*)stdoutVal );
+	tree_downref( this, (Tree*)stderrVal );
+
+	/* Anything a pool still counts as lost at this point gets a warning. */
+	long lostKids = kidPool.numlost();
+	if ( lostKids )
+		cerr << "warning lost kids: " << lostKids << endl;
+
+	long lostTrees = treePool.numlost();
+	if ( lostTrees )
+		cerr << "warning lost trees: " << lostTrees << endl;
+
+	long lostAlgs = algPool.numlost();
+	if ( lostAlgs )
+		cerr << "warning lost algs: " << lostAlgs << endl;
+
+	long lostListEls = listElPool.numlost();
+	if ( lostListEls )
+		cerr << "warning lost listEls: " << lostListEls << endl;
+
+	long lostMapEls = mapElPool.numlost();
+	if ( lostMapEls )
+		cerr << "warning lost mapEls: " << lostMapEls << endl;
+
+	/* Empty all five pools. */
+	kidPool.clear();
+	treePool.clear();
+	algPool.clear();
+	listElPool.clear();
+	mapElPool.clear();
+
+	/* Wipe every slot of the vm stack. */
+	memset( vm_stack, 0, sizeof(Tree*) * VM_STACK_SIZE);
+}
+
+void Program::run()
+{
+	/* Check the struct size relationships, map the vm stack, run the root code. */
+	assert( sizeof(Int)      <= sizeof(Tree) );
+	assert( sizeof(Str)      <= sizeof(Tree) );
+	assert( sizeof(Pointer)  <= sizeof(Tree) );
+	assert( sizeof(Map)      <= sizeof(MapEl) );
+	assert( sizeof(List)     <= sizeof(MapEl) );
+	assert( sizeof(Stream)   <= sizeof(MapEl) );
+	vm_stack = (Tree**)mmap( 0, sizeof(Tree*)*VM_STACK_SIZE,
+		PROT_READ | PROT_WRITE, MAP_ANONYMOUS | MAP_PRIVATE, -1, 0 ); /* fd -1: portable form for MAP_ANONYMOUS */
+	if ( vm_stack == MAP_FAILED ) {
+		cerr << "error: failed to map the vm stack" << endl;
+		exit(1);
+	}
+	Tree **root = &vm_stack[VM_STACK_SIZE]; /* one past the last slot */
+
+	if ( rtd->rootCodeLen > 0 ) {
+		CodeVect reverseCode;
+		CodeVect allReverseCode;
+		Execution execution( this, reverseCode, 0, rtd->rootCode, 0, 0 );
+		execution.execute( root );
+		/* Pull out the reverse code and free it. */
+		#ifdef COLM_LOG_BYTECODE
+		cerr << "freeing the root reverse code" << endl;
+		#endif
+		if ( makeReverseCode( allReverseCode, reverseCode ) )
+			rcode_downref( root, this, allReverseCode.data );
+	}
+}
+
+Execution::Execution( Program *prg, CodeVect &reverseCode,
+		PdaRun *parser, Code *code, Tree *lhs, Head *matchText )
+:
+	prg(prg),
+	parser(parser),
+	code(code),
+	frame(0),
+	iframe(0),
+	lhs(lhs),
+	matchText(matchText),
+	reject(false),
+	reverseCode(reverseCode),
+	rcodeUnitLen(0)
+{
+	/* A left-hand side, when given, must arrive with exactly one reference. */
+	assert( lhs == 0 || lhs->refs == 1 );
+}
+
+void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *rev )
+{
+	while ( rev->length() > 0 ) { /* one trailing block is consumed per pass */
+		/* Read the length word stored in the last 4 bytes of the vector. */
+		Code *prcode = rev->data + rev->length() - 4;
+		Word len;
+		read_word_p( len, prcode );
+
+		/* The block starts len bytes before that length word. */
+		long start = rev->length() - len - 4;
+		prcode = rev->data + start;
+
+		/* Hand the block to rcode_downref, which downrefs the trees it carries. */
+		rcode_downref( stack_root, prg, prcode );
+
+		/* Back up over the block and its length word. */
+		rev->tabLen -= len + 4;
+	}
+}
+
+void rcode_downref( Tree **stack_root, Program *prg, Code *instr )
+{ /* Walk reverse code without executing it, downref'ing the trees its operands carry. */
+again:
+	switch ( *instr++ ) { /* instr now points at the operands of the opcode just read */
+		case IN_PARSE_BKT: {
+			Half parserId;
+			Tree *stream, *tree;
+			Word wrev;
+			read_half( parserId );
+			read_tree( stream );
+			read_tree( tree );
+			read_word( wrev );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PARSE_BKT " << parserId << endl;
+			#endif
+
+			parsed_downref( stack_root, prg, tree );
+			rcode_downref_all( stack_root, prg, (CodeVect*)wrev ); /* the word operand is a CodeVect pointer */
+			tree_downref( prg, stream );
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_STREAM_PULL_BKT: {
+			Tree *stream, *str;
+			read_tree( stream );
+			read_tree( str );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STREAM_PULL_BKT" << endl;
+			#endif
+
+			tree_downref( prg, stream );
+			tree_downref( prg, str );
+			break;
+		}
+		case IN_STREAM_PUSH_BKT: {
+			Tree *stream;
+			Word len;
+			read_tree( stream );
+			read_word( len );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STREAM_PUSH_BKT" << endl;
+			#endif
+
+			// FIXME: Implement
+			break;
+		}
+		case IN_LOAD_GLOBAL_BKT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_GLOBAL_BKT" << endl;
+			#endif
+			break;
+		}
+		case IN_GET_FIELD_BKT: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_FIELD_BKT " << field << endl;
+			#endif
+			break;
+		}
+		case IN_SET_FIELD_BKT: {
+			short field;
+			Tree *val;
+			read_half( field );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_FIELD_BKT " << field << endl;
+			#endif
+
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_PTR_DEREF_BKT: {
+			Tree *ptr;
+			read_tree( ptr );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PTR_DEREF_BKT" << endl;
+			#endif
+
+			tree_downref( prg, ptr );
+			break;
+		}
+		case IN_SET_TOKEN_DATA_BKT: {
+			Word oldval;
+			read_word( oldval );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_TOKEN_DATA_BKT " << endl;
+			#endif
+
+			Head *head = (Head*)oldval; /* the word operand is the old Head pointer */
+			string_free( prg, head );
+			break;
+		}
+		case IN_LIST_APPEND_BKT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_APPEND_BKT" << endl;
+			#endif
+			break;
+		}
+		case IN_LIST_REMOVE_END_BKT: {
+			Tree *val;
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_REMOVE_END_BKT" << endl;
+			#endif
+
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_GET_LIST_MEM_BKT: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LIST_MEM_BKT " << field << endl;
+			#endif
+			break;
+		}
+		case IN_SET_LIST_MEM_BKT: {
+			Half field;
+			Tree *val;
+			read_half( field );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_LIST_MEM_BKT " << field << endl;
+			#endif
+
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_MAP_INSERT_BKT: {
+			uchar inserted;
+			Tree *key;
+			read_byte( inserted );
+			read_tree( key );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_INSERT_BKT" << endl;
+			#endif
+			
+			tree_downref( prg, key );
+			break;
+		}
+		case IN_MAP_STORE_BKT: {
+			Tree *key, *val;
+			read_tree( key );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_STORE_BKT" << endl;
+			#endif
+
+			tree_downref( prg, key );
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_MAP_REMOVE_BKT: {
+			Tree *key, *val;
+			read_tree( key );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_REMOVE_BKT" << endl;
+			#endif
+
+			tree_downref( prg, key );
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_STOP: {
+			return; /* end of this block of reverse code */
+		}
+		default: {
+			cerr << "UNKNOWN INSTRUCTION: " << (ulong)instr[-1] << 
+					" -- reverse code downref" << endl;
+			exit(1);
+			break;
+		}
+	}
+	goto again; /* on to the next instruction */
+}
+
+void Execution::execute( Tree **root )
+{
+	Tree **sp = root; /* working stack pointer; presumably what push/pop operate on */
+
+	/* If we have a lhs push it to the stack. */
+	bool haveLhs = lhs != 0;
+	if ( haveLhs )
+		push( lhs );
+
+	/* Execution loop: run this execution's code; sp is passed by reference. */
+	execute( sp, code );
+
+	/* Take the lhs off the stack; the member is updated with what was popped. */
+	if ( haveLhs )
+		lhs = (Tree*) pop();
+
+	assert( sp == root ); /* the stack pointer must be back where it started */
+}
+
+/* Move the reverse code accumulated in reverseCode onto the end of all as one
+ * block: the units in reverse order, then IN_STOP, then the block's length.
+ * reverseCode is emptied. Returns false, changing nothing, when reverseCode
+ * holds no code. */
+bool makeReverseCode( CodeVect &all, CodeVect &reverseCode )
+{
+	/* Open question kept from the original: do we need to revert the lhs? */
+	if ( reverseCode.length() == 0 )
+		return false;
+
+	long blockStart = all.length();
+
+	/* Each unit ends with one byte holding the length of what precedes it, so
+	 * the units can be peeled off from the back, last one first. */
+	Code *cursor = reverseCode.data + reverseCode.length();
+	while ( cursor != reverseCode.data ) {
+		long unitLen = *--cursor;
+		cursor -= unitLen;
+		all.append( cursor, unitLen );
+	}
+
+	/* Close the block: IN_STOP, then the length (which counts the IN_STOP). */
+	all.append( IN_STOP );
+	long blockLen = all.length() - blockStart;
+	all.appendWord( blockLen );
+
+	/* The units have all been copied out. */
+	reverseCode.tabLen = 0;
+	return true;
+}
+
+void Execution::rexecute( Tree **root, Code *rcode, CodeVect &allRev )
+{
+	/* Read the length word in the last 4 bytes of allRev. (rcode is not used.) */
+	Code *prcode = allRev.data + allRev.length() - 4;
+	Word len;
+	read_word_p( len, prcode );
+
+	/* The block starts len bytes before that length word. */
+	long start = allRev.length() - len - 4;
+	prcode = allRev.data + start;
+
+	/* Execute it; the stack pointer must come back to root. */
+	Tree **sp = root;
+	execute( sp, prcode );
+	assert( sp == root );
+
+	/* Back up over the block and its length word. */
+	allRev.tabLen -= len + 4;
+}
+
+void Execution::execute( Tree **&sp, Code *instr )
+{
+again:
+	switch ( *instr++ ) {
+		case IN_LOAD_NIL: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_NIL" << endl;
+			#endif
+
+			push( 0 );
+			break;
+		}
+		case IN_LOAD_TRUE: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_TRUE" << endl;
+			#endif
+
+			tree_upref( prg->trueVal );
+			push( prg->trueVal );
+			break;
+		}
+		case IN_LOAD_FALSE: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_FALSE" << endl;
+			#endif
+
+			tree_upref( prg->falseVal );
+			push( prg->falseVal );
+			break;
+		}
+		case IN_LOAD_INT: {
+			Word i;
+			read_word( i );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_INT " << i << endl;
+			#endif
+
+			Tree *tree = construct_integer( prg, i );
+			tree_upref( tree );
+			push( tree );
+			break;
+		}
+		case IN_LOAD_STR: {
+			Word offset;
+			read_word( offset );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_STR " << offset << endl;
+			#endif
+
+			Head *lit = make_literal( prg, offset );
+			Tree *tree = construct_string( prg, lit );
+			tree_upref( tree );
+			push( tree );
+			break;
+		}
+		case IN_PRINT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PRINT" << endl;
+			#endif
+
+			Tree *tree = pop();
+			print_tree( sp, prg, tree );
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_PRINT_XML: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PRINT_XML" << endl;
+			#endif
+
+			Tree *tree = pop();
+			xml_print_tree( sp, prg, tree );
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_LOAD_GLOBAL_R: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_GLOBAL_R" << endl;
+			#endif
+
+			tree_upref( prg->global );
+			push( prg->global );
+			break;
+		}
+		case IN_LOAD_GLOBAL_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_GLOBAL_WV" << endl;
+			#endif
+
+			tree_upref( prg->global );
+			push( prg->global );
+
+			/* Set up the reverse instruction. */
+			reverseCode.append( IN_LOAD_GLOBAL_BKT );
+			rcodeUnitLen = 1;
+			break;
+		}
+		case IN_LOAD_GLOBAL_BKT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_GLOBAL_BKT" << endl;
+			#endif
+
+			tree_upref( prg->global );
+			push( prg->global );
+			break;
+		}
+		case IN_INIT_RHS_EL: {
+			Half position;
+			short field;
+			read_half( position );
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_INIT_RHS_EL " << position << " " << field << endl;
+			#endif
+
+			Tree *val = get_rhs_el( prg, lhs, position );
+			tree_upref( val );
+			local(field) = val;
+			break;
+		}
+		case IN_UITER_ADVANCE: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_ADVANCE " << field << endl;
+			#endif
+
+			/* Get the iterator. */
+			UserIter *uiter = (UserIter*) local(field);
+
+			long stackSize = uiter->stackRoot - ptop();
+			assert( uiter->stackSize == stackSize );
+
+			/* Fix the return instruction pointer. */
+			uiter->stackRoot[-IFR_AA + IFR_RIN] = (SW)instr;
+
+			instr = uiter->resume;
+			frame = uiter->frame;
+			iframe = &uiter->stackRoot[-IFR_AA];
+			break;
+		}
+		case IN_UITER_GET_CUR_R: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_GET_CUR_R " << field << endl;
+			#endif
+
+			UserIter *uiter = (UserIter*) local(field);
+			Tree *val = uiter->ref.kid->tree;
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_UITER_GET_CUR_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_GET_CUR_WC " << field << endl;
+			#endif
+
+			UserIter *uiter = (UserIter*) local(field);
+			split_ref( sp, prg, &uiter->ref );
+			Tree *split = uiter->ref.kid->tree;
+			tree_upref( split );
+			push( split );
+			break;
+		}
+		case IN_UITER_SET_CUR_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_SET_CUR_WC " << field << endl;
+			#endif
+
+			Tree *t = pop();
+			UserIter *uiter = (UserIter*) local(field);
+			split_ref( sp, prg, &uiter->ref );
+			Tree *old = uiter->ref.kid->tree;
+			uiter->ref.kid->tree = t;
+			tree_downref( prg, old );
+			break;
+		}
+		case IN_GET_LOCAL_R: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LOCAL_R " << field << endl;
+			#endif
+
+			Tree *val = local(field);
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_GET_LOCAL_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LOCAL_WC " << field << endl;
+			#endif
+
+			Tree *split = get_local_split( prg, frame, field );
+			tree_upref( split );
+			push( split );
+			break;
+		}
+		case IN_SET_LOCAL_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_LOCAL_WC " << field << endl;
+			#endif
+
+			Tree *val = pop();
+			tree_downref( prg, local(field) );
+			set_local( frame, field, val );
+			break;
+		}
+		case IN_SAVE_RET: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SAVE_RET " << endl;
+			#endif
+
+			Tree *val = pop();
+			local(FR_RV) = val;
+			break;
+		}
+		case IN_GET_LOCAL_REF_R: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LOCAL_REF_R " << field << endl;
+			#endif
+
+			Ref *ref = (Ref*) plocal(field);
+			Tree *val = ref->kid->tree;
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_GET_LOCAL_REF_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LOCAL_REF_WC " << field << endl;
+			#endif
+
+			Ref *ref = (Ref*) plocal(field);
+			split_ref( sp, prg, ref );
+			Tree *val = ref->kid->tree;
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_SET_LOCAL_REF_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_LOCAL_REF_WC " << field << endl;
+			#endif
+
+			Tree *val = pop();
+			Ref *ref = (Ref*) plocal(field);
+			split_ref( sp, prg, ref );
+			set_ref_value( ref, val );
+			break;
+		}
+		case IN_GET_FIELD_R: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_FIELD_R " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *val = get_field( obj, field );
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_GET_FIELD_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_FIELD_WC " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *split = get_field_split( prg, obj, field );
+			tree_upref( split );
+			push( split );
+			break;
+		}
+		case IN_GET_FIELD_WV: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_FIELD_WV " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *split = get_field_split( prg, obj, field );
+			tree_upref( split );
+			push( split );
+
+			/* Set up the reverse instruction. */
+			reverseCode.append( IN_GET_FIELD_BKT );
+			reverseCode.appendHalf( field );
+			rcodeUnitLen += 3;
+			break;
+		}
+		case IN_GET_FIELD_BKT: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_FIELD_BKT " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *split = get_field_split( prg, obj, field );
+			tree_upref( split );
+			push( split );
+			break;
+		}
+		case IN_SET_FIELD_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_FIELD_WC " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *val = pop();
+			tree_downref( prg, obj );
+
+			/* Downref the old value. */
+			Tree *prev = get_field( obj, field );
+			tree_downref( prg, prev );
+
+			set_field( prg, obj, field, val );
+			break;
+		}
+		case IN_SET_FIELD_WV: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_FIELD_WV " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *val = pop();
+			tree_downref( prg, obj );
+
+			/* Save the old value, then set the field. */
+			Tree *prev = get_field( obj, field );
+			set_field( prg, obj, field, val );
+
+			/* Set up the reverse instruction. */
+			reverseCode.append( IN_SET_FIELD_BKT );
+			reverseCode.appendHalf( field );
+			reverseCode.appendWord( (Word)prev );
+			rcodeUnitLen += 7;
+			reverseCode.append( rcodeUnitLen );
+			/* FLUSH */
+			break;
+		}
+		case IN_SET_FIELD_BKT: {
+			short field;
+			Tree *val;
+			read_half( field );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_FIELD_BKT " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			/* Downref the old value. */
+			Tree *prev = get_field( obj, field );
+			tree_downref( prg, prev );
+
+			set_field( prg, obj, field, val );
+			break;
+		}
+		case IN_SET_FIELD_LEAVE_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_FIELD_LEAVE_WC " << field << endl;
+			#endif
+
+			/* Note that we don't downref the object here because we are
+			 * leaving it on the stack. */
+			Tree *obj = pop();
+			Tree *val = pop();
+
+			/* Downref the old value. */
+			Tree *prev = get_field( obj, field );
+			tree_downref( prg, prev );
+
+			/* Set the field. */
+			set_field( prg, obj, field, val );
+
+			/* Leave the object on the top of the stack. */
+			push( obj );
+			break;
+		}
+		case IN_POP: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_POP" << endl;
+			#endif
+
+			Tree *val = pop();
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_STR_ATOI: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STR_ATOI" << endl;
+			#endif
+
+			Str *str = (Str*)pop();
+			Word res = str_atoi( str->value );
+			Tree *integer = construct_integer( prg, res );
+			tree_upref( integer );
+			push( integer );
+			tree_downref( prg, (Tree*)str );
+			break;
+		}
+		case IN_INT_TO_STR: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_INT_TO_STR" << endl;
+			#endif
+
+			Int *i = (Int*)pop();
+			Head *res = int_to_str( prg, i->value );
+			Tree *str = construct_string( prg, res );
+			tree_upref( str );
+			push( str );
+			tree_downref( prg, (Tree*) i );
+			break;
+		}
+		case IN_CONCAT_STR: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_CONCAT_STR" << endl;
+			#endif
+
+			Str *s2 = (Str*)pop();
+			Str *s1 = (Str*)pop();
+			Head *res = concat_str( s1->value, s2->value );
+			Tree *str = construct_string( prg, res );
+			tree_upref( str );
+			tree_downref( prg, (Tree*)s1 );
+			tree_downref( prg, (Tree*)s2 );
+			push( str );
+			break;
+		}
+		case IN_STR_UORD8: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STR_UORD8" << endl;
+			#endif
+
+			Str *str = (Str*)pop();
+			Word res = str_uord8( str->value );
+			Tree *tree = construct_integer( prg, res );
+			tree_upref( tree );
+			push( tree );
+			tree_downref( prg, (Tree*)str );
+			break;
+		}
+		case IN_STR_UORD16: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STR_UORD16" << endl;
+			#endif
+
+			Str *str = (Str*)pop();
+			Word res = str_uord16( str->value );
+			Tree *tree = construct_integer( prg, res );
+			tree_upref( tree );
+			push( tree );
+			tree_downref( prg, (Tree*)str );
+			break;
+		}
+
+		case IN_STR_LENGTH: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STR_LENGTH" << endl;
+			#endif
+
+			Str *str = (Str*)pop();
+			long len = string_length( str->value );
+			Tree *res = construct_integer( prg, len );
+			tree_upref( res );
+			push( res );
+			tree_downref( prg, (Tree*)str );
+			break;
+		}
+		case IN_JMP_FALSE: {
+			short dist;
+			read_half( dist );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_JMP_FALSE " << dist << endl;
+			#endif
+
+			Tree *tree = pop();
+			if ( test_false( prg, tree ) )
+				instr += dist;
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_JMP_TRUE: {
+			short dist;
+			read_half( dist );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_JMP_TRUE " << dist << endl;
+			#endif
+
+			Tree *tree = pop();
+			if ( !test_false( prg, tree ) )
+				instr += dist;
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_JMP: {
+			short dist;
+			read_half( dist );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_JMP " << dist << endl;
+			#endif
+
+			instr += dist;
+			break;
+		}
+		case IN_REJECT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_REJECT" << endl;
+			#endif
+			reject = true;
+			break;
+		}
+
+		/*
+		 * Binary comparison operators.
+		 */
+		case IN_TST_EQL: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_EQL" << endl;
+			#endif
+
+			Tree *o2 = pop();
+			Tree *o1 = pop();
+			long r = cmp_tree( o1, o2 );
+			Tree *val = r ? prg->falseVal : prg->trueVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break;
+		}
+		case IN_TST_NOT_EQL: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_NOT_EQL" << endl;
+			#endif
+
+			Tree *o2 = pop();
+			Tree *o1 = pop();
+			long r = cmp_tree( o1, o2 );
+			Tree *val = r ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break;
+		}
+		case IN_TST_LESS: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_LESS" << endl;
+			#endif
+
+			Tree *o2 = pop();
+			Tree *o1 = pop();
+			long r = cmp_tree( o1, o2 );
+			Tree *val = r < 0 ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break;
+		}
+		case IN_TST_LESS_EQL: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_LESS_EQL" << endl;
+			#endif
+
+			Tree *o2 = pop(); /* Popped first, so it was pushed last. */
+			Tree *o1 = pop();
+			Tree *val = cmp_tree( o1, o2 ) <= 0 ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break; /* Was missing: control fell into IN_TST_GRTR and popped two more operands. */
+		}
+		case IN_TST_GRTR: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_GRTR" << endl;
+			#endif
+
+			Tree *o2 = pop();
+			Tree *o1 = pop();
+			long r = cmp_tree( o1, o2 );
+			Tree *val = r > 0 ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break;
+		}
+		case IN_TST_GRTR_EQL: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_GRTR_EQL" << endl;
+			#endif
+
+			Tree *o2 = (Tree*)pop();
+			Tree *o1 = (Tree*)pop();
+			long r = cmp_tree( o1, o2 );
+			Tree *val = r >= 0 ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break;
+		}
+		case IN_TST_LOGICAL_AND: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_LOGICAL_AND" << endl;
+			#endif
+
+			Tree *o2 = pop();
+			Tree *o1 = pop();
+			long v2 = !test_false( prg, o2 );
+			long v1 = !test_false( prg, o1 );
+			Word r = v1 && v2;
+			Tree *val = r ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break;
+		}
+		case IN_TST_LOGICAL_OR: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TST_LOGICAL_OR" << endl;
+			#endif
+
+			Tree *o2 = pop();
+			Tree *o1 = pop();
+			long v2 = !test_false( prg, o2 );
+			long v1 = !test_false( prg, o1 );
+			Word r = v1 || v2;
+			Tree *val = r ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, o1 );
+			tree_downref( prg, o2 );
+			break;
+		}
+		case IN_NOT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_NOT" << endl;
+			#endif
+
+			Tree *tree = (Tree*)pop();
+			long r = test_false( prg, tree );
+			Tree *val = r ? prg->trueVal : prg->falseVal;
+			tree_upref( val );
+			push( val );
+			tree_downref( prg, tree );
+			break;
+		}
+
+		case IN_ADD_INT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_ADD_INT" << endl;
+			#endif
+
+			Int *o2 = (Int*)pop();
+			Int *o1 = (Int*)pop();
+			long r = o1->value + o2->value;
+			Tree *tree = construct_integer( prg, r );
+			tree_upref( tree );
+			push( tree );
+			tree_downref( prg, (Tree*)o1 );
+			tree_downref( prg, (Tree*)o2 );
+			break;
+		}
+		case IN_MULT_INT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MULT_INT" << endl;
+			#endif
+
+			Int *o2 = (Int*)pop();
+			Int *o1 = (Int*)pop();
+			long r = o1->value * o2->value;
+			Tree *tree = construct_integer( prg, r );
+			tree_upref( tree );
+			push( tree );
+			tree_downref( prg, (Tree*)o1 );
+			tree_downref( prg, (Tree*)o2 );
+			break;
+		}
+		case IN_SUB_INT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SUB_INT" << endl;
+			#endif
+
+			Int *o2 = (Int*)pop();
+			Int *o1 = (Int*)pop();
+			long r = o1->value - o2->value;
+			Tree *tree = construct_integer( prg, r );
+			tree_upref( tree );
+			push( tree );
+			tree_downref( prg, (Tree*)o1 );
+			tree_downref( prg, (Tree*)o2 );
+			break;
+		}
+		case IN_DUP_TOP: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_DUP_TOP" << endl;
+			#endif
+
+			Tree *val = top();
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_TRITER_FROM_REF: {
+			short field;
+			Half searchTypeId;
+			read_half( field );
+			read_half( searchTypeId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_FROM_REF " << field << " " << searchTypeId << endl;
+			#endif
+
+			Ref rootRef;
+			rootRef.kid = (Kid*)pop();
+			rootRef.next = (Ref*)pop();
+			void *mem = plocal(field);
+			new(mem) TreeIter( rootRef, searchTypeId, ptop() );
+			break;
+		}
+		case IN_TRITER_DESTROY: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_DESTROY " << field << endl;
+			#endif
+
+			TreeIter *iter = (TreeIter*) plocal(field);
+			tree_iter_destroy( sp, iter );
+			break;
+		}
+		case IN_TREE_SEARCH: {
+			Word id;
+			read_word( id );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TREE_SEARCH " << id << endl;
+			#endif
+
+			Tree *tree = pop();
+			Tree *res = tree_search( tree, id );
+			tree_upref( res );
+			push( res );
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_TRITER_ADVANCE: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_ADVANCE " << field << endl;
+			#endif
+
+			TreeIter *iter = (TreeIter*) plocal(field);
+			Tree *res = tree_iter_advance( prg, sp, iter );
+			tree_upref( res );
+			push( res );
+			break;
+		}
+		case IN_TRITER_NEXT_CHILD: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_NEXT_CHILD " << field << endl;
+			#endif
+
+			TreeIter *iter = (TreeIter*) plocal(field);
+			Tree *res = tree_iter_next_child( prg, sp, iter );
+			tree_upref( res );
+			push( res );
+			break;
+		}
+		case IN_TRITER_PREV_CHILD: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_PREV_CHILD " << field << endl;
+			#endif
+
+			TreeIter *iter = (TreeIter*) plocal(field);
+			Tree *res = tree_iter_prev_child( prg, sp, iter );
+			tree_upref( res );
+			push( res );
+			break;
+		}
+		case IN_TRITER_GET_CUR_R: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_GET_CUR_R " << field << endl;
+			#endif
+			
+			TreeIter *iter = (TreeIter*) plocal(field);
+			Tree *tree = tree_iter_deref_cur( iter );
+			tree_upref( tree );
+			push( tree );
+			break;
+		}
+		case IN_TRITER_GET_CUR_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_GET_CUR_WC " << field << endl;
+			#endif
+			
+			TreeIter *iter = (TreeIter*) plocal(field);
+			split_iter_cur( sp, prg, iter );
+			Tree *tree = tree_iter_deref_cur( iter );
+			tree_upref( tree );
+			push( tree );
+			break;
+		}
+		case IN_TRITER_SET_CUR_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_SET_CUR_WC " << field << endl;
+			#endif
+
+			Tree *tree = pop();
+			TreeIter *iter = (TreeIter*) plocal(field);
+			split_iter_cur( sp, prg, iter );
+			Tree *old = tree_iter_deref_cur( iter );
+			set_triter_cur( iter, tree );
+			tree_downref( prg, old );
+			break;
+		}
+		case IN_MATCH: {
+			Half patternId;
+			read_half( patternId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MATCH " << patternId << endl;
+			#endif
+
+			Tree *tree = pop();
+
+			/* Run the match, push the result. */
+			int rootNode = prg->rtd->patReplInfo[patternId].offset;
+
+			/* Bindings are indexed starting at 1. A bindId of zero represents
+			 * no binding. We reserve a slot for it here rather than adjusting
+			 * the index on every access. */
+			long numBindings = prg->rtd->patReplInfo[patternId].numBindings;
+			Tree *bindings[1+numBindings];
+			memset( bindings, 0, sizeof(Tree*)*(1+numBindings) );
+
+			Kid kid;
+			kid.tree = tree;
+			kid.next = 0;
+			bool matched = match_pattern( bindings, prg, rootNode, &kid, false );
+
+			if ( !matched )
+				memset( bindings, 0, sizeof(Tree*)*(1+numBindings) );
+			else {
+				for ( int b = 1; b <= numBindings; b++ )
+					assert( bindings[b] != 0 );
+			}
+
+			#ifdef COLM_LOG_MATCH
+			cerr << "match result: " << matched << endl;
+			#endif
+
+			Tree *result = matched ? tree : 0;
+			tree_upref( result );
+			push( result ? tree : 0 );
+			for ( int b = 1; b <= numBindings; b++ ) {
+				tree_upref( bindings[b] );
+				push( bindings[b] );
+			}
+
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_PARSE: {
+			Half parserId, stopId;
+			read_half( parserId );
+			read_half( stopId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PARSE " << parserId << " " << stopId << endl;
+			#endif
+
+			/* Comes back from parse upreffed. */
+			CodeVect *cv;
+			Tree *stream = pop();
+			Tree *res = parse( sp, prg, (Stream*)stream, parserId, stopId, cv );
+			push( res );
+
+			/* Single unit. */
+			tree_upref( res );
+			reverseCode.append( IN_PARSE_BKT );
+			reverseCode.appendHalf( parserId );
+			reverseCode.appendWord( (Word) stream );
+			reverseCode.appendWord( (Word) res );
+			reverseCode.appendWord( (Word) cv );
+			reverseCode.append( 15 );
+			break;
+		}
+		case IN_STREAM_PULL: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STREAM_PULL" << endl;
+			#endif
+			Tree *len = pop();
+			Tree *stream = pop();
+			Tree *string = stream_pull( prg, (Stream*)stream, len );
+			tree_upref( string );
+			push( string );
+
+			/* Single unit. */
+			tree_upref( string );
+			reverseCode.append( IN_STREAM_PULL_BKT );
+			reverseCode.appendWord( (Word) stream );
+			reverseCode.appendWord( (Word) string );
+			reverseCode.append( 9 );
+
+			tree_downref( prg, len );
+			break;
+		}
+		case IN_STREAM_PULL_BKT: {
+			Tree *stream, *string;
+			read_tree( stream );
+			read_tree( string );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STREAM_PULL_BKT" << endl;
+			#endif
+
+			undo_pull( prg, (Stream*)stream, string );
+			tree_downref( prg, stream );
+			tree_downref( prg, string );
+			break;
+		}
+		case IN_STREAM_PUSH: {
+			/* FIXME: Need to check the refcounting here. */
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STREAM_PUSH" << endl;
+			#endif
+			Tree *tree = pop();
+			Tree *stream = pop();
+			Word len = stream_push( sp, prg, 
+					(Stream*)stream, tree );
+			push( 0 );
+
+			/* Single unit. */
+			reverseCode.append( IN_STREAM_PUSH_BKT );
+			reverseCode.appendWord( (Word)stream );
+			reverseCode.appendWord( len );
+			reverseCode.append( 9 );
+
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_STREAM_PUSH_BKT: {
+			Tree *stream;
+			Word len;
+			read_tree( stream );
+			read_word( len );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STREAM_PUSH_BKT" << endl;
+			#endif
+
+			undo_stream_push( sp, prg, (Stream*)stream, len );
+			break;
+		}
+		case IN_PARSE_BKT: {
+			Half parserId;
+			Tree *stream, *tree;
+			Word wrev;
+			read_half( parserId );
+			read_tree( stream );
+			read_tree( tree );
+			read_word( wrev );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PARSE_BKT " << parserId << endl;
+			#endif
+
+			undo_parse( sp, prg, (Stream*)stream, parserId, tree, (CodeVect*)wrev );
+			tree_downref( prg, stream );
+			break;
+		}
+		case IN_CONSTRUCT: {
+			Half patternId;
+			read_half( patternId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_CONSTRUCT " << patternId << endl;
+			#endif
+
+			int rootNode = prg->rtd->patReplInfo[patternId].offset;
+
+			/* Note that bindIds are indexed at one. Add one spot for them. */
+			int numBindings = prg->rtd->patReplInfo[patternId].numBindings;
+			Tree *bindings[1+numBindings];
+
+			for ( int b = 1; b <= numBindings; b++ ) {
+				bindings[b] = pop();
+				assert( bindings[b] != 0 );
+			}
+
+			Tree *replTree = 0;
+			PatReplNode *nodes = prg->rtd->patReplNodes;
+			LangElInfo *lelInfo = prg->rtd->lelInfo;
+			long genericId = lelInfo[nodes[rootNode].id].genericId;
+			if ( genericId > 0 ) {
+				replTree = create_generic( prg, genericId );
+				tree_upref( replTree );
+			}
+			else {
+				replTree = construct_replacement_tree( bindings, 
+						prg, rootNode );
+			}
+
+			push( replTree );
+			break;
+		}
+		case IN_CONSTRUCT_TERM: {
+			Half tokenId;
+			read_half( tokenId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_CONSTRUCT_TERM " << tokenId << endl;
+			#endif
+
+			/* Pop the string we are constructing the token from. */
+			Str *str = (Str*)pop();
+			Tree *res = construct_term( prg, tokenId, str->value );
+			tree_upref( res );
+			push( res );
+			break;
+		}
+		case IN_MAKE_TOKEN: {
+			uchar nargs;
+			read_byte( nargs );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAKE_TOKEN " << (ulong) nargs << endl;
+			#endif
+
+			Tree *result = make_token( sp, prg, parser, nargs );
+			for ( long i = 0; i < nargs; i++ )
+				tree_downref( prg, pop() );
+			push( result );
+			break;
+		}
+		case IN_MAKE_TREE: {
+			uchar nargs;
+			read_byte( nargs );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAKE_TREE " << (ulong) nargs << endl;
+			#endif
+
+			Tree *result = make_tree( sp, prg, parser, nargs );
+			for ( long i = 0; i < nargs; i++ )
+				tree_downref( prg, pop() );
+			push( result );
+			break;
+		}
+		case IN_SEND: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SEND" << endl;
+			#endif
+
+			Tree *tree = pop();
+			send( sp, prg, parser, tree, false );
+			push( 0 );
+			break;
+		}
+		case IN_IGNORE: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_IGNORE" << endl;
+			#endif
+
+			Tree *tree = pop();
+			send( sp, prg, parser, tree, true );
+			push( 0 );
+			break;
+		}
+		case IN_TREE_NEW: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TREE_NEW " << endl;
+			#endif
+
+			Tree *tree = pop();
+			Tree *res = construct_pointer( prg, tree );
+			tree_upref( res );
+			push( res );
+			break;
+		}
+		case IN_PTR_DEREF_R: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PTR_DEREF_R" << endl;
+			#endif
+
+			Pointer *ptr = (Pointer*)pop();
+			tree_downref( prg, (Tree*)ptr );
+
+			Tree *dval = get_ptr_val( ptr );
+			tree_upref( dval );
+			push( dval );
+			break;
+		}
+		case IN_PTR_DEREF_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PTR_DEREF_WC" << endl;
+			#endif
+
+			Pointer *ptr = (Pointer*)pop();
+			tree_downref( prg, (Tree*)ptr );
+
+			Tree *dval = get_ptr_val_split( prg, ptr );
+			tree_upref( dval );
+			push( dval );
+			break;
+		}
+		case IN_PTR_DEREF_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PTR_DEREF_WV" << endl;
+			#endif
+
+			Pointer *ptr = (Pointer*)pop();
+			/* Don't downref the pointer since it is going into the reverse
+			 * instruction. */
+
+			Tree *dval = get_ptr_val_split( prg, ptr );
+			tree_upref( dval );
+			push( dval );
+
+			/* This is an initial global load. Need to reverse execute it. */
+			reverseCode.append( IN_PTR_DEREF_BKT );
+			reverseCode.appendWord( (Word) ptr );
+			rcodeUnitLen = 5;
+			break;
+		}
+		case IN_PTR_DEREF_BKT: {
+			Word p;
+			read_word( p );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PTR_DEREF_BKT" << endl;
+			#endif
+
+			Pointer *ptr = (Pointer*)p;
+
+			Tree *dval = get_ptr_val_split( prg, ptr );
+			tree_upref( dval );
+			push( dval );
+
+			tree_downref( prg, (Tree*)ptr );
+			break;
+		}
+		case IN_REF_FROM_LOCAL: {
+			short int field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_REF_FROM_LOCAL " << field << endl;
+			#endif
+
+			/* First push the null next pointer, then the kid pointer. */
+			Tree **ptr = plocal(field);
+			push( 0 );
+			push( (SW)ptr );
+			break;
+		}
+		case IN_REF_FROM_REF: {
+			short int field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_REF_FROM_REF " << field << endl;
+			#endif
+
+			Ref *ref = (Ref*)plocal(field);
+			push( (SW)ref );
+			push( (SW)ref->kid );
+			break;
+		}
+		case IN_TRITER_REF_FROM_CUR: {
+			short int field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_TRITER_REF_FROM_CUR " << field << endl;
+			#endif
+
+			/* Push the next pointer first, then the kid. */
+			TreeIter *iter = (TreeIter*) plocal(field);
+			push( (SW)&iter->ref );
+			push( (SW)iter->ref.kid );
+			break;
+		}
+		case IN_UITER_REF_FROM_CUR: {
+			short int field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_REF_FROM_CUR " << field << endl;
+			#endif
+
+			/* Push the next pointer first, then the kid. */
+			UserIter *uiter = (UserIter*) local(field);
+			push( (SW)uiter->ref.next );
+			push( (SW)uiter->ref.kid );
+			break;
+		}
+		case IN_GET_TOKEN_DATA_R: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_TOKEN_DATA_R" << endl;
+			#endif
+
+			Tree *tree = (Tree*) pop();
+			Head *data = string_copy( prg, tree->tokdata );
+			Tree *str = construct_string( prg, data );
+			tree_upref( str );
+			push( str );
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_SET_TOKEN_DATA_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_TOKEN_DATA_WC" << endl;
+			#endif
+
+			Tree *tree = pop();
+			Tree *val = pop();
+			Head *head = string_copy( prg, ((Str*)val)->value );
+			string_free( prg, tree->tokdata );
+			tree->tokdata = head;
+
+			tree_downref( prg, tree );
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_SET_TOKEN_DATA_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_TOKEN_DATA_WV" << endl;
+			#endif
+
+			Tree *tree = pop();
+			Tree *val = pop();
+
+			Head *oldval = tree->tokdata;
+			Head *head = string_copy( prg, ((Str*)val)->value );
+			tree->tokdata = head;
+
+			/* Set up reverse code. Needs no args. */
+			reverseCode.append( IN_SET_TOKEN_DATA_BKT );
+			reverseCode.appendWord( (Word)oldval );
+			rcodeUnitLen += 5;
+			reverseCode.append( rcodeUnitLen );
+
+			tree_downref( prg, tree );
+			tree_downref( prg, val );
+			break;
+		}
+		case IN_SET_TOKEN_DATA_BKT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_TOKEN_DATA_BKT " << endl;
+			#endif
+
+			Word oldval;
+			read_word( oldval );
+
+			Tree *tree = pop();
+			Head *head = (Head*)oldval;
+			string_free( prg, tree->tokdata );
+			tree->tokdata = head;
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_GET_TOKEN_POS_R: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_TOKEN_POS_R" << endl;
+			#endif
+
+			Tree *tree = (Tree*) pop();
+			Tree *integer = construct_integer( prg, 0 );
+			tree_upref( integer );
+			push( integer );
+			tree_downref( prg, tree );
+
+			/* Requires a new implementation. */
+			assert( false );
+			break;
+		}
+		case IN_GET_MATCH_LENGTH_R: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_MATCH_LENGTH_R" << endl;
+			#endif
+			Tree *integer = construct_integer( prg, string_length(matchText) );
+			tree_upref( integer );
+			push( integer );
+			break;
+		}
+		case IN_GET_MATCH_TEXT_R: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_MATCH_TEXT_R" << endl;
+			#endif
+			Head *s = string_copy( prg, matchText );
+			Tree *tree = construct_string( prg, s );
+			tree_upref( tree );
+			push( tree );
+			break;
+		}
+		case IN_LIST_LENGTH: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_LENGTH" << endl;
+			#endif
+
+			List *list = (List*) pop();
+			Tree *res = construct_integer( prg, list_length( list ) );
+			tree_upref( res );
+			push( res );
+			tree_downref( prg, (Tree*)list ); /* Release the popped operand, as IN_MAP_LENGTH and IN_STR_LENGTH do. */
+			break;
+		}
+		case IN_LIST_APPEND_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_APPEND_WV" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *val = pop();
+
+			tree_downref( prg, obj );
+
+			list_append( prg, (List*)obj, val );
+			tree_upref( prg->trueVal );
+			push( prg->trueVal );
+
+			/* Set up reverse code. Needs no args. */
+			reverseCode.append( IN_LIST_APPEND_BKT );
+			rcodeUnitLen += 1;
+			reverseCode.append( rcodeUnitLen );
+			/* FLUSH */
+			break;
+		}
+		case IN_LIST_APPEND_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_APPEND_WC" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *val = pop();
+
+			tree_downref( prg, obj );
+
+			list_append( prg, (List*)obj, val );
+			tree_upref( prg->trueVal );
+			push( prg->trueVal );
+			break;
+		}
+		case IN_LIST_APPEND_BKT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_APPEND_BKT" << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *tree = list_remove_end( prg, (List*)obj );
+			tree_downref( prg, tree );
+			break;
+		}
+		case IN_LIST_REMOVE_END_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_REMOVE_END_WC" << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *end = list_remove_end( prg, (List*)obj );
+			push( end );
+			break;
+		}
+		case IN_LIST_REMOVE_END_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_REMOVE_END_WV" << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *end = list_remove_end( prg, (List*)obj );
+			push( end );
+
+			/* Set up reverse. The result comes off the list downrefed.
+			 * Need it up referenced for the reverse code too. */
+			tree_upref( end );
+			reverseCode.append( IN_LIST_REMOVE_END_BKT );
+			reverseCode.appendWord( (Word)end );
+			rcodeUnitLen += 5;
+			reverseCode.append( rcodeUnitLen );
+			/* FLUSH */
+			break;
+		}
+		case IN_LIST_REMOVE_END_BKT: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LIST_REMOVE_END_BKT" << endl;
+			#endif
+
+			Tree *val;
+			read_tree( val );
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			list_append( prg, (List*)obj, val );
+			break;
+		}
+		case IN_GET_LIST_MEM_R: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LIST_MEM_R " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *val = get_list_mem( list(obj), field );
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_GET_LIST_MEM_WC: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LIST_MEM_WC " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *val = get_list_mem_split( prg, list(obj), field );
+			tree_upref( val );
+			push( val );
+			break;
+		}
+		case IN_GET_LIST_MEM_WV: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LIST_MEM_WV " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *val = get_list_mem_split( prg, list(obj), field );
+			tree_upref( val );
+			push( val );
+
+			/* Set up the reverse instruction. */
+			reverseCode.append( IN_GET_LIST_MEM_BKT );
+			reverseCode.appendHalf( field );
+			rcodeUnitLen += 3;
+			break;
+		}
+		case IN_GET_LIST_MEM_BKT: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_LIST_MEM_BKT " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *res = get_list_mem_split( prg, list(obj), field );
+			tree_upref( res );
+			push( res );
+			break;
+		}
+		case IN_SET_LIST_MEM_WC: {
+			Half field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_LIST_MEM_WC " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *val = pop();
+			Tree *existing = set_list_mem( list(obj), field, val );
+			tree_downref( prg, existing );
+			break;
+		}
+		case IN_SET_LIST_MEM_WV: {
+			Half field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_LIST_MEM_WV " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *val = pop();
+			Tree *existing = set_list_mem( list(obj), field, val );
+
+			/* Set up the reverse instruction. */
+			reverseCode.append( IN_SET_LIST_MEM_BKT );
+			reverseCode.appendHalf( field );
+			reverseCode.appendWord( (Word)existing );
+			rcodeUnitLen += 7;
+			reverseCode.append( rcodeUnitLen );
+			/* FLUSH */
+			break;
+		}
+		case IN_SET_LIST_MEM_BKT: {
+			Half field;
+			Tree *val;
+			read_half( field );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SET_LIST_MEM_BKT " << field << endl;
+			#endif
+
+			Tree *obj = pop();
+			tree_downref( prg, obj );
+
+			Tree *undid = set_list_mem( list(obj), field, val );
+			tree_downref( prg, undid );
+			break;
+		}
+		case IN_MAP_INSERT_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_INSERT_WV" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *val = pop();
+			Tree *key = pop();
+
+			tree_downref( prg, obj );
+
+			bool inserted = map_insert( prg, (Map*)obj, key, val );
+			Tree *result = inserted ? prg->trueVal : prg->falseVal;
+			tree_upref( result );
+			push( result );
+
+			/* Set up the reverse instruction. If the insert fails still need
+			 * to pop the loaded map object. Just use the reverse instruction
+			 * since it's nice to see it in the logs. */
+
+			/* Need to upref key for storage in reverse code. */
+			tree_upref( key );
+			reverseCode.append( IN_MAP_INSERT_BKT );
+			reverseCode.append( inserted );
+			reverseCode.appendWord( (Word)key );
+			rcodeUnitLen += 6;
+			reverseCode.append( rcodeUnitLen );
+
+			if ( ! inserted ) {
+				tree_downref( prg, key );
+				tree_downref( prg, val );
+			}
+			break;
+		}
+		case IN_MAP_INSERT_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_INSERT_WC" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *val = pop();
+			Tree *key = pop();
+
+			tree_downref( prg, obj );
+
+			bool inserted = map_insert( prg, (Map*)obj, key, val );
+			Tree *result = inserted ? prg->trueVal : prg->falseVal;
+			tree_upref( result );
+			push( result );
+
+			if ( ! inserted ) {
+				tree_downref( prg, key );
+				tree_downref( prg, val );
+			}
+			break;
+		}
+		case IN_MAP_INSERT_BKT: {
+			uchar inserted;
+			Tree *key;
+			read_byte( inserted );
+			read_tree( key );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_INSERT_BKT" << endl;
+			#endif
+			
+			Tree *obj = pop();
+			if ( inserted ) {
+				Tree *val = map_uninsert( prg, (Map*)obj, key );
+				tree_downref( prg, key );
+				tree_downref( prg, val );
+			}
+
+			tree_downref( prg, obj );
+			tree_downref( prg, key );
+			break;
+		}
+		case IN_MAP_STORE_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_STORE_WC" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *element = pop();
+			Tree *key = pop();
+
+			Tree *existing = map_store( prg, (Map*)obj, key, element );
+			Tree *result = existing == 0 ? prg->trueVal : prg->falseVal;
+			tree_upref( result );
+			push( result );
+
+			tree_downref( prg, obj );
+			if ( existing != 0 ) {
+				tree_downref( prg, key );
+				tree_downref( prg, existing );
+			}
+			break;
+		}
+		case IN_MAP_STORE_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_STORE_WV" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *element = pop();
+			Tree *key = pop();
+
+			Tree *existing = map_store( prg, (Map*)obj, key, element );
+			Tree *result = existing == 0 ? prg->trueVal : prg->falseVal;
+			tree_upref( result );
+			push( result );
+
+			/* Set up the reverse instruction. */
+			tree_upref( key );
+			tree_upref( existing );
+			reverseCode.append( IN_MAP_STORE_BKT );
+			reverseCode.appendWord( (Word)key );
+			reverseCode.appendWord( (Word)existing );
+			rcodeUnitLen += 9;
+			reverseCode.append( rcodeUnitLen );
+			/* FLUSH */
+
+			tree_downref( prg, obj );
+			if ( existing != 0 ) {
+				tree_downref( prg, key );
+				tree_downref( prg, existing );
+			}
+			break;
+		}
+		case IN_MAP_STORE_BKT: {
+			Tree *key, *val;
+			read_tree( key );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_STORE_BKT" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *stored = map_unstore( prg, (Map*)obj, key, val );
+
+			tree_downref( prg, stored );
+			if ( val == 0 )
+				tree_downref( prg, key );
+
+			tree_downref( prg, obj );
+			tree_downref( prg, key );
+			break;
+		}
+		case IN_MAP_REMOVE_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_REMOVE_WC" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *key = pop();
+			TreePair pair = map_remove( prg, (Map*)obj, key );
+
+			push( pair.val );
+
+			tree_downref( prg, obj );
+			tree_downref( prg, key );
+			tree_downref( prg, pair.key );
+			break;
+		}
+		case IN_MAP_REMOVE_WV: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_REMOVE_WV" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *key = pop();
+			TreePair pair = map_remove( prg, (Map*)obj, key );
+
+			tree_upref( pair.val );
+			push( pair.val );
+
+			/* Reverse instruction. */
+			reverseCode.append( IN_MAP_REMOVE_BKT );
+			reverseCode.appendWord( (Word)pair.key );
+			reverseCode.appendWord( (Word)pair.val );
+			rcodeUnitLen += 9;
+			reverseCode.append( rcodeUnitLen );
+
+			tree_downref( prg, obj );
+			tree_downref( prg, key );
+			break;
+		}
+		case IN_MAP_REMOVE_BKT: {
+			Tree *key, *val;
+			read_tree( key );
+			read_tree( val );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_REMOVE_BKT" << endl;
+			#endif
+
+			/* Either both or neither. */
+			assert( ( key == 0 ) xor ( val != 0 ) );
+
+			Tree *obj = pop();
+			if ( key != 0 )
+				map_unremove( prg, (Map*)obj, key, val );
+
+			tree_downref( prg, obj );
+			break;
+		}
+		case IN_MAP_LENGTH: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_LENGTH" << endl;
+			#endif
+
+			Tree *obj = pop();
+			long len = map_length( (Map*)obj );
+			Tree *res = construct_integer( prg, len );
+			tree_upref( res );
+			push( res );
+
+			tree_downref( prg, obj );
+			break;
+		}
+		case IN_MAP_FIND: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_MAP_FIND" << endl;
+			#endif
+
+			Tree *obj = pop();
+			Tree *key = pop();
+			Tree *result = map_find( (Map*)obj, key );
+			tree_upref( result );
+			push( result );
+
+			tree_downref( prg, obj );
+			tree_downref( prg, key );
+			break;
+		}
+		case IN_INIT_LOCALS: {
+			Half size;
+			read_half( size );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_INIT_LOCALS " << size << endl;
+			#endif
+
+			frame = ptop();
+			pushn( size );
+			memset( ptop(), 0, sizeof(Word) * size );
+			break;
+		}
+		case IN_POP_LOCALS: {
+			Half frameId, size;
+			read_half( frameId );
+			read_half( size );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_POP_LOCALS " << frameId << " " << size << endl;
+			#endif
+
+			FrameInfo *fi = &prg->rtd->frameInfo[frameId];
+			downref_local_trees( prg, frame, fi->trees, fi->treesLen );
+			popn( size );
+			break;
+		}
+		case IN_CALL: {
+			Half funcId;
+			read_half( funcId );
+
+			FunctionInfo *fi = &prg->rtd->functionInfo[funcId];
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_CALL " << fi->name << endl;
+			#endif
+
+			push( 0 ); /* Return value. */
+			push( (SW)instr );
+			push( (SW)frame );
+
+			instr = prg->rtd->frameInfo[fi->frameId].code;
+			frame = ptop();
+			break;
+		}
+		case IN_YIELD: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_YIELD" << endl;
+			#endif
+
+			Kid *kid = (Kid*)pop();
+			Ref *next = (Ref*)pop();
+			UserIter *uiter = (UserIter*) plocal_iframe( IFR_AA );
+
+			if ( kid == 0 || kid->tree == 0 ||
+					kid->tree->id == uiter->searchId || 
+					uiter->searchId == prg->rtd->anyId )
+			{
+				/* Store the yielded value. */
+				uiter->ref.kid = kid;
+				uiter->ref.next = next;
+				uiter->stackSize = uiter->stackRoot - ptop();
+				uiter->resume = instr;
+				uiter->frame = frame;
+
+				/* Restore the instruction and frame pointer. */
+				instr = (Code*) local_iframe(IFR_RIN);
+				frame = (Tree**) local_iframe(IFR_RFR);
+				iframe = (Tree**) local_iframe(IFR_RIF);
+
+				/* Return the yield result on the top of the stack. */
+				Tree *result = uiter->ref.kid != 0 ? prg->trueVal : prg->falseVal;
+				tree_upref( result );
+				push( result );
+			}
+			break;
+		}
+		case IN_UITER_CREATE: {
+			short field;
+			Half funcId, searchId;
+			read_half( field );
+			read_half( funcId );
+			read_half( searchId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_CREATE " << field << " " << 
+					funcId << " " << searchId << endl;
+			#endif
+
+			FunctionInfo *fi = prg->rtd->functionInfo + funcId;
+			UserIter *uiter = uiter_create( sp, prg, fi, searchId );
+			local(field) = (SW) uiter;
+
+			/* This setup is similar to a call, only the frame structure
+			 * is slightly different for user iterators. We aren't going to do
+			 * the call. We don't need to set up the return ip because the
+			 * uiter advance will set it. The frame we do need to set up
+			 * because it is set once for the lifetime of the iterator. */
+			push( 0 );            /* Return instruction pointer,  */
+			push( (SW)iframe ); /* Return iframe. */
+			push( (SW)frame );  /* Return frame. */
+
+			/* Now set up the first yield. */
+			uiter->ref.kid = 0;
+			uiter->stackSize = uiter->stackRoot - ptop();
+			uiter->resume = prg->rtd->frameInfo[fi->frameId].code;
+			uiter->frame = &uiter->stackRoot[-IFR_AA];
+
+			upref_uiter_args( frame, fi->argSize );
+			break;
+		}
+		case IN_UITER_DESTROY: {
+			short field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_DESTROY " << field << endl;
+			#endif
+
+			UserIter *uiter = (UserIter*) local(field);
+			user_iter_destroy( sp, uiter );
+			break;
+		}
+		case IN_RET: {
+			Half funcId;
+			read_half( funcId );
+
+			FunctionInfo *fui = &prg->rtd->functionInfo[funcId];
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_RET " << fui->name << endl;
+			#endif
+
+			FrameInfo *fi = &prg->rtd->frameInfo[fui->frameId];
+			downref_local_trees( prg, frame, fi->trees, fi->treesLen );
+
+			popn( fui->frameSize );
+			frame = (Tree**) pop();
+			instr = (Code*) pop();
+			Tree *retVal = pop();
+			popn( fui->argSize );
+			push( retVal );
+			break;
+		}
+		case IN_OPEN_FILE: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_OPEN_FILE" << endl;
+			#endif
+
+			Tree *name = pop();
+			Tree *res = open_file( prg, name );
+			tree_upref( res );
+			push( res );
+			tree_downref( prg, name );
+			break;
+		}
+		case IN_GET_STDIN: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_GET_STDIN" << endl;
+			#endif
+
+			/* Pop the root object. */
+			tree_downref( prg, pop() );
+			if ( prg->stdinVal == 0 ) {
+				prg->stdinVal = open_stream_fd( prg, 0 );
+				tree_upref( (Tree*)prg->stdinVal );
+			}
+
+			tree_upref( (Tree*)prg->stdinVal );
+			push( (Tree*)prg->stdinVal );
+			break;
+		}
+		case IN_STOP: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_STOP" << endl;
+			#endif
+
+			cout.flush();
+			return;
+		}
+
+		/* Halt is a default instruction given by the compiler when it is
+		 * asked to generate an instruction it doesn't have. It is deliberate
+		 * and can represent "not implemented" or "compiler error" because a
+		 * variable holding instructions was not properly initialized. */
+		case IN_HALT: {
+			cerr << "IN_HALT -- compiler did something wrong" << endl;
+			exit(1);
+			break;
+		}
+		default: {
+			cerr << "UNKNOWN INSTRUCTION: " << (ulong)instr[-1] << 
+					" -- something is wrong" << endl;
+			exit(1);
+			break;
+		}
+	}
+	goto again;
+}
diff --git a/colm/bytecode.h b/colm/bytecode.h
new file mode 100644
index 00000000..0bdcab99
--- /dev/null
+++ b/colm/bytecode.h
@@ -0,0 +1,615 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _BYTECODE_H
+#define _BYTECODE_H
+
+#include "vector.h"
+#include "resize.h"
+#include "dlist.h"
+#include "config.h"
+#include "avlmap.h"
+
+#include <iostream>
+
+using std::cerr;
+using std::endl;
+using std::ostream;
+
+typedef unsigned long ulong;
+typedef unsigned char uchar;
+
+#define read_word_p( i, p ) do { /* load 4 bytes from p into i, low byte first; p is evaluated four times */ \
+	(i) = ((Word)  (p)[0]); \
+	(i) |= ((Word) (p)[1]) << 8; \
+	(i) |= ((Word) (p)[2]) << 16; \
+	(i) |= ((Word) (p)[3]) << 24; \
+} while(0)
+
+#define IN_LOAD_INT              0x01
+#define IN_LOAD_STR              0x02
+#define IN_LOAD_NIL              0x03
+#define IN_LOAD_TRUE             0xa3
+#define IN_LOAD_FALSE            0xa4
+
+#define IN_ADD_INT               0x04
+#define IN_SUB_INT               0x06
+#define IN_MULT_INT              0x05
+
+#define IN_TST_EQL               0xa0
+#define IN_TST_NOT_EQL           0xa1
+#define IN_TST_LESS              0x0e
+#define IN_TST_GRTR              0x10
+#define IN_TST_LESS_EQL          0x0f
+#define IN_TST_GRTR_EQL          0x11
+#define IN_TST_LOGICAL_AND       0x12
+#define IN_TST_LOGICAL_OR        0x13
+
+#define IN_NOT                   0x16
+
+#define IN_JMP                   0x0c
+#define IN_JMP_FALSE             0x0b
+#define IN_JMP_TRUE              0x0d
+
+#define IN_STR_ATOI              0x14
+#define IN_STR_LENGTH            0x15
+#define IN_CONCAT_STR            0x17
+
+#define IN_INIT_LOCALS           0x18
+#define IN_POP_LOCALS            0xb0
+#define IN_POP                   0x19
+#define IN_DUP_TOP               0x1a
+#define IN_REJECT                0x1b
+#define IN_MATCH                 0x1c
+#define IN_CONSTRUCT             0x1d
+#define IN_TREE_NEW              0x1f
+
+#define IN_GET_LOCAL_R           0x20
+#define IN_GET_LOCAL_WC          0x21
+#define IN_SET_LOCAL_WC          0x22
+
+#define IN_GET_LOCAL_REF_R       0x23
+#define IN_GET_LOCAL_REF_WC      0x24
+#define IN_SET_LOCAL_REF_WC      0x25
+
+#define IN_SAVE_RET              0x26
+
+#define IN_GET_FIELD_R           0x27
+#define IN_GET_FIELD_WC          0x28
+#define IN_GET_FIELD_WV          0x29
+#define IN_GET_FIELD_BKT         0x2a
+
+#define IN_SET_FIELD_WV          0x2b
+#define IN_SET_FIELD_WC          0x2c
+#define IN_SET_FIELD_BKT         0x2d
+#define IN_SET_FIELD_LEAVE_WC    0x2e
+
+#define IN_GET_MATCH_LENGTH_R    0x2f
+#define IN_GET_MATCH_TEXT_R      0x30
+
+#define IN_GET_TOKEN_DATA_R      0x31
+#define IN_SET_TOKEN_DATA_WC     0x32
+#define IN_SET_TOKEN_DATA_WV     0x33
+#define IN_SET_TOKEN_DATA_BKT    0x34
+
+#define IN_GET_TOKEN_POS_R       0x35
+
+#define IN_INIT_RHS_EL           0x3b
+
+#define IN_TRITER_FROM_REF       0x3c
+#define IN_TRITER_ADVANCE        0x3d
+#define IN_TRITER_NEXT_CHILD     0x98
+#define IN_TRITER_PREV_CHILD     0x9b
+#define IN_TRITER_GET_CUR_R      0x3e
+#define IN_TRITER_GET_CUR_WC     0x3f
+#define IN_TRITER_SET_CUR_WC     0x40
+#define IN_TRITER_DESTROY        0x41
+
+#define IN_UITER_DESTROY         0x52
+#define IN_UITER_CREATE          0x53
+#define IN_UITER_ADVANCE         0x54
+#define IN_UITER_GET_CUR_R       0x55
+#define IN_UITER_GET_CUR_WC      0x56
+#define IN_UITER_SET_CUR_WC      0x57
+
+#define IN_TREE_SEARCH           0x58
+
+#define IN_LOAD_GLOBAL_R         0x59
+#define IN_LOAD_GLOBAL_WV        0x5a
+#define IN_LOAD_GLOBAL_BKT       0x5b
+
+#define IN_PTR_DEREF_R           0x5e
+#define IN_PTR_DEREF_WV          0x5f
+#define IN_PTR_DEREF_WC          0x60
+#define IN_PTR_DEREF_BKT         0x61
+
+#define IN_REF_FROM_LOCAL        0x62
+#define IN_REF_FROM_REF          0x97
+#define IN_TRITER_REF_FROM_CUR   0x63
+#define IN_UITER_REF_FROM_CUR    0x64
+                                
+#define IN_MAP_LENGTH            0x65
+#define IN_MAP_FIND              0x66
+#define IN_MAP_INSERT_WV         0x67
+#define IN_MAP_INSERT_WC         0x68
+#define IN_MAP_INSERT_BKT        0x69
+#define IN_MAP_STORE_WV          0x6a
+#define IN_MAP_STORE_WC          0x6b
+#define IN_MAP_STORE_BKT         0x6c
+#define IN_MAP_REMOVE_WV         0x6d
+#define IN_MAP_REMOVE_WC         0x6e
+#define IN_MAP_REMOVE_BKT        0x6f
+
+#define IN_LIST_LENGTH           0x70
+#define IN_LIST_APPEND_WV        0x71
+#define IN_LIST_APPEND_WC        0x72
+#define IN_LIST_APPEND_BKT       0x73
+#define IN_LIST_REMOVE_END_WV    0x74
+#define IN_LIST_REMOVE_END_WC    0x75
+#define IN_LIST_REMOVE_END_BKT   0x76
+
+#define IN_GET_LIST_MEM_R        0x77
+#define IN_GET_LIST_MEM_WC       0x78
+#define IN_GET_LIST_MEM_WV       0x79
+#define IN_GET_LIST_MEM_BKT      0x7a
+#define IN_SET_LIST_MEM_WV       0x7b
+#define IN_SET_LIST_MEM_WC       0x7c
+#define IN_SET_LIST_MEM_BKT      0x7d
+
+#define IN_VECTOR_LENGTH         0x7e
+#define IN_VECTOR_APPEND_WV      0x7f
+#define IN_VECTOR_APPEND_WC      0x80
+#define IN_VECTOR_APPEND_BKT     0x81
+#define IN_VECTOR_INSERT_WV      0x82
+#define IN_VECTOR_INSERT_WC      0x83
+#define IN_VECTOR_INSERT_BKT     0x84
+
+#define IN_PRINT                 0x87
+#define IN_PRINT_XML             0x88
+
+#define IN_HALT                  0x8a
+
+#define IN_CALL                  0x8b
+#define IN_RET                   0x8c
+#define IN_YIELD                 0x8d
+#define IN_STOP                  0x8e
+
+#define IN_STR_UORD8             0x8f
+#define IN_STR_SORD8             0x90
+#define IN_STR_UORD16            0x91
+#define IN_STR_SORD16            0x92
+#define IN_STR_UORD32            0x93
+#define IN_STR_SORD32            0x94
+
+#define IN_INT_TO_STR            0x99
+
+#define IN_CREATE_TOKEN          0x95
+#define IN_MAKE_TOKEN            0x96
+#define IN_MAKE_TREE             0xb2
+#define IN_CONSTRUCT_TERM        0x9a
+#define IN_PARSE                 0xb1
+#define IN_PARSE_BKT             0xb3
+#define IN_STREAM_PULL           0xb4
+#define IN_STREAM_PULL_BKT       0xb5
+#define IN_STREAM_PUSH           0xbc
+#define IN_STREAM_PUSH_BKT       0xbd
+#define IN_SEND                  0xb6
+#define IN_IGNORE                0xb7
+
+#define IN_OPEN_FILE             0xb8
+#define IN_GET_STDIN             0xb9
+#define IN_GET_STDOUT            0xba
+#define IN_GET_STDERR            0xbb
+
+
+/* Types */
+#define TYPE_NIL      0x01
+#define TYPE_TREE     0x02
+#define TYPE_REF      0x03
+#define TYPE_PTR      0x04
+#define TYPE_ITER     0x05
+
+/* Types of Generics. */
+#define GEN_LIST      0x10
+#define GEN_MAP       0x11
+#define GEN_VECTOR    0x12
+
+/* Allocation, number of items. */
+#define FRESH_BLOCK 8128                    
+
+/* Virtual machine stack size, number of pointers. 
+ * This will be mmapped. */
+#define VM_STACK_SIZE (4*1024ll*1024ll) 
+
+/* Known language element ids. */
+#define LEL_ID_PTR    1
+#define LEL_ID_BOOL   2
+#define LEL_ID_INT    3
+#define LEL_ID_STR    4
+#define LEL_ID_STREAM 5
+
+#define AF_GENERATED   0x1
+#define AF_COMMITTED   0x2
+#define AF_REV_FREED   0x4
+#define AF_ARTIFICIAL  0x8
+#define AF_NAMED       0x10
+#define AF_GROUP_MEM   0x20
+#define AF_IGNORE      0x40
+#define AF_HAS_RCODE   0x80
+
+/*
+ * Call stack.
+ */
+
+/* Number of spots in the frame, after the args. */
+#define FR_AA 3
+
+/* Positions relative to the frame pointer. */
+#define FR_RV 2    /* return value */
+#define FR_RI 1    /* return instruction */
+#define FR_RF 0    /* return frame pointer */
+
+/*
+ * Calling Convention:
+ *   a1
+ *   a2
+ *   a3
+ *   ...
+ *   return value FR_RV
+ *   return instr FR_RI
+ *   return frame FR_RF
+ */
+
+/*
+ * User iterator call stack. 
+ * Adds an iframe pointer, removes the return value.
+ */
+
+/* Number of spots in the frame, after the args. */
+#define IFR_AA  3
+
+/* Positions relative to the frame pointer. */
+#define IFR_RIN 2    /* return instruction */
+#define IFR_RIF 1    /* return iframe pointer */
+#define IFR_RFR 0    /* return frame pointer */
+
+
+struct Kid;
+struct Tree;
+struct Alg;
+struct ListEl;
+struct MapEl;
+struct PdaTables;
+struct RuntimeData;
+struct FsmRun;
+struct PdaRun;
+struct Program;
+struct List;
+struct Map;
+struct Stream;
+
+typedef unsigned char Code;
+typedef unsigned long Word;
+typedef unsigned long Half;
+
+typedef Tree *SW;
+typedef Tree **StackPtr;
+typedef Tree **&StackRef;
+
+Tree **alloc_obj_data( long length );
+
+Kid *alloc_attrs( Program *prg, long length );
+void free_attrs( Program *prg, Kid *attrs );
+void set_attr( Tree *tree, long pos, Tree *val );
+Tree *get_attr( Tree *tree, long pos );
+
+/* Return the size of type T in words, i.e. in units of sizeof(Word). Asserts that sizeof(T) is an exact multiple of sizeof(Word). */
+template<class T> int sizeof_in_words()
+{
+	assert( (sizeof(T) % sizeof(Word)) == 0 );
+	return sizeof(T) / sizeof(Word);
+}
+
+/* 
+ * Code Vector: a Vector<Code> with helpers that store Half and Word values one byte at a time, low byte first.
+ */
+struct CodeVect : public Vector<Code>
+{
+	void appendHalf( Half half )
+	{
+		/* Appends two bytes (bits 0-15), low byte first. Not optimal. */
+		append( half & 0xff );
+		append( (half>>8) & 0xff );
+	}
+	
+	void appendWord( Word word )
+	{
+		/* Appends four bytes (bits 0-31), low byte first. Not optimal. */
+		append( word & 0xff );
+		append( (word>>8) & 0xff );
+		append( (word>>16) & 0xff );
+		append( (word>>24) & 0xff );
+	}
+
+	void setHalf( long pos, Half half )
+	{
+		/* Overwrites the two bytes at pos and pos+1 in place. Not optimal. */
+		data[pos] = half & 0xff;
+		data[pos+1] = (half>>8) & 0xff;
+	}
+	
+	void insertHalf( long pos, Half half )
+	{
+		/* Inserts two bytes starting at pos, low byte first. Not optimal. */
+		insert( pos, half & 0xff );
+		insert( pos+1, (half>>8) & 0xff );
+	}
+
+	void insertWord( long pos, Word word )
+	{
+		/* Inserts four bytes (bits 0-31) starting at pos, low byte first. Not optimal. */
+		insert( pos, word & 0xff );
+		insert( pos+1, (word>>8) & 0xff );
+		insert( pos+2, (word>>16) & 0xff );
+		insert( pos+3, (word>>24) & 0xff );
+	}
+	
+	void insertTree( long pos, Tree *tree )
+		{ insertWord( pos, (Word) tree ); } /* NOTE(review): insertWord stores only the low 32 bits, so a wider pointer would be truncated -- confirm for 64-bit targets */
+};
+
+/*
+ * Strings
+ */
+
+/* Header located just before string data. */
+struct Head
+{
+	const char *data;	/* presumably the string bytes, as returned by string_data() -- confirm */
+	long length;	/* presumably the byte count reported by string_length() -- confirm */
+};
+
+struct Program;
+struct Stream;
+
+Head *string_alloc_new( Program *prg, const char *data, long length );
+Head *string_alloc_const( Program *prg, const char *data, long length );
+Head *string_copy( Program *prg, Head *head );
+void string_free( Program *prg, Head *head );
+
+void print_str( Head *str );
+
+long string_length( Head *str );
+const char *string_data( Head *str );
+void string_shorten( Head *tokdata, long newlen );
+void ignore_data( Tree *tree, char *dest );
+long ignore_length( Tree *tree );
+void free_obj_data( Program *prg, Kid *attrs );
+Head *concat_str( Head *s1, Head *s2 );
+Word cmp_string( Head *s1, Head *s2 );
+Word str_atoi( Head *str );
+Head *int_to_str( Program *prg, Word i );
+Word str_uord16( Head *head );
+Word str_uord8( Head *head );
+Head *make_literal( Program *prg, long litoffset );
+void rcode_downref( Tree **stack_root, Program *prg, Code *instr );
+void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *cv );
+void xml_print_tree( Tree **&sp, Program *prg, Tree *tree );
+void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
+void parsed_downref( Tree **root, Program *prg, Tree *tree );
+Stream *open_stream( Program *prg, FILE *file );
+Tree *construct_string( Program *prg, Head *s );
+void list_free( Program *prg, List *list );
+void ignore_free( Program *prg, Tree *tree );
+void map_free( Program *prg, Map *map );
+void stream_free( Program *prg, Stream *s );
+
+void tree_downref( Program *prg, Tree *tree );
+void tree_upref( Tree *tree );
+Kid *tree_child( Program *prg, Tree *tree );
+Kid *tree_extract_child( Program *prg, Tree *tree );
+Kid *tree_ignore( Program *prg, Tree *tree );
+void print_tree( Tree **&sp, Program *prg, Tree *tree );
+void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
+bool tree_is_ignore( Program *prg, Kid *kid );
+Kid *kid_list_concat( Kid *list1, Kid *list2 );
+
+/*
+ * Maps
+ */
+struct GenericInfo	/* description of one generic type; field meanings are not visible here */
+{
+	long type;	/* presumably one of GEN_LIST, GEN_MAP, GEN_VECTOR -- confirm */
+	long typeArg;
+	long keyOffset;
+	long keyType;
+	long langElId;
+};
+
+long cmp_tree( const Tree *tree1, const Tree *tree2 );
+
+/*
+ * Runtime environment
+ */
+
+struct PoolItem	/* free-list link that PoolAlloc::free() overlays on a released element */
+{
+	PoolItem *next;	/* next released element, or 0 at the end of the list */
+};
+
+template <class T> struct PoolBlock	/* one chunk of FRESH_BLOCK elements handed out by PoolAlloc */
+{
+	T data[FRESH_BLOCK];
+	PoolBlock<T> *next;	/* the block that was allocated before this one */
+};
+
+template <class T> struct PoolAlloc	/* pool allocator: carves elements out of PoolBlocks and recycles freed ones through a free list */
+{
+	PoolAlloc() : 
+		head(0), nextel(FRESH_BLOCK), pool(0)	/* nextel == FRESH_BLOCK makes the first allocate() create a block */
+	{}
+
+	T *allocate();
+	void free( T *el );
+	void clear();
+	long numlost();
+
+	PoolBlock<T> *head;	/* most recently allocated block */
+	long nextel;	/* index of the next unused slot in head */
+	PoolItem *pool;	/* free list of released elements */
+};
+
+template <class T> T *PoolAlloc<T>::allocate()	/* returns a zero-filled element, taken from the free list when it is not empty */
+{
+	//#ifdef COLM_LOG_BYTECODE
+	//cerr << "allocating in: " << __PRETTY_FUNCTION__ << endl;
+	//#endif
+
+	T *newEl = 0;
+	if ( pool == 0 ) {	/* nothing to recycle: take the next slot of the head block */
+		if ( nextel == FRESH_BLOCK ) {	/* head block is used up, or no block exists yet */
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "allocating " << FRESH_BLOCK << " Elements of type T" << endl;
+			#endif
+
+			PoolBlock<T> *newBlock = new PoolBlock<T>;
+			newBlock->next = head;
+			head = newBlock;
+			nextel = 0;
+		}
+		newEl = &head->data[nextel++];
+	}
+	else {
+		newEl = (T*)pool;	/* pop the first released element */
+		pool = pool->next;
+	}
+	memset( newEl, 0, sizeof(T) );	/* no constructor is run; the element is only zeroed */
+	return newEl;
+}
+
+template <class T> void PoolAlloc<T>::free( T *el )	/* zero el and push it onto the free list; no memory is returned to the system */
+{
+	//#ifdef COLM_LOG_BYTECODE
+	//cerr << "freeing in: " << __PRETTY_FUNCTION__ << endl;
+	//#endif
+
+	memset( el, 0, sizeof(T) );
+	PoolItem *pi = (PoolItem*) el;	/* the element's own storage holds the list link */
+	pi->next = pool;
+	pool = pi;
+}
+
+template <class T> void PoolAlloc<T>::clear()	/* delete every block and return the pool to its freshly constructed state */
+{
+	PoolBlock<T> *block = head;
+	while ( block != 0 ) {
+		PoolBlock<T> *next = block->next;
+		delete block;
+		block = next;
+	}
+
+	head = 0;
+	nextel = FRESH_BLOCK;	/* same as the constructor: forces allocate() to make a new block instead of indexing the null head */
+	pool = 0;	/* the free list pointed into the deleted blocks */
+}
+
+template <class T> long PoolAlloc<T>::numlost()
+{
+	/* Count the number of items handed out of the blocks so far. */
+	long lost = 0;
+	PoolBlock<T> *block = head;
+	if ( block != 0 ) {
+		lost = nextel;	/* only the head block can be partially used */
+		block = block->next;
+		while ( block != 0 ) {
+			lost += FRESH_BLOCK;
+			block = block->next;
+		}
+	}
+
+	/* Subtract the items that are sitting on the free list. */
+	PoolItem *pi = pool;
+	while ( pi != 0 ) {
+		lost -= 1;
+		pi = pi->next;
+	}
+
+	return lost;
+}
+
+struct Int;
+
+struct Program	/* program-wide runtime state: runtime data, element pools, shared values and standard streams */
+{
+	Program( bool ctxDepParsing, RuntimeData *rtd );
+
+	bool ctxDepParsing;
+	RuntimeData *rtd;
+	Tree *global;
+
+	PoolAlloc<Kid> kidPool;
+	PoolAlloc<Tree> treePool;
+	PoolAlloc<Alg> algPool;
+	PoolAlloc<ListEl> listElPool;
+	PoolAlloc<MapEl> mapElPool;
+
+	Tree *trueVal;
+	Tree *falseVal;
+
+	void run();
+	void clear();
+	void clearGlobal();
+	void freshGlobal();
+
+	Kid *heap;
+
+	Stream *stdinVal;	/* the IN_GET_STDIN instruction opens this on first use, while it is still 0 */
+	Stream *stdoutVal;
+	Stream *stderrVal;
+};
+
+struct Execution	/* state of one bytecode run; keeps a reference to the caller's reverse-code vector */
+{
+	Execution( Program *prg, CodeVect &reverseCode,
+			PdaRun *parser, Code *code, Tree *lhs, Head *matchText );
+
+	Program *prg;
+	PdaTables *pdaTables;
+	PdaRun *parser;
+	Code *code;
+	Tree **frame;
+	Tree **iframe;
+	Tree *lhs;
+
+	Head *matchText;
+	bool reject;
+
+	/* Reverse code. Held by reference, so the vector must outlive this object. */
+	CodeVect &reverseCode;
+	long rcodeUnitLen;
+
+	void execute( Tree **root );
+	void rexecute( Tree **root, Code *revcode, CodeVect &allRev );
+	void execute( Tree **&sp, Code *instr );
+	void rdownref( Code *instr );
+};
+
+#endif
diff --git a/colm/closure.cpp b/colm/closure.cpp
new file mode 100644
index 00000000..3a10d030
--- /dev/null
+++ b/colm/closure.cpp
@@ -0,0 +1,450 @@
+/*
+ *  Copyright 2005 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "colm.h"
+#include "parsedata.h"
+
+#include "vector.h"
+#include <assert.h>
+#include <string.h>
+#include <iostream>
+
+using std::endl;
+using std::cerr;
+
+void ParseData::lr0BringInItem( PdaGraph *pdaGraph, PdaState *dest, PdaState *prodState, 
+		PdaTrans *expandFrom, Definition *prod )
+{
+	/* Merge the item prodState into dest. We use dot sets for finding unique states. In the
+	 * future, should merge dot sets with the stateSet pointer (only need one of these). */
+	assert( dest != prodState );
+	dest->dotSet.insert( prodState->dotSet );
+
+	/* Bring in the pending commits of the item. */
+	dest->pendingCommits.insert( prodState->pendingCommits );
+	//if ( prodState->pendingCommits.length() > 0 )
+	//	cerr << "THERE ARE PENDING COMMITS DRAWN IN" << endl;
+	
+	if ( prodState->transMap.length() > 0 ) {
+		assert( prodState->transMap.length() == 1 );
+		PdaTrans *srcTrans = prodState->transMap[0].value;
+
+		/* Look for the source in the destination. */
+		TransMapEl *destTel = dest->transMap.find( srcTrans->lowKey );
+		if ( destTel == 0 ) {
+			/* Make a new state and transition to it. */
+			PdaState *newState = pdaGraph->addState();
+			PdaTrans *newTrans = new PdaTrans();
+
+			/* Attach the new transition to the new state. */
+			newTrans->lowKey = srcTrans->lowKey;
+			pdaGraph->attachTrans( dest, newState, newTrans );
+			pdaGraph->addInTrans( newTrans, srcTrans );
+
+			/* The transitions we make during lr0 closure are all shifts. */
+			assert( newTrans->isShift );
+			assert( srcTrans->isShift );
+
+			/* The new state must have its state set setup. */
+			newState->stateSet = new PdaStateSet;
+			newState->stateSet->insert( srcTrans->toState );
+
+			/* Insert the transition into the map. Be sure to set destTel, it
+			 * is needed below. */
+			dest->transMap.insert( srcTrans->lowKey, newTrans, &destTel );
+
+			/* If the item is a non-term, queue it for closure. */
+			KlangEl *langEl = langElIndex[srcTrans->lowKey];
+			if ( langEl != 0 && langEl->type == KlangEl::NonTerm ) {
+				pdaGraph->transClosureQueue.append( newTrans );
+				//cerr << "put to trans closure queue" << endl;
+			}
+		}
+		else {
+			//cerr << "merging transitions" << endl;
+			destTel->value->toState->stateSet->insert( srcTrans->toState );
+			pdaGraph->addInTrans( destTel->value, srcTrans );
+		}
+
+		/* If this is an expansion then we may need to bring in commits. */
+		if ( expandFrom != 0 && expandFrom->commits.length() > 0 ) {
+			//cerr << "SETTING COMMIT ON CLOSURE ROUND" << endl;
+			destTel->value->commits.insert( expandFrom->commits );
+
+			expandFrom->commits.empty();	/* NOTE(review): presumably aapl's empty() discards the contents rather than testing for emptiness -- confirm */
+		}
+	}
+	else {
+		/* ProdState does not have any transitions out. It is at the end of a
+		 * production. */
+		if ( expandFrom != 0 && expandFrom->commits.length() > 0 ) {
+			//cerr << "SETTING COMMIT IN PENDING LOOKAHEAD" << endl;
+			for ( LongSet::Iter len = expandFrom->commits; len.lte(); len++ )
+				dest->pendingCommits.insert( ProdIdPair( prod->prodId, *len ) );
+
+			expandFrom->commits.empty();	/* NOTE(review): same assumption about empty() as above -- confirm */
+		}
+	}
+}
+
+void ParseData::lr0InvokeClosure( PdaGraph *pdaGraph, PdaState *state )
+{
+	/* State should not already be closed. */
+	assert( !state->inClosedMap );
+
+	/* This is used each time we invoke closure, it must be cleared. */
+	pdaGraph->transClosureQueue.abandon();
+
+	/* Drag in the core items. No expansion transition or production applies to these. */
+	for ( PdaStateSet::Iter ssi = *state->stateSet; ssi.lte(); ssi++ )
+		lr0BringInItem( pdaGraph, state, *ssi, 0, 0 );
+
+	/* Now bring in the derived items. */
+	while ( pdaGraph->transClosureQueue.length() > 0 ) {
+		PdaTrans *toClose = pdaGraph->transClosureQueue.detachFirst();
+		//cerr << "have a transition to derive" << endl;
+
+		/* Get the langEl. */
+		KlangEl *langEl = langElIndex[toClose->lowKey];
+
+		/* Make graphs for all of the productions that the non
+		 * terminal goes to that are not already in the state's dotSet. */
+		for ( LelDefList::Iter prod = langEl->defList; prod.lte(); prod++ ) {
+			/* Bring in the start state of the production. */
+			lr0BringInItem( pdaGraph, state, prod->fsm->startState, toClose, prod );
+		}
+	}
+
+	/* Try and insert into the closed dict. */
+	DotSetMapEl *lastFound;
+	if ( pdaGraph->closedMap.insert( state, &lastFound ) ) {
+		/* Insertion into closed dict succeeded. There is no state with the
+		 * same dot set. The state is now closed. It is guaranteed a spot in
+		 * the closed dict and it will never go away (states never deleted
+		 * during closure). */
+		pdaGraph->stateClosedList.append( state );
+		state->inClosedMap = true;
+
+		/* Add all of the states in the out transitions to the closure queue. They are appended
+		 * here and lr0CloseAllStates takes from the front, so the graph is searched breadth first. */
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			/* Get the state the transEl goes to. */
+			PdaState *targ = trans->value->toState;
+
+			/* If the state on this transition has not already been slated
+			 * for closure, then add it to the queue. */
+			if ( !targ->onClosureQueue && !targ->inClosedMap ) {
+				pdaGraph->stateClosureQueue.append( targ );
+				targ->onClosureQueue = true;
+			}
+		}
+	}
+	else {
+		/* Insertion into closed dict failed. There is an existing state with the same dot set (lastFound).
+		 * Presumably inTransMove hands the in-transitions to it; this state, its out transitions and their targets are then deleted. */
+		pdaGraph->inTransMove( lastFound, state );
+		for ( TransMap::Iter tel = state->transMap; tel.lte(); tel++ ) {
+			pdaGraph->stateList.detach( tel->value->toState );
+			delete tel->value->toState;
+			delete tel->value;
+		}
+		pdaGraph->stateList.detach( state );
+		delete state;
+	}
+}
+
+/* Run closure over the whole graph. States are taken from the front of
+ * the closure queue, which gives a breadth first search of the tree we
+ * build. Note, there are back edges in this tree. They are the edges
+ * made when, upon closure, a dot set exists already. */
+void ParseData::lr0CloseAllStates( PdaGraph *pdaGraph )
+{
+	/* Drain the closure queue; closing a state may append more states. */
+	for ( ; pdaGraph->stateClosureQueue.length() > 0; ) {
+		/* Take the oldest pending state and mark it as off the queue. */
+		PdaState *pending = pdaGraph->stateClosureQueue.detachFirst();
+		pending->onClosureQueue = false;
+
+		/* Close it. */
+		lr0InvokeClosure( pdaGraph, pending );
+	}
+}
+
+void ParseData::transferCommits( PdaGraph *pdaGraph, PdaTrans *trans, 
+		PdaState *state, long prodId )
+{
+	/* Copy onto trans the length of every pending commit of state whose onReduce is prodId. */
+	for ( ProdIdPairSet::Iter pend = state->pendingCommits; pend.lte(); pend++ ) {
+		if ( pend->onReduce == prodId )
+			trans->commits.insert( pend->length );
+	}
+}
+
+void ParseData::lalr1AddFollow2( PdaGraph *pdaGraph, PdaTrans *trans, FollowToAdd &followKeys )	/* add a reduction on every follow key to each state trans expands to */
+{
+	for ( ExpandToSet::Iter ets = trans->expandTo; ets.lte(); ets++ ) {
+		int prodId = ets->prodId;
+		PdaState *expandTo = ets->state;
+
+		for ( FollowToAdd::Iter fkey = followKeys; fkey.lte(); fkey++ ) {
+			TransMapEl *transEl = expandTo->transMap.find( fkey->key );
+
+			if ( transEl != 0 ) {
+				/* A transition on this key exists already: add the reduction to it. */
+				PdaTrans *destTrans = transEl->value;
+
+				transferCommits( pdaGraph, destTrans, expandTo, prodId );
+
+				pdaGraph->addInReduction( destTrans, prodId, fkey->value );
+			}
+			else {
+				/* Set up the follow transition. */
+				PdaTrans *followTrans = new PdaTrans;
+				followTrans->lowKey = fkey->key;
+				followTrans->isShift = false;
+				followTrans->reductions.insert( prodId, fkey->value );
+
+				transferCommits( pdaGraph, followTrans, expandTo, prodId );
+
+				pdaGraph->attachTrans( expandTo, actionDestState, followTrans );
+				expandTo->transMap.insert( followTrans->lowKey, followTrans );
+				pdaGraph->transClosureQueue.append( followTrans );	/* new transitions are queued so follow can be added for them in turn */
+			}
+		}
+	}
+}
+
+long PdaTrans::maxPrior()
+{
+	long highest = LONG_MIN;
+	if ( isShift && shiftPrior > highest )
+		highest = shiftPrior;
+	for ( ReductionMap::Iter cand = reductions; cand.lte(); cand++ ) {
+		if ( cand->value > highest )
+			highest = cand->value;
+	}
+	return highest;	/* LONG_MIN when this is not a shift and there are no reductions */
+}
+
+void ParseData::lalr1AddFollow1( PdaGraph *pdaGraph, PdaState *state )
+{
+	/* Find the transitions into the state that are on non-terminals. */
+	for ( PdaTransInList::Iter in = state->inRange; in.lte(); in++ ) {
+		long key = in->lowKey; 
+		KlangEl *langEl = langElIndex[key];
+		if ( langEl != 0 && langEl->type == KlangEl::NonTerm ) {
+			/* Collect the out transitions on terminals (keys with no language element count too), each with its highest priority. */
+			FollowToAdd followKeys;
+			for ( TransMap::Iter fout = state->transMap; fout.lte(); fout++ ) {
+				int fkey = fout->key; 
+				KlangEl *flel = langElIndex[fkey];
+				if ( flel == 0 || flel->type == KlangEl::Term ) {
+					long prior = fout->value->maxPrior();
+					followKeys.insert( fkey, prior );
+				}
+			}
+
+			if ( followKeys.length() > 0 )
+				lalr1AddFollow2( pdaGraph, in, followKeys );
+		}
+	}
+}
+
+void ParseData::lalr1AddFollow2( PdaGraph *pdaGraph, PdaTrans *trans, 
+		long followKey, long prior )	/* single-key form: add a reduction on followKey to each state trans expands to */
+{
+	for ( ExpandToSet::Iter ets = trans->expandTo; ets.lte(); ets++ ) {
+		int prodId = ets->prodId;
+		PdaState *expandTo = ets->state;
+
+		TransMapEl *transEl = expandTo->transMap.find( followKey );
+		if ( transEl != 0 ) {
+			/* Add in the reductions, or in the shift. */
+			PdaTrans *destTrans = transEl->value;
+
+			transferCommits( pdaGraph, destTrans, expandTo, prodId );
+
+			pdaGraph->addInReduction( destTrans, prodId, prior );
+		}
+		else {
+			/* Set up the follow transition. */
+			PdaTrans *followTrans = new PdaTrans;
+			followTrans->lowKey = followKey;
+			followTrans->isShift = false;
+			followTrans->reductions.insert( prodId, prior );
+
+			transferCommits( pdaGraph, followTrans, expandTo, prodId );
+
+			pdaGraph->attachTrans( expandTo, actionDestState, followTrans );
+			expandTo->transMap.insert( followTrans->lowKey, followTrans );
+			pdaGraph->transClosureQueue.append( followTrans );	/* new transitions are queued so follow can be added for them in turn */
+		}
+	}
+}
+
+void ParseData::lalr1AddFollow1( PdaGraph *pdaGraph, PdaTrans *trans )	/* transition form: used for transitions taken off the closure queue */
+{
+	PdaState *state = trans->fromState;
+	int fkey = trans->lowKey; 
+	KlangEl *flel = langElIndex[fkey];
+	if ( flel == 0 || flel->type == KlangEl::Term ) {
+		/* Find the transitions into the state that are on non-terminals. */
+		for ( PdaTransInList::Iter in = state->inRange; in.lte(); in++ ) {
+			long key = in->lowKey; 
+			KlangEl *langEl = langElIndex[key];
+			if ( langEl != 0 && langEl->type == KlangEl::NonTerm ) {
+				//cerr << "FOLLOW PRIOR TRANSFER 2: " << prior << endl;
+				long prior = trans->maxPrior();
+				lalr1AddFollow2( pdaGraph, in, fkey, prior );
+			}
+		}
+	}
+}
+
+/* Add follow sets to an LR(0) graph to make it LALR(1). */
+void ParseData::lalr1AddFollowSets( PdaGraph *pdaGraph, KlangEl *rootEl )
+{
+	/* Make the state that all reduction actions go to. Since a reduction pops
+	 * states off the stack and sets the new target state, this state is
+	 * actually never reached. It is just here to link the trans to. */
+	actionDestState = pdaGraph->addState();
+	pdaGraph->setFinState( actionDestState );
+
+	/* Get the entry into the graph and traverse over start. */
+	PdaState *overStart = pdaGraph->followFsm( pdaGraph->startState, rootEl->rootDef->fsm );
+
+	/* Add _eof after the initial _start. */
+	PdaTrans *eofTrans = pdaGraph->insertNewTrans( overStart, actionDestState, 
+			eofKlangEl->id, eofKlangEl->id );
+	eofTrans->isShift = true;
+
+	/* This was used during lr0 table construction. */
+	pdaGraph->transClosureQueue.abandon();
+
+	/* Need to pass over every state initially. */
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ )
+		lalr1AddFollow1( pdaGraph, state );
+
+	/* While the closure queue has items, pop them off and add follow
+	 * characters. */
+	while ( pdaGraph->transClosureQueue.length() > 0 ) {
+		/* Pop the first item off and add follow for it. */
+		PdaTrans *trans = pdaGraph->transClosureQueue.detachFirst();
+		lalr1AddFollow1( pdaGraph, trans );
+	}
+}
+
+void ParseData::linkExpansions( PdaGraph *pdaGraph )	/* fill in expandTo for every transition on a non-terminal */
+{
+	pdaGraph->setStateNumbers();
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		/* Find transitions out on non terminals. */
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			long key = trans->key;
+			KlangEl *langEl = langElIndex[key];
+			if ( langEl != 0 && langEl->type == KlangEl::NonTerm ) {
+				/* For each production that the non terminal expands to ... */
+				for ( LelDefList::Iter prod = langEl->defList; prod.lte(); prod++ ) {
+					/* Follow the production and add to the trans's expand to set. */
+					PdaState *followRes = pdaGraph->followFsm( state, prod->fsm );
+
+					//KlangEl *lel = langElIndex[key];
+					//cerr << state->stateNum << ", "; 
+					//if ( lel != 0 )
+					//	cerr << lel->data;
+					//else
+					//	cerr << (char)key;
+					//cerr << " -> " << (*fto)->stateNum << " on " <<
+					//		prod->data << " (fss = " << fin.pos() << ")" << endl;
+					trans->value->expandTo.insert( ExpandToEl( followRes, prod->prodId ) );
+				}
+			}
+		}
+	}
+}
+
+/* Add terminal versions of all nonterminal transitions: each one is duplicated on the key lel->termDup->id, going to the same target state. */
+void ParseData::addDupTerms( PdaGraph *pdaGraph )
+{
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		PdaTransList newTransitions;
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			KlangEl *lel = langElIndex[trans->value->lowKey];
+			if ( lel != 0 && lel->type == KlangEl::NonTerm ) {	/* keys without a language element are skipped, as in the other passes */
+				PdaTrans *dupTrans = new PdaTrans;
+				dupTrans->lowKey = lel->termDup->id;
+				dupTrans->isShift = true;
+
+				/* Stash the target state in toState. In the next loop when we
+				 * attach the transition we must clear this because the
+				 * attaching code requires the transition to be unattached. */
+				dupTrans->toState = trans->value->toState;
+				newTransitions.append( dupTrans );
+
+				/* Commit code used? */
+				//transferCommits( pdaGraph, followTrans, expandTo, prodId );
+			}
+		}
+
+		for ( PdaTrans *dup = newTransitions.head; dup != 0; ) {	/* attach after the scan; presumably so transMap is not changed while it is iterated */
+			PdaTrans *next = dup->next;
+			PdaState *toState = dup->toState;
+			dup->toState = 0;
+			pdaGraph->attachTrans( state, toState, dup );
+			state->transMap.insert( dup->lowKey, dup );
+			dup = next;
+		}
+	}
+}
+
+/* Generate a LALR(1) graph: LR(0) closure from the root definition, then duplicate terminals, expansion links and follow sets. */
+void ParseData::lalr1GenerateParser( PdaGraph *pdaGraph, KlangEl *rootEl )
+{
+	/* Make the initial graph. */
+	pdaGraph->langElIndex = langElIndex;
+
+	PdaState *start = pdaGraph->addState();
+	pdaGraph->setStartState( start );
+
+	start->stateSet = new PdaStateSet;
+	start->stateSet->insert( rootEl->rootDef->fsm->startState );
+
+	/* Queue the start state for closure. */
+	start->onClosureQueue = true;
+	pdaGraph->stateClosureQueue.append( start );
+
+	/* Run the lr0 closure. */
+	lr0CloseAllStates( pdaGraph );
+
+	/* Add terminal versions of all nonterminal transitions. */
+	addDupTerms( pdaGraph );
+
+	/* Link production expansions to the place they expand to. */
+	linkExpansions( pdaGraph );
+
+	/* Walk the graph adding follow sets to the LR(0) graph. */
+	lalr1AddFollowSets( pdaGraph, rootEl );
+
+//	/* Set the commit on the final eof shift. */
+//	PdaTrans *overStart = pdaGraph->startState->findTrans( rootEl->id );
+//	PdaTrans *eofTrans = overStart->toState->findTrans( eofKlangEl->id );
+//	eofTrans->afterShiftCommits.insert( 2 );
+}
diff --git a/colm/colm.h b/colm/colm.h
new file mode 100644
index 00000000..9d906c49
--- /dev/null
+++ b/colm/colm.h
@@ -0,0 +1,92 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _COLM_H
+#define _COLM_H
+
+#include <stdio.h>
+#include <iostream>
+#include <fstream>
+#include <fstream>
+#include <string>
+
+#include "config.h"
+#include "avltree.h"
+#include "common.h"
+
+#define PROGNAME "colm"
+
+/* IO filenames and stream. */
+extern bool printPrintables;
+extern bool graphvizDone;
+
+extern int gblErrorCount;
+
+std::ostream &error();
+
+/* IO filenames and stream. */
+extern const char *outputFileName;
+extern std::ostream *outStream;
+extern bool generateGraphviz;
+extern bool branchPointInfo;
+extern bool addUniqueEmptyProductions;
+
+extern int gblErrorCount;
+extern char startDefName[];
+
+/* Error reporting. */
+std::ostream &error();
+std::ostream &error( int first_line, int first_column );
+std::ostream &warning( ); 
+std::ostream &warning( int first_line, int first_column );
+
+struct exit_object { };
+extern exit_object endp;
+void operator<<( std::ostream &out, exit_object & );
+
+extern std::ostream *outStream;
+extern bool printStatistics;
+
+extern int gblErrorCount;
+extern char machineMain[];
+
+/* Location in an input file. */
+struct InputLoc
+{
+	const char *fileName;
+	int line;
+	int col;
+};
+
+/* Error reporting. */
+std::ostream &error();
+std::ostream &error( const InputLoc &loc ); 
+std::ostream &warning( const InputLoc &loc ); 
+
+void scan( char *fileName, std::istream &input, std::ostream &output );
+void terminateAllParsers( );
+void checkMachines( );
+
+void xmlEscapeHost( std::ostream &out, char *data, int len );
+void openOutput();
+void escapeLiteralString( std::ostream &out, const char *data );
+
+#endif /* _COLM_H */
diff --git a/colm/compile.cpp b/colm/compile.cpp
new file mode 100644
index 00000000..ebe1fbdc
--- /dev/null
+++ b/colm/compile.cpp
@@ -0,0 +1,2492 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "bytecode.h"
+#include "parsedata.h"
+#include <iostream>
+#include <assert.h>
+
+using std::cout;
+using std::cerr;
+using std::endl;
+
+void ParseData::initUniqueTypes( )
+{
+	uniqueTypeNil = new UniqueType( TYPE_NIL );
+	uniqueTypePtr = new UniqueType( TYPE_TREE, ptrKlangEl );
+	uniqueTypeBool = new UniqueType( TYPE_TREE, boolKlangEl );
+	uniqueTypeInt = new UniqueType( TYPE_TREE, intKlangEl );
+	uniqueTypeStr = new UniqueType( TYPE_TREE, strKlangEl );
+	uniqueTypeStream = new UniqueType( TYPE_TREE, streamKlangEl );
+	uniqueTypeAny = new UniqueType( TYPE_TREE, anyKlangEl );
+
+	uniqeTypeMap.insert( uniqueTypeNil );
+	uniqeTypeMap.insert( uniqueTypePtr );
+	uniqeTypeMap.insert( uniqueTypeBool );
+	uniqeTypeMap.insert( uniqueTypeInt );
+	uniqeTypeMap.insert( uniqueTypeStr );
+	uniqeTypeMap.insert( uniqueTypeStream );
+	uniqeTypeMap.insert( uniqueTypeAny );
+}
+
+IterDef::IterDef( Type type ) : 
+	type(type), 
+	func(0),
+	useFuncId(false),
+	useSearchUT(false)
+{
+	if ( type == Tree ) {
+		inCreate = IN_TRITER_FROM_REF;
+		inDestroy = IN_TRITER_DESTROY;
+		inAdvance = IN_TRITER_ADVANCE;
+
+		inGetCurR = IN_TRITER_GET_CUR_R;
+		inGetCurWC = IN_TRITER_GET_CUR_WC;
+		inSetCurWC = IN_TRITER_SET_CUR_WC;
+		inRefFromCur = IN_TRITER_REF_FROM_CUR;
+		useSearchUT = true;
+	}
+	else if ( type == Child ) {
+		inCreate = IN_TRITER_FROM_REF;
+		inDestroy = IN_TRITER_DESTROY;
+		inAdvance = IN_TRITER_NEXT_CHILD;
+
+		inGetCurR = IN_TRITER_GET_CUR_R;
+		inGetCurWC = IN_TRITER_GET_CUR_WC;
+		inSetCurWC = IN_TRITER_SET_CUR_WC;
+		inRefFromCur = IN_TRITER_REF_FROM_CUR;
+		useSearchUT = true;
+	}
+	else if ( type == RevChild ) {
+		inCreate = IN_TRITER_FROM_REF;
+		inDestroy = IN_TRITER_DESTROY;
+		inAdvance = IN_TRITER_PREV_CHILD;
+
+		inGetCurR = IN_TRITER_GET_CUR_R;
+		inGetCurWC = IN_TRITER_GET_CUR_WC;
+		inSetCurWC = IN_TRITER_SET_CUR_WC;
+		inRefFromCur = IN_TRITER_REF_FROM_CUR;
+		useSearchUT = true;
+	}
+	else
+		assert(false);
+}
+
+IterDef::IterDef( Type type, Function *func ) : 
+	type(type),
+	func(func),
+	useFuncId(true),
+	useSearchUT(true),
+	inCreate(IN_UITER_CREATE),
+	inDestroy(IN_UITER_DESTROY),
+	inAdvance(IN_UITER_ADVANCE),
+	inGetCurR(IN_UITER_GET_CUR_R),
+	inGetCurWC(IN_UITER_GET_CUR_WC),
+	inSetCurWC(IN_UITER_SET_CUR_WC),
+	inRefFromCur(IN_UITER_REF_FROM_CUR)
+{}
+
+ObjMethod *initFunction( UniqueType *retType, ObjectDef *obj, 
+		const String &name, int methIdWC, int methIdWV, bool isConst )
+{
+	ObjMethod *objMethod = new ObjMethod( retType, name, 
+			methIdWC, methIdWV, 0, 0, 0, isConst );
+	obj->objMethodMap->insert( name, objMethod );
+	return objMethod;
+}
+
+ObjMethod *initFunction( UniqueType *retType, ObjectDef *obj, 
+		const String &name, int methIdWC, int methIdWV, UniqueType *arg1, bool isConst )
+{
+	UniqueType *args[] = { arg1 };
+	ObjMethod *objMethod = new ObjMethod( retType, name, 
+			methIdWC, methIdWV, 1, args, 0, isConst );
+	obj->objMethodMap->insert( name, objMethod );
+	return objMethod;
+}
+
+ObjMethod *initFunction( UniqueType *retType, ObjectDef *obj, 
+		const String &name, int methIdWC, int methIdWV, 
+		UniqueType *arg1, UniqueType *arg2, bool isConst )
+{
+	UniqueType *args[] = { arg1, arg2 };
+	ObjMethod *objMethod = new ObjMethod( retType, name, 
+			methIdWC, methIdWV, 2, args, 0, isConst );
+	obj->objMethodMap->insert( name, objMethod );
+	return objMethod;
+}
+
+IterDef *ParseData::findIterDef( IterDef::Type type, Function *func )
+{
+	IterDefSetEl *el = iterDefSet.find( IterDef( type, func ) );
+	if ( el == 0 )
+		el = iterDefSet.insert( IterDef( type, func ) );
+	return &el->key;
+}
+
+IterDef *ParseData::findIterDef( IterDef::Type type )
+{
+	IterDefSetEl *el = iterDefSet.find( IterDef( type ) );
+	if ( el == 0 )
+		el = iterDefSet.insert( IterDef( type ) );
+	return &el->key;
+}
+
+UniqueType *ParseData::findUniqueType( int typeId )
+{
+	UniqueType searchKey( typeId );
+	UniqueType *uniqueType = uniqeTypeMap.find( &searchKey );
+	if ( uniqueType == 0 ) {
+		uniqueType = new UniqueType( typeId );
+		uniqeTypeMap.insert( uniqueType );
+	}
+	return uniqueType;
+}
+
+UniqueType *ParseData::findUniqueType( int typeId, KlangEl *langEl )
+{
+	UniqueType searchKey( typeId, langEl );
+	UniqueType *uniqueType = uniqeTypeMap.find( &searchKey );
+	if ( uniqueType == 0 ) {
+		uniqueType = new UniqueType( typeId, langEl );
+		uniqeTypeMap.insert( uniqueType );
+	}
+	return uniqueType;
+}
+
+UniqueType *ParseData::findUniqueType( int typeId, IterDef *iterDef )
+{
+	UniqueType searchKey( typeId, iterDef );
+	UniqueType *uniqueType = uniqeTypeMap.find( &searchKey );
+	if ( uniqueType == 0 ) {
+		uniqueType = new UniqueType( typeId, iterDef );
+		uniqeTypeMap.insert( uniqueType );
+	}
+	return uniqueType;
+}
+
+UniqueType *TypeRef::lookupTypePart( ParseData *pd, 
+		NamespaceQual *qual, const String &name )
+{
+	/* Look up the qualification and then the name. */
+	Namespace *nspace = qual->getQual( pd );
+
+	if ( nspace == 0 )
+		error(loc) << "do not have region for resolving reference" << endp;
+
+	/* Search for the token in the region by name. */
+	SymbolMapEl *inDict = nspace->symbolMap.find( name );
+	if ( inDict != 0 ) {
+		long typeId = ( isPtr ? TYPE_PTR : ( isRef ? TYPE_REF : TYPE_TREE ) );
+		return pd->findUniqueType( typeId, inDict->value );
+	}
+
+	error(loc) << "unknown type in typeof expression" << endp;
+	return 0;
+}
+
+UniqueType *TypeRef::lookupType( ParseData *pd )
+{
+	if ( uniqueType != 0 )
+		return uniqueType;
+	
+	if ( iterDef != 0 )
+		uniqueType = pd->findUniqueType( TYPE_ITER, iterDef );
+	else if ( factor != 0 )
+		uniqueType = pd->findUniqueType( TYPE_TREE, factor->langEl );
+	else {
+		String name = typeName;
+		if ( isOpt )
+			name.setAs( 32, "_opt_%s", name.data );
+		else if ( isRepeat )
+			name.setAs( 32, "_repeat_%s", name.data );
+
+		/* Not an iterator. May be a reference. */
+		uniqueType = lookupTypePart( pd, nspaceQual, name );
+	}
+
+	return uniqueType;
+}
+
+ObjField *ObjectDef::findField( String name )
+{
+	ObjFieldMapEl *objDefMapEl = objFieldMap->find( name );
+	if ( objDefMapEl != 0 )
+		return objDefMapEl->value;
+	return 0;
+}
+
+ObjMethod *ObjectDef::findMethod( String name )
+{
+	ObjMethodMapEl *objMethodMapEl = objMethodMap->find( name );
+	if ( objMethodMapEl != 0 )
+		return objMethodMapEl->value;
+	return 0;
+}
+
+long sizeOfField( UniqueType *fieldUT )
+{
+	long size = 0;
+	if ( fieldUT->typeId == TYPE_ITER ) {
+		/* Select on the iterator type. */
+		if ( fieldUT->iterDef->type == IterDef::Tree ||
+				fieldUT->iterDef->type == IterDef::Child ||
+				fieldUT->iterDef->type == IterDef::RevChild )
+			size = sizeof(TreeIter) / sizeof(Word);
+		else if ( fieldUT->iterDef->type == IterDef::User ) {
+			/* User iterators are just a pointer to the UserIter struct. The
+			 * struct needs to go right beneath the call to the user iterator
+			 * so it can be found by a yield. It is therefore allocated on the
+			 * stack right before the call. */
+			size = 1;
+		}
+		else {
+			assert(false);
+		}
+	}
+	else if ( fieldUT->typeId == TYPE_REF )
+		size = 2;
+	else
+		size = 1;
+
+	return size;
+}
+
+void ObjectDef::referenceField( ParseData *pd, ObjField *field )
+{
+	field->beenReferenced = true;
+	initField( pd, field );
+}
+
+void ObjectDef::initField( ParseData *pd, ObjField *field )
+{
+	if ( !field->beenInitialized ) {
+		field->beenInitialized = true;
+		UniqueType *fieldUT = field->typeRef->lookupType( pd );
+
+		if ( type == FrameType ) {
+			nextOffset += sizeOfField( fieldUT );
+			field->offset = -nextOffset;
+
+			pd->initLocalInstructions( field );
+		}
+		else {
+			field->offset = nextOffset;
+			nextOffset += sizeOfField( fieldUT );
+
+			/* Initialize the instructions. */
+			pd->initFieldInstructions( field );
+		}
+	}
+}
+
+UniqueType *LangVarRef::loadFieldInstr( ParseData *pd, CodeVect &code, 
+		ObjectDef *inObject, ObjField *el, bool forWriting, bool revert )
+{
+	/* Ensure that the field is referenced. */
+	inObject->referenceField( pd, el );
+
+	UniqueType *elUT = el->typeRef->lookupType( pd );
+
+	/* Pick the load instruction according to the access mode. */
+	if ( forWriting ) {
+		/* The instruction, depends on whether or not we are reverting. */
+		if ( elUT->typeId == TYPE_ITER )
+			code.append( elUT->iterDef->inGetCurWC );
+		else if ( revert )
+			code.append( el->inGetWV );
+		else
+			code.append( el->inGetWC );
+	}
+	else {
+		/* Loading something for reading. */
+		if ( elUT->typeId == TYPE_ITER )
+			code.append( elUT->iterDef->inGetCurR );
+		else
+			code.append( el->inGetR );
+	}
+
+	if ( el->useOffset ) {
+		/* Gets of locals and fields require offsets. Fake vars like token
+		 * data and lhs don't require it. */
+		code.appendHalf( el->offset );
+	}
+
+	/* If we are dealing with an iterator then dereference it. */
+	if ( elUT->typeId == TYPE_ITER )
+		elUT = el->typeRef->searchTypeRef->lookupType( pd );
+
+	return elUT;
+}
+
+ObjectDef *objDefFromUT( ParseData *pd, UniqueType *ut )
+{
+	ObjectDef *objDef = 0;
+	if ( ut->typeId == TYPE_TREE || ut->typeId == TYPE_REF )
+		objDef = ut->langEl->objectDef;
+	else {
+		/* This should have generated a compiler error. */
+		assert(false);
+	}
+	return objDef;
+}
+
+void LangVarRef::loadQualification( ParseData *pd, CodeVect &code, 
+		ObjectDef *rootObj, int lastPtrInQual, bool forWriting, bool revert )
+{
+	/* Start the search from the root object. */
+	ObjectDef *searchObjDef = rootObj;
+
+	for ( QualItemVect::Iter qi = *qual; qi.lte(); qi++ ) {
+		/* Lookup the field in the current qualification. */
+		ObjFieldMapEl *objDefMapEl = searchObjDef->objFieldMap->find( qi->data );
+		if ( objDefMapEl == 0 )
+			error(qi->loc) << "cannot resolve qualification " << qi->data << endp;
+		ObjField *el = objDefMapEl->value;
+
+		if ( forWriting && el->refActive )
+			error(qi->loc) << "reference active, cannot write to object" << endp;
+
+		bool lfForWriting = forWriting;
+		bool lfRevert = revert;
+
+		/* If there is a pointer in the qualification, we need to compute
+		 * forWriting and revert. */
+		if ( lastPtrInQual >= 0 ) {
+			if ( qi.pos() <= lastPtrInQual ) {
+				/* If we are before or at the pointer we are strictly read
+				 * only, regardless of the origin. */
+				lfForWriting = false;
+				lfRevert = false;
+			}
+			else {
+				/* If we are past the pointer then we are always reverting
+				 * because the object is global. Forwriting is as passed in.
+				 * */
+				lfRevert = true;
+			}
+		}
+
+		UniqueType *qualUT = loadFieldInstr( pd, code, searchObjDef, 
+				el, lfForWriting, lfRevert );
+		
+		if ( qi->type == QualItem::Dot ) {
+			/* Cannot dot a reference. Iterator yes (access of the iterator not
+			 * the current) */
+			if ( qualUT->typeId == TYPE_PTR )
+				error(loc) << "dot cannot be used to access a pointer" << endp;
+		}
+		else if ( qi->type == QualItem::Arrow ) {
+			if ( qualUT->typeId == TYPE_PTR ) {
+				/* Always dereference references when used for qualification. If
+				 * this is the last one then we must start with the reverse
+				 * execution business. */
+				if ( qi.pos() == lastPtrInQual && forWriting ) {
+					/* This is like a global load. */
+					code.append( IN_PTR_DEREF_WV );
+				}
+				else {
+					/* If reading or not yet the last in ref then we only need a
+					 * reading deref. */
+					code.append( IN_PTR_DEREF_R );
+				}
+
+				qualUT = pd->findUniqueType( TYPE_TREE, qualUT->langEl );
+			}
+			else {
+				error(loc) << "arrow operator cannot be used to access this type" << endp;
+			}
+		}
+
+		searchObjDef = objDefFromUT( pd, qualUT );
+	}
+}
+
+void LangVarRef::loadGlobalObj( ParseData *pd, CodeVect &code, 
+		int lastPtrInQual, bool forWriting )
+{
+	/* Start the search in the global object. */
+	ObjectDef *rootObj = pd->globalObjectDef;
+
+	if ( forWriting && lastPtrInQual < 0 ) {
+		/* If we are writing and no reference was found in the qualification
+		 * then load the global with a revert. */
+		code.append( IN_LOAD_GLOBAL_WV );
+	}
+	else
+		code.append( IN_LOAD_GLOBAL_R );
+
+	loadQualification( pd, code, rootObj, lastPtrInQual, forWriting, true );
+}
+
+void LangVarRef::loadLocalObj( ParseData *pd, CodeVect &code, 
+		int lastPtrInQual, bool forWriting )
+{
+	/* Start the search in the local frame. */
+	ObjectDef *rootObj = pd->curLocalFrame;
+	loadQualification( pd, code, rootObj, lastPtrInQual, forWriting, false );
+}
+
+bool LangVarRef::isLocalRef( ParseData *pd )
+{
+	if ( qual->length() > 0 ) {
+		if ( pd->curLocalFrame->objFieldMap->find( qual->data[0].data ) != 0 )
+			return true;
+	}
+	else if ( pd->curLocalFrame->objFieldMap->find( name ) != 0 )
+		return true;
+	else if ( pd->curLocalFrame->objMethodMap->find( name ) != 0 )
+		return true;
+
+	return false;
+}
+
+void LangVarRef::loadObj( ParseData *pd, CodeVect &code, 
+		int lastPtrInQual, bool forWriting )
+{
+	if ( isLocalRef( pd ) )
+		loadLocalObj( pd, code, lastPtrInQual, forWriting );
+	else
+		loadGlobalObj( pd, code, lastPtrInQual, forWriting );
+}
+
+VarRefLookup LangVarRef::lookupQualification( ParseData *pd, ObjectDef *rootDef ) const
+{
+	int lastPtrInQual = -1;
+	ObjectDef *searchObjDef = rootDef;
+	int firstConstPart = -1;
+
+	for ( QualItemVect::Iter qi = *qual; qi.lte(); qi++ ) {
+		/* Lookup the field in the current qualification. */
+		ObjFieldMapEl *objDefMapEl = searchObjDef->objFieldMap->find( qi->data );
+		if ( objDefMapEl == 0 )
+			error(qi->loc) << "cannot resolve qualification " << qi->data << endp;
+		ObjField *el = objDefMapEl->value;
+
+		/* Lookup the type of the field. */
+		UniqueType *qualUT = el->typeRef->lookupType( pd );
+
+		/* If we are dealing with an iterator then dereference it. */
+		if ( qualUT->typeId == TYPE_ITER )
+			qualUT = el->typeRef->searchTypeRef->lookupType( pd );
+
+		/* Is it const? */
+		if ( firstConstPart < 0 && el->isConst )
+			firstConstPart = qi.pos();
+
+		/* Check for references. When loop is done we will have the last one
+		 * present, if any. */
+		if ( qualUT->typeId == TYPE_PTR )
+			lastPtrInQual = qi.pos();
+
+		if ( qi->type == QualItem::Dot ) {
+			/* Cannot dot a reference. Iterator yes (access of the iterator
+			 * not the current) */
+			if ( qualUT->typeId == TYPE_PTR )
+				error(loc) << "dot cannot be used to access a pointer" << endp;
+		}
+		else if ( qi->type == QualItem::Arrow ) {
+			if ( qualUT->typeId == TYPE_ITER )
+				qualUT = el->typeRef->searchTypeRef->lookupType( pd );
+			else if ( qualUT->typeId == TYPE_PTR )
+				qualUT = pd->findUniqueType( TYPE_TREE, qualUT->langEl );
+		}
+
+		searchObjDef = objDefFromUT( pd, qualUT );
+	}
+
+	return VarRefLookup( lastPtrInQual, firstConstPart, searchObjDef );
+}
+
+VarRefLookup LangVarRef::lookupObj( ParseData *pd )
+{
+	ObjectDef *rootDef;
+	if ( isLocalRef( pd ) )
+		rootDef = pd->curLocalFrame;
+	else
+		rootDef = pd->globalObjectDef;
+
+	return lookupQualification( pd, rootDef );
+}
+
+VarRefLookup LangVarRef::lookupField( ParseData *pd )
+{
+	/* Lookup the object that the field is in. */
+	VarRefLookup lookup = lookupObj( pd );
+
+	/* Lookup the field. */
+	ObjFieldMapEl *objDefMapEl = lookup.inObject->objFieldMap->find( name );
+	if ( objDefMapEl == 0 )
+		error(loc) << "cannot find name " << name << " in object" << endp;
+
+	ObjField *field = objDefMapEl->value;
+
+	lookup.objField = field;
+	lookup.uniqueType = field->typeRef->lookupType( pd );
+
+	if ( field->typeRef->searchTypeRef != 0 )
+		lookup.iterSearchUT = field->typeRef->searchTypeRef->lookupType( pd );
+
+	return lookup;
+}
+
+VarRefLookup LangVarRef::lookupMethod( ParseData *pd )
+{
+	/* Lookup the object that the method is in. */
+	VarRefLookup lookup = lookupObj( pd );
+
+	/* Find the method. */
+	assert( lookup.inObject->objMethodMap != 0 );
+	ObjMethod *method = lookup.inObject->findMethod( name );
+	if ( method == 0 )
+		error(loc) << "cannot find " << name << "(...) in object" << endp;
+	
+	lookup.objMethod = method;
+	lookup.uniqueType = method->returnUT;
+	
+	return lookup;
+}
+
+void LangVarRef::setFieldInstr( ParseData *pd, CodeVect &code, 
+		ObjectDef *inObject, ObjField *el, UniqueType *exprUT, bool revert )
+{
+	/* Ensure that the field is referenced. */
+	inObject->referenceField( pd, el );
+
+	if ( revert )
+		code.append( el->inSetWV );
+	else
+		code.append( el->inSetWC );
+
+	/* Maybe write out an offset. */
+	if ( el->useOffset )
+		code.appendHalf( el->offset );
+}
+
+bool castAssignment( ParseData *pd, CodeVect &code, UniqueType *destUT, 
+		UniqueType *destSearchUT, UniqueType *srcUT )
+{
+	if ( destUT == srcUT )
+		return true;
+
+	/* Casting trees to any. */
+	if ( destUT->typeId == TYPE_TREE && destUT->langEl == pd->anyKlangEl &&
+			srcUT->typeId == TYPE_TREE )
+		return true;
+	
+	/* Setting a reference from a tree. */
+	if ( destUT->typeId == TYPE_REF && srcUT->typeId == TYPE_TREE &&
+			destUT->langEl == srcUT->langEl )
+		return true;
+	
+	/* Setting an iterator from a tree. */
+	if ( destUT->typeId == TYPE_ITER && srcUT->typeId == TYPE_TREE && 
+			destSearchUT->langEl == srcUT->langEl )
+		return true;
+	
+	/* Assigning nil to a tree. */
+	if ( destUT->typeId == TYPE_TREE && srcUT->typeId == TYPE_NIL )
+		return true;
+
+	/* Assigning nil to a pointer. */
+	if ( destUT->typeId == TYPE_PTR && srcUT->typeId == TYPE_NIL )
+		return true;
+
+	return false;
+}
+
+void LangVarRef::setField( ParseData *pd, CodeVect &code, 
+		ObjectDef *inObject, UniqueType *exprUT, bool revert )
+{
+	ObjFieldMapEl *objDefMapEl = inObject->objFieldMap->find( name );
+	if ( objDefMapEl == 0 )
+		error(loc) << "cannot find name " << name << " in object" << endp;
+
+	ObjField *el = objDefMapEl->value;
+	setFieldInstr( pd, code, inObject, el, exprUT, revert );
+}
+
+void LangVarRef::setFieldIter( ParseData *pd, CodeVect &code, 
+		ObjectDef *inObject, UniqueType *objUT, UniqueType *exprType, bool revert )
+{
+	ObjFieldMapEl *objDefMapEl = inObject->objFieldMap->find( name );
+	if ( objDefMapEl == 0 )
+		error(loc) << "cannot find name " << name << " in object" << endp;
+
+	ObjField *el = objDefMapEl->value;
+	code.append( objUT->iterDef->inSetCurWC );
+	code.appendHalf( el->offset );
+}
+
+UniqueType *LangVarRef::evaluate( ParseData *pd, CodeVect &code, bool forWriting )
+{
+	/* Lookup the loadObj. */
+	VarRefLookup lookup = lookupField( pd );
+
+	/* Load the object, if any. */
+	loadObj( pd, code, lookup.lastPtrInQual, forWriting );
+
+	/* Load the field. */
+	UniqueType *ut = loadFieldInstr( pd, code, lookup.inObject, 
+			lookup.objField, forWriting, false );
+
+	return ut;
+}
+
+/* Emit code that takes a reference to a field. Returns the field referenced. */
+ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code )
+{
+	/* Lookup the field. Both errors below end in endp, like the rest of the file. */
+	VarRefLookup lookup = lookupField( pd );
+
+	if ( lookup.inObject->type != ObjectDef::FrameType )
+		error(loc) << "can only take references of local variables" << endp;
+	
+	if ( lookup.objField->refActive )
+		error(loc) << "reference current active, cannot take another" << endp;
+
+	/* Ensure that the field is referenced. */
+	lookup.inObject->referenceField( pd, lookup.objField );
+
+	/* Note that we could have modified children. */
+	lookup.objField->refActive = true;
+
+	if ( lookup.objField->typeRef->iterDef != 0 ) {
+		code.append( lookup.objField->typeRef->iterDef->inRefFromCur );
+		code.appendHalf( lookup.objField->offset );
+	}
+	else if ( lookup.objField->typeRef->isRef ) {
+		code.append( IN_REF_FROM_REF );
+		code.appendHalf( lookup.objField->offset );
+	}
+	else {
+		code.append( IN_REF_FROM_LOCAL );
+		code.appendHalf( lookup.objField->offset );
+	}
+
+	return lookup.objField;
+}
+
+ObjField **LangVarRef::evaluateArgs( ParseData *pd, CodeVect &code, 
+		VarRefLookup &lookup, ExprVect *args )
+{
+	/* Parameter list is given only for user defined methods. Otherwise it
+	 * will be null. */
+	ParameterList *paramList = lookup.objMethod->paramList;
+
+	/* Match the number of arguments. */
+	int numArgs = args != 0 ? args->length() : 0;
+	if ( numArgs != lookup.objMethod->numParams )
+		error(loc) << "wrong number of arguments" << endp;
+
+	/* This is for storing the object fields used by references. */
+	ObjField **paramRefs = new ObjField*[numArgs];
+	memset( paramRefs, 0, sizeof(ObjField*) * numArgs );
+
+	/* Evaluate and push the args. */
+	if ( args != 0 ) {
+		/* If we have the parameter list, initialize an iterator. */
+		ParameterList::Iter p;
+		paramList != 0 && ( p = *paramList );
+
+		for ( ExprVect::Iter pe = *args; pe.lte(); pe++ ) {
+			/* Get the expression and the UT for the arg. */
+			LangExpr *expression = *pe;
+			UniqueType *paramUT = lookup.objMethod->paramUTs[pe.pos()];
+
+			if ( paramUT->typeId == TYPE_REF ) {
+				/* Make sure we are dealing with a variable reference. */
+				if ( expression->type != LangExpr::TermType )
+					error(loc) << "not a term: argument must be a local variable" << endp;
+				if ( expression->term->type != LangTerm::VarRefType )
+					error(loc) << "not a variable: argument must be a local variable" << endp;
+
+				/* Lookup the field. */
+				LangVarRef *varRef = expression->term->varRef;
+
+				ObjField *refOf = varRef->evaluateRef( pd, code );
+				paramRefs[pe.pos()] = refOf;
+			}
+			else {
+				UniqueType *exprUT = expression->evaluate( pd, code );
+
+				if ( !castAssignment( pd, code, paramUT, 0, exprUT ) )
+					error(loc) << "arg " << pe.pos()+1 << " is of the wrong type" << endp;
+			}
+
+			/* Advance the parameter list iterator if we have it. */
+			paramList != 0 && p.increment();
+		}
+	}
+
+	return paramRefs;
+}
+
+void LangVarRef::resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs )
+{
+	/* Clear the refActive mark on every field recorded in paramRefs, one
+	 * slot per parameter of the method. Null slots are skipped. */
+	for ( long p = 0; p < lookup.objMethod->numParams; p++ ) {
+		if ( paramRefs[p] != 0 )
+			paramRefs[p]->refActive = false;
+	}
+}
+
+
+void LangVarRef::callOperation( ParseData *pd, CodeVect &code, VarRefLookup &lookup )
+{
+	/* This is for writing if it is a non-const builtin. */
+	bool forWriting = lookup.objMethod->func == 0 && 
+			!lookup.objMethod->isConst;
+
+	if ( lookup.objMethod->useCallObj ) {
+		/* Load the object, if any. */
+		loadObj( pd, code, lookup.lastPtrInQual, forWriting );
+	}
+
+	/* Check if we need to revert the function. If it operates on a reference
+	 * or if it is not local then we need to revert it. */
+	bool revert = lookup.lastPtrInQual >= 0 || !isLocalRef(pd);
+	
+	/* The call instruction. */
+	if ( revert ) 
+		code.append( lookup.objMethod->opcodeWV );
+	else
+		code.append( lookup.objMethod->opcodeWC );
+	
+	if ( lookup.objMethod->useFuncId )
+		code.appendHalf( lookup.objMethod->funcId );
+}
+
+UniqueType *LangVarRef::evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args )
+{
+	/* Evaluate the object. */
+	VarRefLookup lookup = lookupMethod( pd );
+
+	/* Evaluate and push the arguments. */
+	ObjField **paramRefs = evaluateArgs( pd, code, lookup, args );
+
+	/* Write the call opcode. */
+	callOperation( pd, code, lookup );
+
+	resetActiveRefs( pd, lookup, paramRefs );
+	delete[] paramRefs;
+
+	/* Return the type to the expression. */
+	return lookup.uniqueType;
+}
+
+UniqueType *LangTerm::evaluateMatch( ParseData *pd, CodeVect &code )
+{
+	/* Add the vars bound by the pattern into the local scope. */
+	for ( PatternItemList::Iter item = *pattern->list; item.lte(); item++ ) {
+		if ( item->varRef != 0 )
+			item->bindId = pattern->nextBindId++;
+	}
+
+	UniqueType *ut = varRef->evaluate( pd, code );
+	if ( ut->typeId != TYPE_TREE )
+		error(varRef->loc) << "expected match against a tree type" << endp;
+
+	/* Store the language element type in the pattern. This is needed by
+	 * the pattern parser. */
+	pattern->langEl = ut->langEl;
+
+	code.append( IN_MATCH );
+	code.appendHalf( pattern->patRepId );
+
+	for ( PatternItemList::Iter item = pattern->list->last(); item.gtb(); item-- ) {
+		if ( item->varRef != 0 ) {
+			/* Compute the unique type. */
+			UniqueType *exprType = pd->findUniqueType( TYPE_TREE, item->factor->langEl );
+
+			/* Get the type of the variable being assigned to. */
+			VarRefLookup lookup = item->varRef->lookupField( pd );
+
+			item->varRef->loadObj( pd, code, lookup.lastPtrInQual, false );
+			item->varRef->setField( pd, code, lookup.inObject, exprType, false );
+		}
+	}
+
+	return ut;
+}
+
+UniqueType *LangTerm::evaluateNew( ParseData *pd, CodeVect &code )
+{
+	/* Evaluate the expression. */
+	UniqueType *ut = expr->evaluate( pd, code );
+	if ( ut->typeId != TYPE_TREE )
+		error() << "new can only be applied to tree types" << endp;
+
+	code.append( IN_TREE_NEW );
+	return pd->findUniqueType( TYPE_PTR, ut->langEl );
+}
+
+void LangTerm::assignFieldArgs( ParseData *pd, CodeVect &code, UniqueType *replUT )
+{
+	/* Now assign the field initializations. Note that we need to do this in
+	 * reverse because the last expression evaluated is at the top of the
+	 * stack. */
+	if ( fieldInitArgs != 0 && fieldInitArgs->length() > 0 ) {
+		ObjectDef *objDef = objDefFromUT( pd, replUT );
+		/* Note the reverse traversal. */
+		for ( FieldInitVect::Iter pi = fieldInitArgs->last(); pi.gtb(); pi-- ) {
+			FieldInit *fieldInit = *pi;
+			ObjFieldMapEl *el = objDef->objFieldMap->find( fieldInit->name );
+			if ( el == 0 ) {
+				error(fieldInit->loc) << "failed to find init name " << 
+					fieldInit->name << " in object" << endp;
+			}
+
+			/* Lookup the type of the field and compare it to the type of the
+			 * expression. */
+			ObjField *field = el->value;
+			UniqueType *fieldUT = field->typeRef->lookupType( pd );
+			if ( !castAssignment( pd, code, fieldUT, 0, fieldInit->exprUT ) )
+				error(fieldInit->loc) << "type mismatch in initialization" << endp;
+
+			/* The set field instruction must leave the object on the top of
+			 * the stack. */
+			code.append( IN_SET_FIELD_LEAVE_WC );
+			code.appendHalf( field->offset );
+		}
+	}
+}
+
+UniqueType *LangTerm::evaluateTreeConstruct( ParseData *pd, CodeVect &code )
+{
+	/* Evaluate the initialization expressions. */
+	if ( fieldInitArgs != 0 && fieldInitArgs->length() > 0 ) {
+		for ( FieldInitVect::Iter pi = *fieldInitArgs; pi.lte(); pi++ ) {
+			FieldInit *fieldInit = *pi;
+			fieldInit->exprUT = fieldInit->expr->evaluate( pd, code );
+		}
+	}
+
+	/* Assign bind ids to the variables in the replacement. */
+	for ( ReplItemList::Iter item = *replacement->list; item.lte(); item++ ) {
+		if ( item->varRef != 0 )
+			item->bindId = replacement->nextBindId++;
+	}
+
+	/* Evaluate variable references. */
+	for ( ReplItemList::Iter item = replacement->list->last(); item.gtb(); item-- ) {
+		if ( item->type == ReplItem::VarRefType ) {
+			UniqueType *ut = item->varRef->evaluate( pd, code );
+		
+			if ( ut->typeId != TYPE_TREE )
+				error() << "variables used in replacements must be trees" << endp;
+
+			item->langEl = ut->langEl;
+		}
+	}
+
+	/* Construct the tree using the tree information stored in the compiled
+	 * code. */
+	code.append( IN_CONSTRUCT );
+	code.appendHalf( replacement->patRepId );
+
+	/* Lookup the type of the replacement and store it in the replacement
+	 * object so that replacement parsing has a target. */
+	UniqueType *replUT = typeRef->lookupType( pd );
+	if ( replUT->typeId == TYPE_TREE )
+		replacement->langEl = replUT->langEl;
+	else
+		error(loc) << "don't know how to construct this type" << endp;
+
+	assignFieldArgs( pd, code, replUT );
+
+	return replUT;
+}
+
+
+UniqueType *LangTerm::evaluateTermConstruct( ParseData *pd, CodeVect &code )
+{
+	/* Going to make this replacement directly. Take it out of the list of
+	 * replacements so that we don't try to parse it. */
+	pd->replList.remove( replacement );
+
+	/* Evaluate the initialization expressions. */
+	if ( fieldInitArgs != 0 && fieldInitArgs->length() > 0 ) {
+		for ( FieldInitVect::Iter pi = *fieldInitArgs; pi.lte(); pi++ ) {
+			FieldInit *fieldInit = *pi;
+			fieldInit->exprUT = fieldInit->expr->evaluate( pd, code );
+		}
+	}
+
+	UniqueType *replUT = typeRef->lookupType( pd );
+
+	/* Evaluate the expression that we are constructing the term with and make
+	 * the term. */
+	ReplItem *replItem = replacement->list->head;
+	replItem->varRef->evaluate( pd, code );
+	code.append( IN_CONSTRUCT_TERM );
+	code.appendHalf( replUT->langEl->id );
+
+	assignFieldArgs( pd, code, replUT );
+	return replUT;
+}
+
+/* Decide if this construct can be made directly from a string: the target
+ * must be a tree type with an id below pd->firstNonTermId and the
+ * replacement must be exactly one variable reference of string type. */
+bool LangTerm::constructTermFromString( ParseData *pd )
+{
+	UniqueType *targetUT = typeRef->lookupType( pd );
+
+	/* The target has to be a tree type ... */
+	if ( targetUT->typeId != TYPE_TREE )
+		return false;
+
+	/* ... whose id comes before the first nonterminal id. */
+	if ( targetUT->langEl->id >= pd->firstNonTermId )
+		return false;
+
+	/* There must be exactly one replacement item. */
+	if ( replacement->list->length() != 1 )
+		return false;
+
+	/* That one item must be a variable reference. */
+	ReplItem *onlyItem = replacement->list->head;
+	if ( onlyItem->type != ReplItem::VarRefType )
+		return false;
+
+	/* And the variable must be a string. */
+	VarRefLookup found = onlyItem->varRef->lookupField( pd );
+	return found.uniqueType == pd->uniqueTypeStr;
+}
+
+/* Generate code for a construct expression. A token type given just a
+ * string is built from the text of that string. Anything else goes through
+ * the normal tree construction. */
+UniqueType *LangTerm::evaluateConstruct( ParseData *pd, CodeVect &code )
+{
+	return constructTermFromString( pd ) 
+			? evaluateTermConstruct( pd, code )
+			: evaluateTreeConstruct( pd, code );
+}
+
+/* Generate code for a parse expression. The type named by typeRef must be a
+ * tree type and there must be exactly one argument, which must evaluate to
+ * the stream type. Emits IN_PARSE followed by two half-word operands: the
+ * parser id allocated for the type and, when stop is true, the id of the
+ * type's language element (zero otherwise). Returns the type being parsed. */
+UniqueType *LangTerm::evaluateParse( ParseData *pd, CodeVect &code, bool stop )
+{
+	/* End the message with endp like the other checks in this function do.
+	 * NOTE(review): endp presumably aborts the compile where endl only ends
+	 * the line, which would let us carry on with a non-tree type -- confirm
+	 * against the definition of endp. */
+	UniqueType *ut = typeRef->lookupType( pd );
+	if ( ut->typeId != TYPE_TREE )
+		error(loc) << "can only parse trees" << endp;
+	
+	/* Should be one arg, a stream. */
+	if ( args == 0 || args->length() != 1 )
+		error(loc) << "expecting one argument" << endp;
+
+	UniqueType *argUT = args->data[0]->evaluate( pd, code );
+	if ( argUT != pd->uniqueTypeStream )
+		error(loc) << "single argument must be a stream" << endp;
+
+	/* Allocate a parser id. This will cause a parser to be built for
+	 * the type. */
+	ut->langEl->parserId = pd->nextParserId++;
+
+	code.append( IN_PARSE );
+	code.appendHalf( ut->langEl->parserId );
+
+	/* Second operand: the language element id when stopping, else zero. */
+	if ( stop )
+		code.appendHalf( ut->langEl->id );
+	else 
+		code.appendHalf( 0 );
+	return ut;
+}
+
+/* Generate code for this term, dispatching on the kind of term, and return
+ * the type of the result. Returns 0 when the kind is not handled by the
+ * switch. */
+UniqueType *LangTerm::evaluate( ParseData *pd, CodeVect &code )
+{
+	switch ( type ) {
+		case VarRefType:
+			return varRef->evaluate( pd, code );
+		case MethodCallType:
+			return varRef->evaluateCall( pd, code, args );
+		case NilType:
+			code.append( IN_LOAD_NIL );
+			return pd->uniqueTypeNil;
+		case TrueType:
+			code.append( IN_LOAD_TRUE );
+			return pd->uniqueTypeBool;
+		case FalseType:
+			code.append( IN_LOAD_FALSE );
+			return pd->uniqueTypeBool;
+		case MakeTokenType:
+			return evaluateMakeToken( pd, code );
+		case MakeTreeType:
+			return evaluateMakeTree( pd, code );
+		case NumberType: {
+			/* The literal text is converted with atoi and loaded as a word. */
+			unsigned int n = atoi( data );
+			code.append( IN_LOAD_INT );
+			code.appendWord( n );
+			return pd->uniqueTypeInt;
+		}
+		case StringType: {
+			String interp;
+			bool unused;
+			prepareLitString( interp, unused, data, InputLoc() );
+
+			/* Make sure we have this string. A newly inserted string is
+			 * given the next index; an existing one keeps the index it
+			 * already has. */
+			StringMapEl *mapEl = 0;
+			if ( pd->literalStrings.insert( interp, &mapEl ) )
+				mapEl->value = pd->literalStrings.length()-1;
+
+			code.append( IN_LOAD_STR );
+			code.appendWord( mapEl->value );
+			return pd->uniqueTypeStr;
+		}
+		case MatchType:
+			return evaluateMatch( pd, code );
+		case ParseType:
+			return evaluateParse( pd, code, false );
+		case ParseStopType:
+			return evaluateParse( pd, code, true );
+		case ConstructType:
+			return evaluateConstruct( pd, code );
+		case NewType:
+			return evaluateNew( pd, code );
+		case TypeIdType: {
+			/* Look up the type. Report the failure with our location, as
+			 * the other errors raised from this term do. */
+			UniqueType *ut = typeRef->lookupType( pd );
+			if ( ut->typeId != TYPE_TREE )
+				error(loc) << "typeid can only be applied to tree types" << endp;
+
+			/* The typeid is the language element id loaded as an int. */
+			code.append( IN_LOAD_INT );
+			code.appendWord( ut->langEl->id );
+			return pd->uniqueTypeInt;
+		}
+		case SearchType: {
+			/* The type we are searching for. */
+			UniqueType *ut = typeRef->lookupType( pd );
+			if ( ut->typeId != TYPE_TREE )
+				error(loc) << "can only search for tree types" << endp;
+
+			/* The tree we are searching in. End the message with endp to
+			 * match the check above. NOTE(review): presumably endp aborts
+			 * where endl would let code generation continue -- confirm. */
+			UniqueType *treeUT = varRef->evaluate( pd, code );
+			if ( treeUT->typeId != TYPE_TREE )
+				error(loc) << "search can be applied only to tree types" << endp;
+
+			code.append( IN_TREE_SEARCH );
+			code.appendWord( ut->langEl->id );
+			return ut;
+		}
+	}
+	return 0;
+}
+
+/* Generate code for this expression and return the type of the result.
+ * Binary expressions evaluate the left operand and then the right operand
+ * before emitting the operator instruction. Unary expressions evaluate the
+ * right operand. Term expressions defer to the term. Returns 0 when the
+ * expression kind is not handled. */
+UniqueType *LangExpr::evaluate( ParseData *pd, CodeVect &code )
+{
+	switch ( type ) {
+		case BinaryType: {
+			switch ( op ) {
+				case '+': {
+					UniqueType *lt = left->evaluate( pd, code );
+					UniqueType *rt = right->evaluate( pd, code );
+
+					/* Integer addition. */
+					if ( lt == pd->uniqueTypeInt && rt == pd->uniqueTypeInt ) {
+						code.append( IN_ADD_INT );
+						return pd->uniqueTypeInt;
+					}
+
+					/* String concatenation. */
+					if ( lt == pd->uniqueTypeStr && rt == pd->uniqueTypeStr ) {
+						code.append( IN_CONCAT_STR );
+						return pd->uniqueTypeStr;
+					}
+
+					error(loc) << "do not have an addition operator for these types" << endp;
+					break;
+				}
+				case '-': {
+					UniqueType *lt = left->evaluate( pd, code );
+					UniqueType *rt = right->evaluate( pd, code );
+
+					if ( lt == pd->uniqueTypeInt && rt == pd->uniqueTypeInt ) {
+						code.append( IN_SUB_INT );
+						return pd->uniqueTypeInt;
+					}
+
+					/* Name the operator that was actually used. */
+					error(loc) << "do not have a subtraction operator for these types" << endp;
+					break;
+				}
+				case '*': {
+					UniqueType *lt = left->evaluate( pd, code );
+					UniqueType *rt = right->evaluate( pd, code );
+
+					if ( lt == pd->uniqueTypeInt && rt == pd->uniqueTypeInt ) {
+						code.append( IN_MULT_INT );
+						return pd->uniqueTypeInt;
+					}
+
+					error(loc) << "do not have a multiplication "
+							"operator for these types" << endp;
+					break;
+				}
+				case OP_DoubleEql: {
+					UniqueType *lt = left->evaluate( pd, code );
+					UniqueType *rt = right->evaluate( pd, code );
+
+					/* Both sides must have the very same type. */
+					if ( lt != rt )
+						error(loc) << "comparison of different types" << endp;
+						
+					code.append( IN_TST_EQL );
+					return pd->uniqueTypeBool;
+				}
+				case OP_NotEql: {
+					UniqueType *lt = left->evaluate( pd, code );
+					UniqueType *rt = right->evaluate( pd, code );
+
+					/* Both sides must have the very same type. */
+					if ( lt != rt )
+						error(loc) << "comparison of different types" << endp;
+
+					code.append( IN_TST_NOT_EQL );
+					return pd->uniqueTypeBool;
+				}
+				/* The ordering tests below do not check operand types. */
+				case '<': {
+					left->evaluate( pd, code );
+					right->evaluate( pd, code );
+
+					code.append( IN_TST_LESS );
+					return pd->uniqueTypeBool;
+				}
+				case '>': {
+					left->evaluate( pd, code );
+					right->evaluate( pd, code );
+
+					code.append( IN_TST_GRTR );
+					return pd->uniqueTypeBool;
+				}
+				case OP_LessEql: {
+					left->evaluate( pd, code );
+					right->evaluate( pd, code );
+
+					code.append( IN_TST_LESS_EQL );
+					return pd->uniqueTypeBool;
+				}
+				case OP_GrtrEql: {
+					left->evaluate( pd, code );
+					right->evaluate( pd, code );
+
+					code.append( IN_TST_GRTR_EQL );
+					return pd->uniqueTypeBool;
+				}
+				case OP_LogicalAnd: {
+					/* Evaluate the left and duplicate it. */
+					left->evaluate( pd, code );
+					code.append( IN_DUP_TOP );
+
+					/* Jump over the right if false, leaving the original left
+					 * result on the top of the stack. We don't know the
+					 * distance yet so record the position of the jump. */
+					long jump = code.length();
+					code.append( IN_JMP_FALSE );
+					code.appendHalf( 0 );
+
+					/* Evaluate the right, add the test. */
+					right->evaluate( pd, code );
+					code.append( IN_TST_LOGICAL_AND );
+
+					/* Set the distance of the jump. The three accounts for
+					 * the jump opcode and its half-word operand. */
+					long distance = code.length() - jump - 3;
+					code.setHalf( jump+1, distance );
+
+					return pd->uniqueTypeInt;
+				}
+				case OP_LogicalOr: {
+					/* Evaluate the left and duplicate it. */
+					left->evaluate( pd, code );
+					code.append( IN_DUP_TOP );
+
+					/* Jump over the right if true, leaving the original left
+					 * result on the top of the stack. We don't know the
+					 * distance yet so record the position of the jump. */
+					long jump = code.length();
+					code.append( IN_JMP_TRUE );
+					code.appendHalf( 0 );
+
+					/* Evaluate the right, add the test. */
+					right->evaluate( pd, code );
+					code.append( IN_TST_LOGICAL_OR );
+
+					/* Set the distance of the jump. The three accounts for
+					 * the jump opcode and its half-word operand. */
+					long distance = code.length() - jump - 3;
+					code.setHalf( jump+1, distance );
+
+					return pd->uniqueTypeInt;
+				}
+			}
+
+			/* Reached for an unknown operator and after a reported type
+			 * error, should the error not end the compile. */
+			assert(false);
+			return 0;
+		}
+		case UnaryType: {
+			switch ( op ) {
+				case '!': {
+					/* Evaluate the operand and negate it. */
+					right->evaluate( pd, code );
+					code.append( IN_NOT );
+					return pd->uniqueTypeBool;
+				}
+				case OP_Deref: {
+					/* End the message with endp like the other errors in
+					 * this function. NOTE(review): presumably endp aborts
+					 * where endl would let us dereference a non-pointer
+					 * -- confirm. */
+					UniqueType *ut = right->evaluate( pd, code );
+					if ( ut->typeId != TYPE_PTR )
+						error(loc) << "can only dereference pointers" << endp;
+
+					/* The result is the tree type of the pointed-to
+					 * language element. */
+					code.append( IN_PTR_DEREF_R );
+					ut = pd->findUniqueType( TYPE_TREE, ut->langEl );
+					return ut;
+				}
+				default: 
+					assert(false);
+			}
+			return 0;
+		}
+		case TermType: {
+			return term->evaluate( pd, code );
+		}
+	}
+	return 0;
+}
+
+/* Generate the code that stores an already evaluated expression, of type
+ * exprUT, into the variable this reference names. Reports an error if the
+ * target has an active reference, is const, is reached through a const
+ * qualification, or if the types cannot be reconciled. */
+void LangVarRef::assignValue( ParseData *pd, CodeVect &code, 
+		UniqueType *exprUT )
+{
+	/* Resolve the left hand side. */
+	VarRefLookup lhs = lookupField( pd );
+
+	/* Writes are refused while a reference to the field is active. */
+	if ( lhs.objField->refActive )
+		error(loc) << "reference active, cannot write to object" << endp;
+
+	/* Writes are refused through a const part of the qualification. */
+	if ( lhs.firstConstPart >= 0 ) {
+		error(loc) << "left hand side qualification \"" <<
+			qual->data[lhs.firstConstPart].data << "\" is const" << endp;
+	}
+
+	/* Writes are refused to a const field. */
+	if ( lhs.objField->isConst )
+		error(loc) << "field \"" << name << "\" is const" << endp;
+
+	/* Reconcile the type of the field with the type of the expression,
+	 * casting if that is possible. */
+	UniqueType *fieldUT = lhs.objField->typeRef->lookupType( pd );
+	assert( lhs.uniqueType == lhs.objField->typeRef->lookupType( pd ) );
+	const bool compatible = castAssignment( pd, code, 
+			fieldUT, lhs.iterSearchUT, exprUT );
+	if ( !compatible )
+		error(loc) << "type mismatch in assignment" << endp;
+	
+	/* The assignment needs reverting when it goes through a pointer or
+	 * when the target is not a local. */
+	const bool revert = lhs.lastPtrInQual >= 0 || !isLocalRef(pd);
+
+	/* Load the object, then emit the store. */
+	loadObj( pd, code, lhs.lastPtrInQual, true );
+
+	if ( lhs.uniqueType->typeId != TYPE_ITER ) {
+		setField( pd, code, lhs.inObject, exprUT, revert );
+		return;
+	}
+
+	/* Iterators have their own store. */
+	setFieldIter( pd, code, lhs.inObject, lhs.uniqueType, exprUT, false );
+}
+
+/* Generate code for make_token. At least two arguments are required: the
+ * first must be an int and the second a string. Every argument is evaluated
+ * in order, then IN_MAKE_TOKEN is emitted with the argument count. */
+UniqueType *LangTerm::evaluateMakeToken( ParseData *pd, CodeVect &code )
+{
+	/* A check restricting make_token to translation blocks used to sit
+	 * here. It is disabled:
+	 *
+	 * if ( pd->compileContext != ParseData::CompileTranslation )
+	 *     error(loc) << "make_token can be used only in a translation block" << endp;
+	 */
+
+	/* A missing argument list counts as zero arguments. */
+	int numArgs = 0;
+	if ( args != 0 )
+		numArgs = args->length();
+
+	if ( numArgs < 2 )
+		error(loc) << "need at least two arguments" << endp;
+
+	/* Evaluate the arguments, checking the types of the first two. */
+	for ( ExprVect::Iter arg = *args; arg.lte(); arg++ ) {
+		UniqueType *argUT = (*arg)->evaluate( pd, code );
+
+		switch ( arg.pos() ) {
+			case 0:
+				if ( argUT != pd->uniqueTypeInt )
+					error(loc) << "first arg, id, must be an int" << endp;
+				break;
+			case 1:
+				if ( argUT != pd->uniqueTypeStr )
+					error(loc) << "second arg, length, must be a string" << endp;
+				break;
+			default:
+				break;
+		}
+	}
+
+	/* Emit the instruction along with the number of arguments. */
+	code.append( IN_MAKE_TOKEN );
+	code.append( args->length() );
+
+	return pd->uniqueTypeAny;
+}
+
+/* Generate code for make_tree, which is allowed only when compiling a
+ * translation block. At least one argument is required and the first must
+ * be an int. Every argument is evaluated in order, then IN_MAKE_TREE is
+ * emitted with the argument count. */
+UniqueType *LangTerm::evaluateMakeTree( ParseData *pd, CodeVect &code )
+{
+	const bool inTranslation = 
+			pd->compileContext == ParseData::CompileTranslation;
+	if ( !inTranslation )
+		error(loc) << "make_tree can be used only in a translation block" << endp;
+
+	/* A missing argument list counts as zero arguments. */
+	int numArgs = 0;
+	if ( args != 0 )
+		numArgs = args->length();
+
+	if ( numArgs < 1 )
+		error(loc) << "need at least one argument" << endp;
+
+	/* Evaluate the arguments, checking the type of the first. */
+	for ( ExprVect::Iter arg = *args; arg.lte(); arg++ ) {
+		UniqueType *argUT = (*arg)->evaluate( pd, code );
+
+		const bool isFirst = arg.pos() == 0;
+		if ( isFirst && argUT != pd->uniqueTypeInt )
+			error(loc) << "first arg, nonterm id, must be an int" << endp;
+	}
+
+	/* Emit the instruction along with the number of arguments. */
+	code.append( IN_MAKE_TREE );
+	code.append( args->length() );
+
+	return pd->uniqueTypeAny;
+}
+
+/* Compile the looping part of a for-iterator statement: advance the
+ * iterator, leave the loop when the advance yields false, run the body and
+ * jump back to the advance. Afterwards the iterator is destroyed and the
+ * iterator variable is taken out of scope.
+ *
+ * iterObjField is the local holding the iterator and iterUT supplies the
+ * advance and destroy instructions. iterVarRef is not used here.
+ *
+ * Break statements in the body land on the destroy instruction that follows
+ * the loop. Only breaks recorded while compiling this loop's body are
+ * resolved here; breaks pending on entry are preserved for the enclosing
+ * loop to resolve. */
+void LangStmt::compileForIterBody( ParseData *pd, CodeVect &code, 
+		ObjField *iterObjField, LangVarRef *iterVarRef, 
+		UniqueType *iterUT )
+{
+	/* Break jumps still pending on entry were recorded by an enclosing loop.
+	 * Set them aside, otherwise we would point them at the end of this
+	 * loop and then discard them. */
+	LongVect outerBreaks;
+	for ( LongVect::Iter brk = pd->breakJumps; brk.lte(); brk++ )
+		outerBreaks.append( *brk );
+	pd->breakJumps.empty();
+
+	/* Remember the top of the loop. */
+	long top = code.length();
+
+	/* Advance */
+	code.append( iterUT->iterDef->inAdvance );
+	code.appendHalf( iterObjField->offset );
+
+	/* Test: jump past the loop body if false. Note that we don't have the
+	 * distance yet. */
+	long jumpFalse = code.length();
+	code.append( IN_JMP_FALSE );
+	code.appendHalf( 0 );
+
+	/*
+	 * Set up the loop cleanup code. 
+	 */
+
+	/* Start from the cleanup of the enclosing loops, if there are any. */
+	CodeVect loopCleanup;
+	if ( pd->loopCleanup != 0 )
+		loopCleanup.setAs( *pd->loopCleanup );
+
+	/* Add the cleanup for the current loop. */
+	loopCleanup.append( iterUT->iterDef->inDestroy );
+	loopCleanup.appendHalf( iterObjField->offset );
+
+	/* Push the loop cleanup. */
+	CodeVect *oldLoopCleanup = pd->loopCleanup;
+	pd->loopCleanup = &loopCleanup;
+
+	/* Compile the contents. */
+	for ( StmtList::Iter stmt = *stmtList; stmt.lte(); stmt++ )
+		stmt->compile( pd, code );
+
+	/* Pop the loop cleanup. */
+	pd->loopCleanup = oldLoopCleanup;
+
+	/* Jump back to the top to retest. The three accounts for the jump
+	 * instruction itself: an opcode and a half-word operand. */
+	long retestDist = code.length() - top + 3;
+	code.append( IN_JMP );
+	code.appendHalf( -retestDist );
+
+	/* Set the jump false distance. */
+	long falseDist = code.length() - jumpFalse - 3;
+	code.setHalf( jumpFalse+1, falseDist );
+
+	/* Compute the jump distance for the break jumps of this loop. */
+	for ( LongVect::Iter brk = pd->breakJumps; brk.lte(); brk++ ) {
+		long distance = code.length() - *brk - 3;
+		code.setHalf( *brk+1, distance );
+	}
+	pd->breakJumps.empty();
+
+	/* Give the enclosing loop its pending break jumps back. */
+	for ( LongVect::Iter brk = outerBreaks; brk.lte(); brk++ )
+		pd->breakJumps.append( *brk );
+
+	/* Destroy the iterator. */
+	code.append( iterUT->iterDef->inDestroy );
+	code.appendHalf( iterObjField->offset );
+
+	unscopeIterVariable( pd, iterObjField );
+}
+
+/* Declare the iterator variable, named by this statement, in the current
+ * local frame. Reports an error if the name is already present there.
+ * Returns the new field. */
+ObjField *LangStmt::createIterVariable( ParseData *pd, TypeRef *iterTypeRef )
+{
+	/* The name must not be taken already. */
+	const bool redeclared = 
+			pd->curLocalFrame->objFieldMap->find( name ) != 0;
+	if ( redeclared )
+		error(loc) << "variable " << name << " redeclared" << endp;
+
+	/* Make the field, put it into the field map of the frame and have the
+	 * frame initialize it. */
+	ObjField *newField = new ObjField( loc, iterTypeRef, name );
+	pd->curLocalFrame->objFieldMap->insert( name, newField );
+	pd->curLocalFrame->initField( pd, newField );
+
+	return newField;
+}
+
+/* Take the iterator variable out of scope by detaching this statement's
+ * name from the field map of the current local frame. The iterObjField
+ * argument is not consulted. */
+void LangStmt::unscopeIterVariable( ParseData *pd, ObjField *iterObjField )
+{
+	ObjFieldMap *frameFields = pd->curLocalFrame->objFieldMap;
+	frameFields->detach( name );
+}
+
+/* Build the method call term used when a for statement iterates over a
+ * plain variable instead of an explicit iterator call. The variable must
+ * live in a frame object and be a tree, ref, iter or ptr. The result is a
+ * call of "triter" with the variable as its only argument. */
+LangTerm *LangStmt::chooseDefaultIter( ParseData *pd )
+{
+	/* Look up the root of the iteration. Its type picks the iterator. */
+	VarRefLookup root = langTerm->varRef->lookupField( pd );
+	
+	if ( root.inObject->type != ObjectDef::FrameType )
+		error(loc) << "root of iteration must be a local" << endp;
+	
+	const bool hasDefaultIter = 
+			root.uniqueType->typeId == TYPE_TREE || 
+			root.uniqueType->typeId == TYPE_REF ||
+			root.uniqueType->typeId == TYPE_ITER ||
+			root.uniqueType->typeId == TYPE_PTR;
+
+	/* The iterator name. */
+	LangVarRef *iterName = 0;
+	if ( !hasDefaultIter ) {
+		error(loc) << "there is no default iterator for a "
+				"root of that type" << endp;
+	}
+	else {
+		iterName = new LangVarRef( loc, new QualItemVect, "triter" );
+	}
+
+	/* The parameters: just the variable being iterated. */
+	ExprVect *iterArgs = new ExprVect;
+	iterArgs->append( new LangExpr( new LangTerm( 
+			LangTerm::VarRefType, langTerm->varRef ) ) );
+
+	return new LangTerm( iterName, iterArgs );
+}
+
+/* Compile a for-iterator statement. When the thing iterated is not a method
+ * call, a default iterator call is substituted. The iterator variable is
+ * declared, the call arguments are evaluated, the iterator create
+ * instruction is emitted and then the loop itself is compiled. */
+void LangStmt::compileForIter( ParseData *pd, CodeVect &code )
+{
+	/* Anything other than a method call gets the default iterator. */
+	if ( langTerm->type != LangTerm::MethodCallType )
+		langTerm = chooseDefaultIter( pd );
+
+	/* The type we are searching for. */
+	UniqueType *searchUT = typeRef->lookupType( pd );
+
+	/* The method being called must be an iterator. */
+	VarRefLookup iterCall = langTerm->varRef->lookupMethod( pd );
+	if ( iterCall.objMethod->iterDef == 0 ) {
+		error(loc) << "attempt to iterate using something "
+				"that is not an iterator" << endp;
+	}
+
+	/* Declare the iterator variable. */
+	TypeRef *iterTypeRef = new TypeRef( loc, iterCall.objMethod->iterDef, typeRef );
+	ObjField *iterField = createIterVariable( pd, iterTypeRef );
+
+	/* A reference to the iterator variable and the type of the iterator. */
+	LangVarRef *iterVarRef = new LangVarRef( loc, new QualItemVect, name ); 
+	UniqueType *iterUT = iterTypeRef->lookupType( pd );
+
+	/* Evaluate and push the arguments. */
+	ObjField **paramRefs = langTerm->varRef->evaluateArgs( 
+			pd, code, iterCall, langTerm->args );
+
+	/* Create the iterator. The operands are the offset of the iterator
+	 * variable, the function id if the method has a function, and the id
+	 * of the search type if the iterator uses one. */
+	code.append( iterUT->iterDef->inCreate );
+	code.appendHalf( iterField->offset );
+
+	if ( iterCall.objMethod->func != 0 )
+		code.appendHalf( iterCall.objMethod->func->funcId );
+
+	if ( iterUT->iterDef->useSearchUT ) {
+		code.appendHalf( searchUT->typeId == TYPE_PTR 
+				? pd->uniqueTypePtr->langEl->id
+				: searchUT->langEl->id );
+	}
+
+	compileForIterBody( pd, code, iterField, iterVarRef, iterUT );
+
+	/* Done with the references taken for the arguments. */
+	langTerm->varRef->resetActiveRefs( pd, iterCall, paramRefs );
+	delete[] paramRefs;
+}
+
+/* Compile a while loop: the test, a jump past the body taken when the test
+ * is false, the body, and a jump back up to the test.
+ *
+ * Break statements in the body land just past the loop. Only breaks recorded
+ * while compiling this loop's body are resolved here; breaks pending on
+ * entry are preserved for the enclosing loop to resolve. */
+void LangStmt::compileWhile( ParseData *pd, CodeVect &code )
+{
+	/* Break jumps still pending on entry were recorded by an enclosing loop.
+	 * Set them aside, otherwise we would point them at the end of this
+	 * loop and then discard them. */
+	LongVect outerBreaks;
+	for ( LongVect::Iter brk = pd->breakJumps; brk.lte(); brk++ )
+		outerBreaks.append( *brk );
+	pd->breakJumps.empty();
+
+	/* Generate code for the while test. Remember the top. */
+	long top = code.length();
+	expr->evaluate( pd, code );
+
+	/* Jump past the while block if false. Note that we don't have the
+	 * distance yet. */
+	long jumpFalse = code.length();
+	code.append( IN_JMP_FALSE );
+	code.appendHalf( 0 );
+
+	/* Compile the while block. */
+	for ( StmtList::Iter stmt = *stmtList; stmt.lte(); stmt++ )
+		stmt->compile( pd, code );
+
+	/* Jump back to the top to retest. The three accounts for the jump
+	 * instruction itself: an opcode and a half-word operand. */
+	long retestDist = code.length() - top + 3;
+	code.append( IN_JMP );
+	code.appendHalf( -retestDist );
+
+	/* Set the jump false distance. */
+	long falseDist = code.length() - jumpFalse - 3;
+	code.setHalf( jumpFalse+1, falseDist );
+
+	/* Compute the jump distance for the break jumps of this loop. */
+	for ( LongVect::Iter brk = pd->breakJumps; brk.lte(); brk++ ) {
+		long distance = code.length() - *brk - 3;
+		code.setHalf( *brk+1, distance );
+	}
+	pd->breakJumps.empty();
+
+	/* Give the enclosing loop its pending break jumps back. */
+	for ( LongVect::Iter brk = outerBreaks; brk.lte(); brk++ )
+		pd->breakJumps.append( *brk );
+}
+
+/* Generate the code for this statement, dispatching on the kind of
+ * statement. Forward jumps are emitted with a zero distance and patched
+ * once the target is known. Return and break jumps are recorded in
+ * pd->returnJumps and pd->breakJumps to be patched by someone else. */
+void LangStmt::compile( ParseData *pd, CodeVect &code )
+{
+	switch ( type ) {
+		case PrintType: 
+		case PrintXMLType: {
+			/* Push the args backwards. The types that come back are not
+			 * needed. */
+			for ( ExprVect::Iter pex = exprPtrVect->last(); pex.gtb(); pex-- )
+				(*pex)->evaluate( pd, code );
+
+			/* Run the printing forwards, one print instruction for each
+			 * argument. */
+			if ( type == PrintType ) {
+				for ( ExprVect::Iter pex = *exprPtrVect; pex.lte(); pex++ )
+					code.append( IN_PRINT );
+			}
+			else {
+				for ( ExprVect::Iter pex = *exprPtrVect; pex.lte(); pex++ )
+					code.append( IN_PRINT_XML );
+			}
+
+			break;
+		}
+		case ExprType: {
+			/* Evaluate the expression, then pop it immediately. */
+			expr->evaluate( pd, code );
+			code.append( IN_POP );
+			break;
+		}
+		case IfType: {
+			/* Evaluate the test. */
+			expr->evaluate( pd, code );
+
+			/* Jump past the if block if false. We don't know the distance
+			 * yet so store the location of the jump. */
+			long jumpFalse = code.length();
+			code.append( IN_JMP_FALSE );
+			code.appendHalf( 0 );
+
+			/* Compile the if true branch. */
+			for ( StmtList::Iter stmt = *stmtList; stmt.lte(); stmt++ )
+				stmt->compile( pd, code );
+
+			/* Only meaningful when there is an else part. */
+			long jumpPastElse = 0;
+			if ( elsePart != 0 ) {
+				/* Jump past the else code for the if true branch. */
+				jumpPastElse = code.length();
+				code.append( IN_JMP );
+				code.appendHalf( 0 );
+			}
+
+			/* Set the distance for the jump false case. The three accounts
+			 * for the jump opcode and its half-word operand. */
+			long distance = code.length() - jumpFalse - 3;
+			code.setHalf( jumpFalse+1, distance );
+
+			if ( elsePart != 0 ) {
+				/* Compile the else branch. */
+				for ( StmtList::Iter stmt = *elsePart; stmt.lte(); stmt++ )
+					stmt->compile( pd, code );
+
+				/* Set the distance for jump over the else part. */
+				distance = code.length() - jumpPastElse - 3;
+				code.setHalf( jumpPastElse+1, distance );
+			}
+
+			break;
+		}
+		case RejectType: {
+			code.append( IN_REJECT );
+			break;
+		}
+		case WhileType: {
+			compileWhile( pd, code );
+			break;
+		}
+		case AssignType: {
+			/* Evaluate the expression. */
+			UniqueType *exprUT = expr->evaluate( pd, code );
+
+			/* Do the assignment. */
+			varRef->assignValue( pd, code, exprUT );
+			break;
+		}
+		case ForIterType: {
+			compileForIter( pd, code );
+			break;
+		}
+		case ReturnType: {
+			/* Evaluate the expression. */
+			UniqueType *exprUT = expr->evaluate( pd, code );
+
+			/* The value must be assignable to the return type of the
+			 * function being compiled. */
+			UniqueType *resUT = pd->curFunction->typeRef->lookupType( pd );
+			if ( !castAssignment( pd, code, resUT, 0, exprUT ) )
+				error(loc) << "return value wrong type" << endp;
+
+			code.append( IN_SAVE_RET );
+
+			/* The loop cleanup code. */
+			if ( pd->loopCleanup != 0 )
+				code.append( *pd->loopCleanup );
+
+			/* Jump to the return label. The distance will be filled in
+			 * later. */
+			pd->returnJumps.append( code.length() );
+			code.append( IN_JMP );
+			code.appendHalf( 0 );
+			break;
+		}
+		case BreakType: {
+			/* Record the jump. The loop being compiled fills in the
+			 * distance. */
+			pd->breakJumps.append( code.length() );
+			code.append( IN_JMP );
+			code.appendHalf( 0 );
+			break;
+		}
+		case YieldType: {
+			/* Take a reference and yield it. Immediately reset the
+			 * reference. */
+			ObjField *objField = varRef->evaluateRef( pd, code );
+			objField->refActive = false;
+			code.append( IN_YIELD );
+			break;
+		}
+	}
+}
+
+/* Compile the statements of the block, in order, appending to code. */
+void CodeBlock::compile( ParseData *pd, CodeVect &code )
+{
+	StmtList::Iter cur = *stmtList;
+	while ( cur.lte() ) {
+		cur->compile( pd, code );
+		cur++;
+	}
+}
+
+/* Add the "lhs" variable to the local frame of a reduction action. It has
+ * the tree type of the nonterminal and uses the local variable
+ * instructions. */
+void ParseData::addProdRedObjectVar( ObjectDef *localFrame, KlangEl *nonTerm )
+{
+	UniqueType *lhsUT = findUniqueType( TYPE_TREE, nonTerm );
+	ObjField *lhsField = new ObjField( InputLoc(), 
+			new TypeRef( InputLoc(), lhsUT ), "lhs" );
+
+	initLocalInstructions( lhsField );
+
+	/* Is the only item pushed to the stack just before a reduction action is
+	 * executed. We rely on a zero offset. */
+	lhsField->offset = 0;
+	lhsField->isLhsEl = true;
+	lhsField->beenReferenced = true;
+	lhsField->beenInitialized = true;
+
+	localFrame->objFieldMap->insert( lhsField->name, lhsField );
+}
+
+/* Add a variable to the local frame for each right hand side element of a
+ * production that is a reference. The variables are named by position,
+ * counting every element and starting at one: r1, r2 and so on. They are
+ * const and read with IN_GET_LOCAL_R. The field made for an element is also
+ * stored in the element itself. */
+void ParseData::addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList )
+{
+	long position = 1;
+	for ( ProdElList::Iter rhsEl = *prodElList; rhsEl.lte(); rhsEl++, position++ ) {
+		if ( rhsEl->type == PdaFactor::ReferenceType ) {
+			TypeRef *typeRef = new TypeRef( rhsEl->loc, rhsEl->nspaceQual, rhsEl->refName );
+
+			/* The position is a long, so it must be formatted with %ld.
+			 * Handing a long to %d does not match the conversion. */
+			String name( 8, "r%ld", position );
+
+			/* No offset is set here. For frame objects we compute the
+			 * offset on demand. */
+			ObjField *el = new ObjField( InputLoc(), typeRef, name );
+			rhsEl->objField = el;
+
+			/* Right hand side elements are constant. */
+			el->isConst = true;
+			el->isRhsEl = true;
+
+			/* Only ever fetch for reading since they are constant. */
+			el->inGetR = IN_GET_LOCAL_R;
+
+			localFrame->objFieldMap->insert( el->name, el );
+		}
+	}
+}
+
+/* Build the instructions that initialize the right hand side variables a
+ * reduction action has referenced and insert them into the reduction code
+ * at codeInsertPos. Each load names the position of the element, counting
+ * from zero, and the offset of its variable. */
+void ParseData::addProdRHSLoads( Definition *prod, long codeInsertPos )
+{
+	CodeVect loads;
+
+	long pos = 0;
+	ProdElList::Iter el = *prod->prodElList;
+	while ( el.lte() ) {
+		/* Only references that the action has used need a load. */
+		if ( el->type == PdaFactor::ReferenceType && 
+				el->objField->beenReferenced )
+		{
+			loads.append ( IN_INIT_RHS_EL );
+			loads.appendHalf( pos );
+			loads.appendHalf( el->objField->offset );
+		}
+
+		el++;
+		pos++;
+	}
+
+	prod->redBlock->code.insert( codeInsertPos, loads );
+}
+
+/* Add the const int field "match_length" to the frame. It is read with
+ * IN_GET_MATCH_LENGTH_R and does not use an offset. The lel argument is not
+ * consulted. */
+void ParseData::addMatchLength( ObjectDef *frame, KlangEl *lel )
+{
+	ObjField *lengthField = new ObjField( InputLoc(), 
+			new TypeRef( InputLoc(), uniqueTypeInt ), "match_length" );
+
+	/* Read only, fetched with its own instruction. */
+	lengthField->inGetR = IN_GET_MATCH_LENGTH_R;
+	lengthField->useOffset = false;
+	lengthField->isConst = true;
+
+	/* Marked as referenced and initialized from the outset. */
+	lengthField->beenInitialized = true;
+	lengthField->beenReferenced = true;
+
+	frame->objFieldMap->insert( lengthField->name, lengthField );
+}
+
+/* Add the const string field "match_text" to the frame. It is read with
+ * IN_GET_MATCH_TEXT_R and does not use an offset. The lel argument is not
+ * consulted. */
+void ParseData::addMatchText( ObjectDef *frame, KlangEl *lel )
+{
+	ObjField *textField = new ObjField( InputLoc(), 
+			new TypeRef( InputLoc(), uniqueTypeStr ), "match_text" );
+
+	/* Read only, fetched with its own instruction. */
+	textField->inGetR = IN_GET_MATCH_TEXT_R;
+	textField->useOffset = false;
+	textField->isConst = true;
+
+	/* Marked as referenced and initialized from the outset. */
+	textField->beenInitialized = true;
+	textField->beenReferenced = true;
+
+	frame->objFieldMap->insert( textField->name, textField );
+}
+
+/* Give the field the object-field instructions for all five of its get and
+ * set slots. */
+void ParseData::initFieldInstructions( ObjField *el )
+{
+	/* Getters. */
+	el->inGetR  = IN_GET_FIELD_R;
+	el->inGetWC = IN_GET_FIELD_WC;
+	el->inGetWV = IN_GET_FIELD_WV;
+
+	/* Setters. */
+	el->inSetWC = IN_SET_FIELD_WC;
+	el->inSetWV = IN_SET_FIELD_WV;
+}
+
+/* Give the field the local-variable instructions. Only the R and WC getters
+ * and the WC setter are assigned. The WV slots are left as they are. */
+void ParseData::initLocalInstructions( ObjField *el )
+{
+	/* Getters. */
+	el->inGetR  = IN_GET_LOCAL_R;
+	el->inGetWC = IN_GET_LOCAL_WC;
+
+	/* Setter. */
+	el->inSetWC = IN_SET_LOCAL_WC;
+}
+
+/* Give the field the local-reference instructions. Only the R and WC
+ * getters and the WC setter are assigned. The WV slots are left as they
+ * are. */
+void ParseData::initLocalRefInstructions( ObjField *el )
+{
+	/* Getters. */
+	el->inGetR  = IN_GET_LOCAL_REF_R;
+	el->inGetWC = IN_GET_LOCAL_REF_WC;
+
+	/* Setter. */
+	el->inSetWC = IN_SET_LOCAL_REF_WC;
+}
+
+/* Create the builtin object definition for "int", attach it to the int
+ * language element and register the to_string method on it. */
+void ParseData::initIntObject( )
+{
+	/* A fresh definition with empty field and method maps. */
+	intObj = new ObjectDef( ObjectDef::BuiltinType, "int", 
+			new ObjFieldMap, new ObjMethodMap, nextObjectId++ );
+	intKlangEl->objectDef = intObj;
+
+	/* The one method an int has. It results in a string. */
+	initFunction( uniqueTypeStr, intObj, "to_string", 
+			IN_INT_TO_STR, IN_INT_TO_STR, true );
+}
+
+/* Add the const int field "length" to an object definition. The caller
+ * supplies the instruction that reads it. The field does not use an
+ * offset. */
+void ParseData::addLengthField( ObjectDef *objDef, Code getLength )
+{
+	ObjField *lengthField = new ObjField( InputLoc(), 
+			new TypeRef( InputLoc(), uniqueTypeInt ), "length" );
+
+	/* Read only, fetched with the instruction we were given. */
+	lengthField->inGetR = getLength;
+	lengthField->useOffset = false;
+	lengthField->isConst = true;
+
+	/* Marked as referenced and initialized from the outset. */
+	lengthField->beenInitialized = true;
+	lengthField->beenReferenced = true;
+
+	objDef->objFieldMap->insert( lengthField->name, lengthField );
+}
+
+/* Create the builtin object definition for "str", attach it to the str
+ * language element, then register its methods and its length field. */
+void ParseData::initStrObject( )
+{
+	/* A fresh definition with empty field and method maps. */
+	strObj = new ObjectDef( ObjectDef::BuiltinType, "str", 
+			new ObjFieldMap, new ObjMethodMap, nextObjectId++ );
+	strKlangEl->objectDef = strObj;
+
+	/* String to int conversion. */
+	initFunction( uniqueTypeInt, strObj, "atoi", 
+			IN_STR_ATOI, IN_STR_ATOI, true );
+
+	/* The ord family. All of these result in an int. */
+	initFunction( uniqueTypeInt, strObj, "uord8", 
+			IN_STR_UORD8, IN_STR_UORD8, true );
+	initFunction( uniqueTypeInt, strObj, "sord8", 
+			IN_STR_SORD8, IN_STR_SORD8, true );
+	initFunction( uniqueTypeInt, strObj, "uord16", 
+			IN_STR_UORD16, IN_STR_UORD16, true );
+	initFunction( uniqueTypeInt, strObj, "sord16", 
+			IN_STR_SORD16, IN_STR_SORD16, true );
+	initFunction( uniqueTypeInt, strObj, "uord32", 
+			IN_STR_UORD32, IN_STR_UORD32, true );
+	initFunction( uniqueTypeInt, strObj, "sord32", 
+			IN_STR_SORD32, IN_STR_SORD32, true );
+
+	/* The length of the string is a field, not a method. */
+	addLengthField( strObj, IN_STR_LENGTH );
+}
+
+/* Create the builtin object definition for "stream" and attach it to the
+ * stream language element. No methods or fields are registered on it. */
+void ParseData::initStreamObject( )
+{
+	/* A fresh definition with empty field and method maps. */
+	streamObj = new ObjectDef( ObjectDef::BuiltinType, "stream", 
+			new ObjFieldMap, new ObjMethodMap, nextObjectId++ );
+	streamKlangEl->objectDef = streamObj;
+
+	/* A disabled copy of the str registrations (atoi, the ord family and
+	 * the length field, all still naming strObj) used to follow here. */
+}
+
+/* Make a string field named "data" that is read and written with the token
+ * data instructions. It does not use an offset. The caller is left to
+ * insert it into a field map. */
+ObjField *ParseData::makeDataEl()
+{
+	ObjField *dataField = new ObjField( InputLoc(), 
+			new TypeRef( InputLoc(), uniqueTypeStr ), "data" );
+
+	/* The instructions are assigned by hand and no offset is wanted. */
+	dataField->useOffset = false;
+	dataField->inGetR  = IN_GET_TOKEN_DATA_R;
+	dataField->inSetWC = IN_SET_TOKEN_DATA_WC;
+	dataField->inSetWV = IN_SET_TOKEN_DATA_WV;
+
+	/* Setting beenReferenced to true prevents us from assigning instructions
+	 * and an offset to the field. */
+	dataField->beenReferenced = true;
+	dataField->beenInitialized = true;
+
+	return dataField;
+}
+
+/* Make a const int field named "pos" that is read with the token position
+ * instruction. It does not use an offset. The caller is left to insert it
+ * into a field map. */
+ObjField *ParseData::makePosEl()
+{
+	ObjField *posField = new ObjField( InputLoc(), 
+			new TypeRef( InputLoc(), uniqueTypeInt ), "pos" );
+
+	/* Read only. The instruction is assigned by hand and no offset is
+	 * wanted. */
+	posField->isConst = true;
+	posField->useOffset = false;
+	posField->inGetR = IN_GET_TOKEN_POS_R;
+
+	/* Setting beenReferenced to true prevents us from assigning instructions
+	 * and an offset to the field. */
+	posField->beenReferenced = true;
+	posField->beenInitialized = true;
+
+	return posField;
+}
+
+/* Create the builtin "token" object definition, which has a data and a pos
+ * field, and see to it that every user terminal has those two fields. A
+ * terminal without an object definition shares the token object. A terminal
+ * with one gets its own data and pos fields added. */
+void ParseData::initTokenObjects( )
+{
+	/* Make the default object definition. */
+	tokenObj = new ObjectDef( ObjectDef::BuiltinType, "token", 
+			new ObjFieldMap, new ObjMethodMap, nextObjectId++ );
+
+	ObjField *sharedData = makeDataEl();
+	tokenObj->objFieldMap->insert( sharedData->name, sharedData );
+
+	ObjField *sharedPos = makePosEl();
+	tokenObj->objFieldMap->insert( sharedPos->name, sharedPos );
+
+	/* Go over the user terminals. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( !lel->isUserTerm )
+			continue;
+
+		/* Nothing of its own: share the token object. */
+		if ( lel->objectDef == 0 ) {
+			lel->objectDef = tokenObj;
+			continue;
+		}
+
+		/* It has its own object definition. Add fresh "data" and "pos"
+		 * fields to that. */
+		ObjField *ownData = makeDataEl();
+		lel->objectDef->objFieldMap->insert( ownData->name, ownData );
+
+		ObjField *ownPos = makePosEl();
+		lel->objectDef->objFieldMap->insert( ownPos->name, ownPos );
+	}
+}
+
+/* Collect, into trees, the offsets of the fields of the current local frame
+ * that have been referenced and that are of tree or pointer type. */
+void ParseData::findLocalTrees( CharSet &trees )
+{
+	for ( ObjFieldMap::Iter of = *curLocalFrame->objFieldMap; of.lte(); of++ ) {
+		ObjField *field = of->value;
+
+		/* We exclude "lhs" from being downrefed because we need to use it
+		 * after the frame is cleaned and so it must survive. */
+		if ( field->isLhsEl )
+			continue;
+
+		/* Fields that were never referenced are of no interest. */
+		if ( !field->beenReferenced )
+			continue;
+
+		UniqueType *fieldUT = field->typeRef->lookupType( this );
+		const bool holdsTree = 
+				fieldUT->typeId == TYPE_TREE || fieldUT->typeId == TYPE_PTR;
+		if ( holdsTree )
+			trees.insert( field->offset );
+	}
+}
+
+/* Compile the reduction action of a production into the code of its block.
+ * The action is wrapped in IN_INIT_LOCALS and IN_POP_LOCALS, the loads of
+ * the right hand side variables are inserted straight after the
+ * IN_INIT_LOCALS instruction and the code is ended with IN_STOP. */
+void ParseData::compileReductionCode( Definition *prod )
+{
+	CodeBlock *redBlock = prod->redBlock;
+	CodeVect &out = redBlock->code;
+
+	/* Init the compilation context. */
+	compileContext = CompileReduction;
+	curLocalFrame = redBlock->localFrame;
+	redBlock->frameId = nextFrameId++;
+
+	/* Add the alloc frame opcode with a zero size for now. The size goes
+	 * in once the action has been compiled. Remember where the
+	 * instruction ends: the right hand side loads belong there. */
+	out.append( IN_INIT_LOCALS );
+	out.appendHalf( 0 );
+	const long rhsLoadPos = out.length();
+
+	/* Compile the reduce block. */
+	redBlock->compile( this, out );
+
+	/* We have the frame size now. Set it in the alloc frame instruction. */
+	const long frameSize = curLocalFrame->size();
+	out.setHalf( 1, frameSize );
+
+	addProdRHSLoads( prod, rhsLoadPos );
+
+	/* Release the frame and finish. */
+	out.append( IN_POP_LOCALS );
+	out.appendHalf( redBlock->frameId );
+	out.appendHalf( frameSize );
+	out.append( IN_STOP );
+
+	/* Now that compilation is done variables are referenced. Make the local
+	 * trees descriptor. */
+	findLocalTrees( redBlock->trees );
+}
+
+/* Compile the translation block of a language element into the code of the
+ * block. The frame is first given the match_length and match_text fields
+ * and the pull, push, send and send_ignore functions. The block is wrapped
+ * in IN_INIT_LOCALS and IN_POP_LOCALS and ended with IN_STOP. */
+void ParseData::compileTranslateBlock( KlangEl *langEl )
+{
+	CodeBlock *transBlock = langEl->transBlock;
+	CodeVect &out = transBlock->code;
+
+	/* Set up compilation context. */
+	compileContext = CompileTranslation;
+	curLocalFrame = transBlock->localFrame;
+	transBlock->frameId = nextFrameId++;
+
+	/* What was matched. */
+	addMatchLength( curLocalFrame, langEl );
+	addMatchText( curLocalFrame, langEl );
+
+	/* Pulling from and pushing to a stream. */
+	initFunction( uniqueTypeStr, curLocalFrame, "pull",
+			IN_STREAM_PULL, IN_STREAM_PULL, 
+			uniqueTypeStream, uniqueTypeInt, true );
+	initFunction( uniqueTypeInt, curLocalFrame, "push",
+			IN_STREAM_PUSH, IN_STREAM_PUSH, 
+			uniqueTypeStream, uniqueTypeAny, true );
+
+	/* Sending. */
+	initFunction( uniqueTypeInt, curLocalFrame, "send",
+			IN_SEND, IN_SEND, uniqueTypeAny, true );
+	initFunction( uniqueTypeInt, curLocalFrame, "send_ignore",
+			IN_IGNORE, IN_IGNORE, uniqueTypeAny, true );
+
+	/* Add the alloc frame opcode with a zero size for now. The size goes
+	 * in once the block has been compiled. */
+	out.append( IN_INIT_LOCALS );
+	out.appendHalf( 0 );
+
+	/* Compile the translation block. */
+	transBlock->compile( this, out );
+
+	/* We have the frame size now. Set it in the alloc frame instruction. */
+	const long frameSize = curLocalFrame->size();
+	out.setHalf( 1, frameSize );
+
+	/* Release the frame and finish. */
+	out.append( IN_POP_LOCALS );
+	out.appendHalf( transBlock->frameId );
+	out.appendHalf( frameSize );
+	out.append( IN_STOP );
+
+	/* Now that compilation is done variables are referenced. Make the local
+	 * trees descriptor. */
+	findLocalTrees( transBlock->trees );
+}
+
+/* Compile the pre-eof block of a token region. The generated code is
+ * IN_INIT_LOCALS, the block body, IN_POP_LOCALS and finally IN_STOP. */
+void ParseData::compilePreEof( TokenRegion *region )
+{
+	CodeBlock *eofBlock = region->preEofBlock;
+
+	/* Establish the compilation context and claim a frame id. */
+	compileContext = CompileTranslation;
+	curLocalFrame = eofBlock->localFrame;
+	eofBlock->frameId = nextFrameId++;
+
+	/* Disabled for pre-eof blocks: match length, match text and "pull". */
+//	addMatchLength( curLocalFrame, langEl );
+//	addMatchText( curLocalFrame, langEl );
+//	initFunction( uniqueTypeStr, curLocalFrame, "pull",
+//			IN_STREAM_PULL, IN_STREAM_PULL, uniqueTypeStream, uniqueTypeInt, true );
+
+	/* Functions added to the frame: send and send_ignore. */
+	initFunction( uniqueTypeInt, curLocalFrame, "send",
+			IN_SEND, IN_SEND, uniqueTypeAny, true );
+	initFunction( uniqueTypeInt, curLocalFrame, "send_ignore",
+			IN_IGNORE, IN_IGNORE, uniqueTypeAny, true );
+
+	/* Emit the frame init with a zero placeholder where the frame size
+	 * goes. The size is only known once the body has been compiled. */
+	eofBlock->code.append( IN_INIT_LOCALS );
+	eofBlock->code.appendHalf( 0 );
+
+	/* Compile the body, then patch in the real frame size. */
+	eofBlock->compile( this, eofBlock->code );
+	long localsSize = curLocalFrame->size();
+	eofBlock->code.setHalf( 1, localsSize );
+
+	eofBlock->code.append( IN_POP_LOCALS );
+	eofBlock->code.appendHalf( eofBlock->frameId );
+	eofBlock->code.appendHalf( localsSize );
+	eofBlock->code.append( IN_STOP );
+
+	/* Compilation has marked which variables are referenced, so the local
+	 * trees descriptor can be built now. */
+	findLocalTrees( eofBlock->trees );
+}
+
+/* Compile the root code block. The generated code is IN_INIT_LOCALS, the
+ * block body, IN_POP_LOCALS and finally IN_STOP. */
+void ParseData::compileRootBlock( )
+{
+	CodeBlock *root = rootCodeBlock;
+
+	/* The root block is compiled against rootLocalFrame in the CompileRoot
+	 * context. */
+	compileContext = CompileRoot;
+	curLocalFrame = rootLocalFrame;
+	root->frameId = nextFrameId++;
+
+	/* Emit the frame init with a zero placeholder where the frame size
+	 * goes. The size is only known once the body has been compiled. */
+	root->code.append( IN_INIT_LOCALS );
+	root->code.appendHalf( 0 );
+
+	/* Compile the body, then patch in the real frame size. */
+	root->compile( this, root->code );
+	long localsSize = curLocalFrame->size();
+	root->code.setHalf( 1, localsSize );
+
+	root->code.append( IN_POP_LOCALS );
+	root->code.appendHalf( root->frameId );
+	root->code.appendHalf( localsSize );
+	root->code.append( IN_STOP );
+
+	/* Build the local trees descriptor for the block. */
+	findLocalTrees( root->trees );
+}
+
+/* Run initField over every field of each language element's object
+ * definition, then over the fields of the global object. */
+void ParseData::initAllLanguageObjects()
+{
+	/* User objects first. Elements without an object def are skipped. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		ObjectDef *objDef = lel->objectDef;
+		if ( objDef == 0 )
+			continue;
+		for ( ObjFieldMap::Iter fld = *objDef->objFieldMap; fld.lte(); fld++ )
+			objDef->initField( this, fld->value );
+	}
+
+	for ( ObjFieldMap::Iter fld = *globalObjectDef->objFieldMap; fld.lte(); fld++ )
+		globalObjectDef->initField( this, fld->value );
+}
+
+/* Add the length field and the find, insert, store and remove functions. */
+void ParseData::initMapFunctions( GenericType *gen )
+{
+	addLengthField( gen->objDef, IN_MAP_LENGTH );
+	initFunction( gen->utArg, gen->objDef, "find", IN_MAP_FIND, IN_MAP_FIND, gen->keyUT, true );
+	initFunction( uniqueTypeInt, gen->objDef, "insert", IN_MAP_INSERT_WC,
+			IN_MAP_INSERT_WV, gen->keyUT, gen->utArg, false );
+	initFunction( uniqueTypeInt, gen->objDef, "store", IN_MAP_STORE_WC,
+			IN_MAP_STORE_WV, gen->keyUT, gen->utArg, false );
+	initFunction( gen->utArg, gen->objDef, "remove", IN_MAP_REMOVE_WC,
+			IN_MAP_REMOVE_WV, gen->keyUT, false );
+}
+
+/* List members: length, append (alias push) and remove_end (alias pop). */
+void ParseData::initListFunctions( GenericType *gen )
+{
+	ObjectDef *listObj = gen->objDef;
+	addLengthField( listObj, IN_LIST_LENGTH );
+	initFunction( uniqueTypeInt, listObj, "append",
+			IN_LIST_APPEND_WC, IN_LIST_APPEND_WV, gen->utArg, false );
+	initFunction( uniqueTypeInt, listObj, "push",
+			IN_LIST_APPEND_WC, IN_LIST_APPEND_WV, gen->utArg, false );
+	initFunction( gen->utArg, listObj, "remove_end",
+			IN_LIST_REMOVE_END_WC, IN_LIST_REMOVE_END_WV, false );
+	initFunction( gen->utArg, listObj, "pop",
+			IN_LIST_REMOVE_END_WC, IN_LIST_REMOVE_END_WV, false );
+}
+
+/* Add a field called name, typed by gen->utArg, to a list generic. It uses
+ * the list member instructions; offset is zero for head and one for tail. */
+void ParseData::initListField( GenericType *gen, const char *name, int offset )
+{
+	TypeRef *fieldType = new TypeRef( InputLoc(), gen->utArg );
+	ObjField *field = new ObjField( InputLoc(), fieldType, name );
+
+	field->inGetR =  IN_GET_LIST_MEM_R;
+	field->inGetWC = IN_GET_LIST_MEM_WC;
+	field->inGetWV = IN_GET_LIST_MEM_WV;
+	field->inSetWC = IN_SET_LIST_MEM_WC;
+	field->inSetWV = IN_SET_LIST_MEM_WV;
+
+	gen->objDef->objFieldMap->insert( field->name, field );
+
+	/* Addressed by offset; marked referenced and initialized up front. */
+	field->useOffset = true;
+	field->offset = offset;
+	field->beenReferenced = true;
+	field->beenInitialized = true;
+}
+
+void ParseData::initListFields( GenericType *gen )
+{
+	initListField( gen, "head", 0 );	/* Offset zero. */
+	initListField( gen, "tail", 1 );	/* Offset one. */
+	initListField( gen, "top", 1 );	/* Same offset as "tail". */
+}
+
+void ParseData::initVectorFunctions( GenericType *gen )
+{
+	addLengthField( gen->objDef, IN_VECTOR_LENGTH );	/* Vector members: length, append, insert. */
+	initFunction( uniqueTypeInt, gen->objDef, "append", 
+			IN_VECTOR_APPEND_WC, IN_VECTOR_APPEND_WV, gen->utArg, false );
+	initFunction( uniqueTypeInt, gen->objDef, "insert", 
+			IN_VECTOR_INSERT_WC, IN_VECTOR_INSERT_WV, uniqueTypeInt, gen->utArg, false ); /* NOTE(review): extra int is presumably the position -- confirm */
+}
+
+/* For every generic in every namespace: resolve its type arguments, build
+ * its builtin object definition and attach that to its language element. */
+void ParseData::resolveGenericTypes()
+{
+	for ( NamespaceList::Iter ns = namespaceList; ns.lte(); ns++ ) {
+		for ( GenericList::Iter gen = ns->genericList; gen.lte(); gen++ ) {
+			/* Only maps have a key type to look up. */
+			gen->utArg = gen->typeArg->lookupType( this );
+			if ( gen->typeId == GEN_MAP )
+				gen->keyUT = gen->keyTypeArg->lookupType( this );
+
+			/* The object starts with empty field and method maps. */
+			ObjFieldMap *fields = new ObjFieldMap;
+			ObjMethodMap *methods = new ObjMethodMap;
+			gen->objDef = new ObjectDef( ObjectDef::BuiltinType,
+					gen->name, fields, methods, nextObjectId++ );
+
+			/* Fill in the members that go with the kind of generic. */
+			if ( gen->typeId == GEN_MAP )
+				initMapFunctions( gen );
+			else if ( gen->typeId == GEN_LIST ) {
+				initListFunctions( gen );
+				initListFields( gen );
+			}
+			else if ( gen->typeId == GEN_VECTOR )
+				initVectorFunctions( gen );
+
+			gen->langEl->objectDef = gen->objDef;
+		}
+	}
+}
+
+void ParseData::makeFuncVisible( Function *func, bool isUserIter )
+{
+	/* Set up func's params in its local frame, then register it globally. */
+	curLocalFrame = func->codeBlock->localFrame;
+	func->localFrame = func->codeBlock->localFrame;
+
+	/* First pass: look up each param's type and enter it in the frame. */
+	long paramPos = 0, paramListSize = 0;
+	UniqueType **paramUTs = new UniqueType*[func->paramList->length()];
+	for ( ParameterList::Iter param = *func->paramList; param.lte(); param++ ) {
+		paramUTs[paramPos] = param->typeRef->lookupType( this );
+
+		if ( func->localFrame->objFieldMap->find( param->name ) != 0 )
+			error(param->loc) << "parameter " << param->name << " redeclared" << endp;
+
+		func->localFrame->objFieldMap->insert( param->name, param );
+		param->beenInitialized = true;
+		param->pos = paramPos;
+
+		/* Initialize the object field as a local variable (TYPE_REF params
+		 * get the local-ref variant). We also want trees downreffed. */
+		if ( paramUTs[paramPos]->typeId == TYPE_REF )
+			initLocalRefInstructions( param );
+		else
+			initLocalInstructions( param );
+
+		paramListSize += sizeOfField( paramUTs[paramPos] );
+		paramPos += 1;
+	}
+
+	/* Second pass: param offset is relative to one past the last item in
+	 * the array of words containing the args. */
+	long paramOffset = 0;
+	for ( ParameterList::Iter param = *func->paramList; param.lte(); param++ ) {
+
+		/* Moving downward, and need the offset to point to the lower half of
+		 * the argument. */
+		paramOffset -= sizeOfField( paramUTs[param->pos] );
+
+		/* How much space do we need to make for call overhead. */
+		long frameAfterArgs = isUserIter ? IFR_AA : FR_AA;
+
+		/* Going up first we have the frame data, then maybe
+		 * the user iterator, then the args from high to low. */
+		param->offset = frameAfterArgs + 
+				( isUserIter ? ( sizeof(UserIter) / sizeof(Word) ) : 0 ) +
+				paramListSize + paramOffset;
+	}
+
+	func->paramListSize = paramListSize;
+	func->paramUTs = paramUTs;
+
+	/* Insert the function into the global function map. With no declared
+	 * return type (typeRef is null) the return type is int. */
+	UniqueType *returnUT = func->typeRef != 0 ? 
+			func->typeRef->lookupType(this) : uniqueTypeInt;
+	ObjMethod *objMethod = new ObjMethod( returnUT, func->name, 
+			IN_CALL, IN_CALL, 
+			func->paramList->length(), paramUTs, func->paramList, false );
+	objMethod->funcId = func->funcId;
+	objMethod->useFuncId = true;
+	objMethod->useCallObj = false;
+	objMethod->func = func;
+
+	if ( isUserIter ) {
+		IterDef *uiter = findIterDef( IterDef::User, func );
+		objMethod->iterDef = uiter;
+	}
+
+	globalObjectDef->objMethodMap->insert( func->name, objMethod );
+}
+
+/* Compile the body of a user iterator. The code opens with IN_INIT_LOCALS;
+ * a body not ending in a yield statement finishes by yielding nil. */
+void ParseData::compileUserIter( Function *func )
+{
+	CodeBlock *body = func->codeBlock;
+
+	compileContext = CompileFunction;
+	curFunction = func;
+	body->frameId = nextFrameId++;
+
+	/* The true says this function is a user iterator. */
+	makeFuncVisible( func, true );
+
+	/* Emit the frame init with a zero placeholder where the frame size
+	 * goes. The size is only known once the body has been compiled. */
+	body->code.append( IN_INIT_LOCALS );
+	body->code.appendHalf( 0 );
+
+	/* Compile the body, then patch in the real frame size. */
+	body->compile( this, body->code );
+	int localsSize = func->localFrame->size();
+	body->code.setHalf( 1, localsSize );
+
+	/* An empty body, or one not ending in a yield statement, gets a
+	 * trailing yield of nil. */
+	bool endsInYield = body->stmtList->length() != 0 &&
+			body->stmtList->tail->type == LangStmt::YieldType;
+	if ( !endsInYield ) {
+		body->code.append( IN_LOAD_NIL );
+		body->code.append( IN_YIELD );
+	}
+
+	/* Variables are referenced now; build the local trees descriptor. */
+	findLocalTrees( body->trees );
+
+	/* FIXME: Need to deal with the freeing of local trees. */
+}
+
+/* Compile a function body. The code opens with IN_INIT_LOCALS and closes
+ * with IN_RET; a body not ending in a return statement returns nil. */
+void ParseData::compileFunction( Function *func )
+{
+	CodeBlock *body = func->codeBlock;
+
+	compileContext = CompileFunction;
+	curFunction = func;
+	body->frameId = nextFrameId++;
+
+	/* The false says this function is not a user iterator. */
+	makeFuncVisible( func, false );
+
+	/* Emit the frame init with a zero placeholder where the frame size
+	 * goes. The size is only known once the body has been compiled. */
+	body->code.append( IN_INIT_LOCALS );
+	body->code.appendHalf( 0 );
+
+	/* Compile the body, then patch in the real frame size. */
+	body->compile( this, body->code );
+	int localsSize = func->localFrame->size();
+	body->code.setHalf( 1, localsSize );
+
+	/* An empty body, or one not ending in a return, saves nil as the
+	 * return value. */
+	bool endsInReturn = body->stmtList->length() != 0 &&
+			body->stmtList->tail->type == LangStmt::ReturnType;
+	if ( !endsInReturn ) {
+		body->code.append( IN_LOAD_NIL );
+		body->code.append( IN_SAVE_RET );
+	}
+
+	/* Point every recorded return jump at the IN_RET emitted below. The 3
+	 * presumably covers the jump itself: an opcode plus a half operand. */
+	for ( LongVect::Iter jump = returnJumps; jump.lte(); jump++ ) {
+		long jumpPos = *jump;
+		long distance = body->code.length() - jumpPos - 3;
+		body->code.setHalf( jumpPos + 1, distance );
+	}
+	returnJumps.empty();	/* Resets the vector of return jumps. */
+
+	/* Return cleans up the stack, args included, and leaves the return
+	 * value on top. */
+	body->code.append( IN_RET );
+	body->code.appendHalf( func->funcId );
+
+	/* Variables are referenced now; build the local trees descriptor. */
+	findLocalTrees( body->trees );
+}
+
+/* Register the builtin iterators "triter", "child" and "rev_child" on the
+ * global object and attach the matching iterator definition to each. All
+ * three are registered with IN_HALT in both instruction slots. */
+void ParseData::makeDefaultIterators()
+{
+	/* Tree iterator. */
+	{
+		UniqueType *argUT = findUniqueType( TYPE_REF, anyKlangEl );
+		ObjMethod *method = initFunction( uniqueTypeAny, globalObjectDef,
+				"triter", IN_HALT, IN_HALT, argUT, true );
+		IterDef *iterDef = findIterDef( IterDef::Tree );
+		method->iterDef = iterDef;
+	}
+
+	/* Child iterator. */
+	{
+		UniqueType *argUT = findUniqueType( TYPE_REF, anyKlangEl );
+		ObjMethod *method = initFunction( uniqueTypeAny, globalObjectDef,
+				"child", IN_HALT, IN_HALT, argUT, true );
+		IterDef *iterDef = findIterDef( IterDef::Child );
+		method->iterDef = iterDef;
+	}
+
+	/* Reverse child iterator. */
+	{
+		UniqueType *argUT = findUniqueType( TYPE_REF, anyKlangEl );
+		ObjMethod *method = initFunction( uniqueTypeAny, globalObjectDef,
+				"rev_child", IN_HALT, IN_HALT, argUT, true );
+		IterDef *iterDef = findIterDef( IterDef::RevChild );
+		method->iterDef = iterDef;
+	}
+}
+
+/* Add the constant "stdin" field, typed as a stream, to the global object.
+ * It is read with IN_GET_STDIN and is not addressed by offset. */
+void ParseData::addStdin()
+{
+	TypeRef *streamRef = new TypeRef( InputLoc(), uniqueTypeStream );
+	ObjField *field = new ObjField( InputLoc(), streamRef, "stdin" );
+
+	field->inGetR = IN_GET_STDIN;
+	field->useOffset = false;
+	field->isConst = true;
+	field->beenReferenced = true;
+	field->beenInitialized = true;
+	globalObjectDef->objFieldMap->insert( field->name, field );
+}
+
+/* Add the constant "stdout" field, read with IN_GET_STDOUT, to the global
+ * object. The old misspelling "stout" is still registered as an alias. */
+void ParseData::addStdout()
+{
+	const char *names[] = { "stdout", "stout" };
+	for ( int n = 0; n < 2; n++ ) {
+		TypeRef *typeRef = new TypeRef( InputLoc(), uniqueTypeStr );
+		ObjField *el = new ObjField( InputLoc(), typeRef, names[n] );
+		el->beenReferenced = el->beenInitialized = el->isConst = true;
+		el->useOffset = false;
+		el->inGetR = IN_GET_STDOUT;
+		globalObjectDef->objFieldMap->insert( el->name, el );
+	}
+}
+
+/* Add the constant "stderr" field, typed as a str, to the global object.
+ * It is read with IN_GET_STDERR and is not addressed by offset. */
+void ParseData::addStderr()
+{
+	TypeRef *strRef = new TypeRef( InputLoc(), uniqueTypeStr );
+	ObjField *field = new ObjField( InputLoc(), strRef, "stderr" );
+
+	field->inGetR = IN_GET_STDERR;
+	field->useOffset = false;
+	field->isConst = true;
+	field->beenReferenced = true;
+	field->beenInitialized = true;
+	globalObjectDef->objFieldMap->insert( field->name, field );
+}
+
+/* Register open_file and the standard stream fields on the global object. */
+void ParseData::initGlobalFunctions()
+{
+	/* open_file does not use a call object. */
+	ObjMethod *openFile = initFunction( uniqueTypeStream, globalObjectDef,
+			"open_file", IN_OPEN_FILE, IN_OPEN_FILE, uniqueTypeStr, true );
+	openFile->useCallObj = false;
+
+	addStdin();
+	addStdout();
+	addStderr();
+}
+
+/* Drive bytecode generation: set up the builtin types and objects, then
+ * compile all functions and code blocks, ending with the root block. */
+void ParseData::compileByteCode()
+{
+	initUniqueTypes();
+	initIntObject();
+	initStrObject();
+	initStreamObject();
+	initTokenObjects();
+	makeDefaultIterators();
+	initAllLanguageObjects();
+	resolveGenericTypes();
+	initGlobalFunctions();
+
+	/* The function info structure relies on functions being compiled first,
+	 * then iterators. NOTE(review): this loop simply follows functionList
+	 * order; presumably the list is already arranged that way -- confirm. */
+	for ( FunctionList::Iter func = functionList; func.lte(); func++ ) {
+		if ( !func->isUserIter )
+			compileFunction( func );
+		else
+			compileUserIter( func );
+	}
+
+	/* Reduction code, for the productions that have some. */
+	for ( DefList::Iter def = prodList; def.lte(); def++ ) {
+		if ( def->redBlock != 0 )
+			compileReductionCode( def );
+	}
+
+	/* Token translation code, for the language elements that have some. */
+	for ( LelList::Iter el = langEls; el.lte(); el++ ) {
+		if ( el->transBlock != 0 )
+			compileTranslateBlock( el );
+	}
+
+	/* Pre-eof blocks, for the regions that have one. */
+	for ( RegionList::Iter reg = regionList; reg.lte(); reg++ ) {
+		if ( reg->preEofBlock != 0 )
+			compilePreEof( reg );
+	}
+
+	/* The init code comes last. */
+	compileRootBlock( );
+}
diff --git a/colm/dotgen.cpp b/colm/dotgen.cpp
new file mode 100644
index 00000000..d362d714
--- /dev/null
+++ b/colm/dotgen.cpp
@@ -0,0 +1,369 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+
+#include "dotgen.h"
+#include "parsedata.h"
+#include "pdacodegen.h"
+
+using namespace std;
+#if 0
+
+/* Write one key to out. With printPrintables set, printable keys are written
+ * as a quoted character with '"' and '\' backslash-escaped; all other keys
+ * are written as a number, unsigned unless keyOps->isSigned. */
+std::ostream &GraphvizDotGen::KEY( Key key )
+{
+	if ( !printPrintables || !key.isPrintable() ) {
+		/* Numeric form. */
+		if ( keyOps->isSigned )
+			out << key.getVal();
+		else
+			out << (unsigned long) key.getVal();
+		return out;
+	}
+
+	/* Character form, wrapped in single quotes. */
+	char ch = (char) key.getVal();
+	out << "'";
+	if ( ch == '"' || ch == '\\' )
+		out << "\\" << ch;
+	else
+		out << ch;
+	out << "'";
+
+	return out;
+}
+
+/* Write " / " and the comma-separated actions found on a transition: the
+ * from-state action, the transition action, the target's to-state action. */
+std::ostream &GraphvizDotGen::TRANS_ACTION( RedState *fromState, RedTrans *trans )
+{
+	RedAction *found[3];
+	int numFound = 0;
+	if ( fromState->fromStateAction != 0 )
+		found[numFound++] = fromState->fromStateAction;
+	if ( trans->action != 0 )
+		found[numFound++] = trans->action;
+	if ( trans->targ != 0 && trans->targ->toStateAction != 0 )
+		found[numFound++] = trans->targ->toStateAction;
+
+	if ( numFound > 0 )
+		out << " / ";
+
+	/* A separator follows every action except the very last one. */
+	for ( int set = 0; set < numFound; set++ ) {
+		for ( GenActionTable::Iter item = found[set]->key.first(); item.lte(); item++ ) {
+			out << item->value->nameOrLoc();
+			if ( set < numFound-1 || !item.last() )
+				out << ", ";
+		}
+	}
+	return out;
+}
+
+/* Write " / " and the actions: name if set, else line:col; comma-separated. */
+std::ostream &GraphvizDotGen::ACTION( RedAction *action )
+{
+	out << " / ";
+	for ( GenActionTable::Iter item = action->key.first(); item.lte(); item++ ) {
+		GenAction *genAct = item->value;
+		if ( genAct->name == 0 )
+			out << genAct->loc.line << ":" << genAct->loc.col;
+		else
+			out << genAct->name;
+		if ( !item.last() )
+			out << ", ";
+	}
+	return out;
+}
+
+std::ostream &GraphvizDotGen::ONCHAR( Key lowKey, Key highKey )
+{
+	if ( lowKey > keyOps->maxKey ) { /* Above maxKey: the range belongs to a condition space. */
+		GenCondSpace *condSpace = redFsm->findCondSpace( lowKey, highKey );
+		Key values = ( lowKey - condSpace->baseKey ) / keyOps->alphSize();
+
+		lowKey = keyOps->minKey + 
+			(lowKey - condSpace->baseKey - keyOps->alphSize() * values.getVal());
+		highKey = keyOps->minKey + 
+			(highKey - condSpace->baseKey - keyOps->alphSize() * values.getVal());
+		KEY( lowKey ); /* Both keys are now rebased to start at minKey. */
+		if ( lowKey != highKey ) {
+			out << "..";
+			KEY( highKey );
+		}
+		out << "(";
+
+		for ( GenCondSet::Iter csi = condSpace->condSet; csi.lte(); csi++ ) {
+			bool set = values & (1 << csi.pos()); /* Bit csi.pos() of values. */
+			if ( !set )
+				out << "!";
+			out << (*csi)->nameOrLoc();
+			if ( !csi.last() )
+				out << ", ";
+		}
+		out << ")";
+	}
+	else {
+		/* Output the key, or low..high when the two ends differ. */
+		KEY( lowKey );
+		if ( highKey != lowKey ) {
+			out << "..";
+			KEY( highKey );
+		}
+	}
+	return out;
+}
+
+void GraphvizDotGen::writeTransList( RedState *state )
+{
+	/* Build the set of unique transitions out of this state. */
+	RedTransPtrSet stTransSet;
+	for ( RedTransList::Iter tel = state->outRange; tel.lte(); tel++ ) {
+		/* If we haven't seen the transition before, then move forward
+		 * emitting every range that shares it as a single labelled edge. */
+		if ( stTransSet.insert( tel->value ) ) {
+			/* Write out the from and to states. */
+			out << "\t" << state->id << " -> ";
+
+			if ( tel->value->targ == 0 )
+				out << "err_" << state->id;
+			else
+				out << tel->value->targ->id;
+
+			/* Begin the label. */
+			out << " [ label = \""; 
+			ONCHAR( tel->lowKey, tel->highKey );
+
+			/* Walk the rest of the list, adding ranges on the same transition. */
+			for ( RedTransList::Iter mtel = tel.next(); mtel.lte(); mtel++ ) {
+				if ( mtel->value == tel->value ) {
+					out << ", ";
+					ONCHAR( mtel->lowKey, mtel->highKey );
+				}
+			}
+
+			/* Write the action and close the transition. */
+			TRANS_ACTION( state, tel->value );
+			out << "\" ];\n";
+		}
+	}
+
+	/* Write the default transition, labelled DEF. */
+	if ( state->defTrans != 0 ) {
+		/* Write out the from and to states. */
+		out << "\t" << state->id << " -> ";
+
+		if ( state->defTrans->targ == 0 )
+			out << "err_" << state->id;
+		else
+			out << state->defTrans->targ->id;
+
+		/* Begin the label. */
+		out << " [ label = \"DEF"; 
+
+		/* Write the action and close the transition. */
+		TRANS_ACTION( state, state->defTrans );
+		out << "\" ];\n";
+	}
+}
+
+void GraphvizDotGen::writeDotFile( )
+{
+	out << 
+		"digraph " << fsmName << " {\n"
+		"	rankdir=LR;\n";
+	
+	/* Define the pseudo states. Transitions will be done after the states
+	 * have been defined as either final or not final. */
+	out << "	node [ shape = point ];\n";
+	out << "	ENTRY;\n";
+
+	/* Pseudo states for entry points in the entry map. */
+	for ( EntryIdVect::Iter en = redFsm->entryPointIds; en.lte(); en++ ) {
+		RedState *state = redFsm->allStates + *en;
+		out << "	en_" << state->id << ";\n";
+	}
+
+	/* Pseudo states for states with eof actions. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		if ( st->eofAction != 0 )
+			out << "	eof_" << st->id << ";\n";
+	}
+
+	out << "	node [ shape = circle, height = 0.2 ];\n";
+
+	/* Pseudo states for states with any transition that goes to error. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		bool needsErr = false;
+		if ( st->defTrans != 0 && st->defTrans->targ == 0 )
+			needsErr = true;
+		else {
+			for ( RedTransList::Iter tel = st->outRange; tel.lte(); tel++ ) {
+				if ( tel->value->targ == 0 ) {
+					needsErr = true;
+					break;
+				}
+			}
+		}
+
+		if ( needsErr )
+			out << "	err_" << st->id << " [ label=\"\"];\n";
+	}
+
+	/* Attributes common to all nodes, plus double circle for final states. */
+	out << "	node [ fixedsize = true, height = 0.65, shape = doublecircle ];\n";
+
+	/* List Final states. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		if ( st->isFinal )
+			out << "	" << st->id << ";\n";
+	}
+
+	/* List transitions. Nodes first named from here on are plain circles. */
+	out << "	node [ shape = circle ];\n";
+
+	/* Walk the states. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ )
+		writeTransList( st );
+
+	/* Transitions into the start state. */
+	out << "	ENTRY -> " << redFsm->startState->id << " [ label = \"IN";
+	out << "\" ];\n";
+
+	/* Transitions into the entry points, labelled with the entry name. */
+	for ( EntryIdVect::Iter en = redFsm->entryPointIds; en.lte(); en++ ) {
+		RedState *state = redFsm->allStates + *en;
+		char *name = redFsm->entryPointNames[en.pos()];
+		out << "	en_" << state->id << " -> " << state->id <<
+				" [ label = \"" << name << "\" ];\n";
+	}
+
+	/* Eof action transitions, from each state to its eof pseudo state. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		if ( st->eofAction != 0 ) {
+			out << "	" << st->id << " -> eof_" << 
+					st->id << " [ label = \"EOF"; 
+			ACTION( st->eofAction ) << "\" ];\n";
+		}
+	}
+
+	out <<
+		"}\n";
+}
+
+/* On the first call only: choose default transitions and write the dot file. */
+void GraphvizDotGen::finishRagelDef()
+{
+	if ( graphvizDone )
+		return;
+
+	graphvizDone = true;
+
+	/* For dot file generation we want to pick default transitions. */
+	redFsm->chooseDefaultSpan();
+	writeDotFile();
+}
+
+
+void PdaCodeGen::writeTransList( PdaState *state )
+{
+	for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+		/* Write out the from and to states, one dot edge per transition. */
+		out << "\t" << state->stateNum << " -> " << trans->value->toState->stateNum;
+
+		/* Begin the label: the language element's data if the key has one, else the key as a char. */
+		out << " [ label = \""; 
+		long key = trans->key;  
+		KlangEl *lel = pd->langElIndex[key];
+		if ( lel != 0 )
+			out << lel->data;
+		else
+			out << (char)key;
+
+		if ( trans->value->actions.length() > 0 ) {
+			out << " / ";
+			for ( ActDataList::Iter act = trans->value->actions; act.lte(); act++ ) {
+				switch ( *act & 0x3 ) { /* Low two bits: action kind. The rest (>> 2): production id. */
+				case 1: 
+					out << "S(" << trans->value->actOrds[act.pos()] << ")";
+					break;
+				case 2: {
+					out << "R(" << pd->prodIdIndex[(*act >> 2)]->data <<
+							", " << trans->value->actOrds[act.pos()] << ")";
+					break;
+				}
+				case 3: {
+					out << "SR(" << pd->prodIdIndex[(*act >> 2)]->data << 
+							", " << trans->value->actOrds[act.pos()] << ")";
+					break;
+				}}
+				if ( ! act.last() )
+					out << ", ";
+			}
+		}
+
+		out << "\" ];\n";
+	}
+}
+
+void PdaCodeGen::writeDotFile( PdaGraph *graph )
+{
+	out << 
+		"digraph " << parserName << " {\n"
+		"	rankdir=LR;\n";
+	
+	/* Define the pseudo states. Transitions will be done after the states
+	 * have been defined as either final or not final. */
+	out << "	node [ shape = point ];\n";
+	out << "	ENTRY;\n";
+
+	out << "	node [ shape = circle, height = 0.2 ];\n";
+
+	/* Attributes common to all nodes, plus double circle for final states. */
+	out << "	node [ fixedsize = true, height = 0.65, shape = doublecircle ];\n";
+
+	/* List Final states, taken from the graph's final state set. */
+	for ( PdaStateSet::Iter st = graph->finStateSet; st.lte(); st++ )
+		out << "	" << (*st)->stateNum << ";\n";
+
+	/* List transitions. Nodes first named from here on are plain circles. */
+	out << "	node [ shape = circle ];\n";
+
+	/* Walk the states. */
+	for ( PdaStateList::Iter st = graph->stateList; st.lte(); st++ )
+		writeTransList( st );
+
+	/* Transitions into the start state. */
+	out << "	ENTRY -> " << graph->startState->stateNum << " [ label = \"START\" ];\n";
+
+	out <<
+		"}\n";
+}
+
+void PdaCodeGen::writeDotFile( )
+{
+	writeDotFile( pd->pdaGraph ); /* Write the pda graph held by the parse data. */
+}
+
+#endif
+
diff --git a/colm/dotgen.h b/colm/dotgen.h
new file mode 100644
index 00000000..c0cd31e7
--- /dev/null
+++ b/colm/dotgen.h
@@ -0,0 +1,51 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _GVDOTGEN_H
+#define _GVDOTGEN_H
+
+#include <iostream>
+
+#if 0
+
+/* Code generator that writes a state machine out as a Graphviz dot graph. */
+class GraphvizDotGen : public CodeGenData
+{
+public:
+	GraphvizDotGen( std::ostream &out ) : CodeGenData(out) { }
+
+	/* Print an fsm to the out stream. */
+	void writeTransList( RedState *state );
+	void writeDotFile( );
+	virtual void finishRagelDef();
+
+private:
+	/* Writing labels and actions. Each returns the out stream. */
+	std::ostream &ONCHAR( Key lowKey, Key highKey );
+	std::ostream &TRANS_ACTION( RedState *fromState, RedTrans *trans );
+	std::ostream &ACTION( RedAction *action );
+	std::ostream &KEY( Key key );
+};
+
+#endif
+
+
+#endif /* _GVDOTGEN_H */
diff --git a/colm/fsmap.cpp b/colm/fsmap.cpp
new file mode 100644
index 00000000..d843474f
--- /dev/null
+++ b/colm/fsmap.cpp
@@ -0,0 +1,854 @@
+/*
+ *  Copyright 2002-2004 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "config.h"
+#include "fsmgraph.h"
+#include <iostream>
+
+using std::cerr;
+using std::endl;
+
+CondData *condData = 0; /* condition-space registry read and updated by FsmGraph::addCondSpace; starts null */
+KeyOps *keyOps = 0; /* source of minKey, maxKey and alphSize() for the graph code; starts null */
+
+/* Add one (ordering, action) entry to this action table. */
+void ActionTable::setAction( int ordering, Action *action )
+{
+	/* A multi-insert is used so that the same action can be present more
+	 * than once in a single transition. */
+	insertMulti( ordering, action );
+}
+
+/* Copy every entry of another action table into this one. */
+void ActionTable::setActions( const ActionTable &other )
+{
+	for ( ActionTable::Iter item = other; item.lte(); item++ )
+		insertMulti( item->key, item->value );
+}
+
+void ActionTable::setActions( int *orderings, Action **actions, int nActs )
+{
+	for ( int idx = 0; idx < nActs; ++idx ) /* two parallel arrays, nActs entries each */
+		insertMulti( orderings[idx], actions[idx] );
+}
+
+bool ActionTable::hasAction( Action *action )
+{
+	/* Linear scan: true as soon as any entry holds this action pointer. */
+	for ( int idx = 0; idx < length(); idx++ )
+		if ( data[idx].value == action )
+			return true;
+	return false;
+}
+
+/* Add one (ordering, token definition) entry to this longest-match table. */
+void LmActionTable::setAction( int ordering, TokenDef *action )
+{
+	/* A multi-insert is used so that the same entry can be present more
+	 * than once in a single transition. */
+	insertMulti( ordering, action );
+}
+
+/* Copy every entry of another longest-match action table into this one. */
+void LmActionTable::setActions( const LmActionTable &other )
+{
+	for ( LmActionTable::Iter item = other; item.lte(); item++ )
+		insertMulti( item->key, item->value );
+}
+
+void ErrActionTable::setAction( int ordering, Action *action, int transferPoint )
+{
+	insertMulti( ErrActionTableEl( action, ordering, transferPoint ) ); /* note: the element takes the action before the ordering */
+}
+
+void ErrActionTable::setActions( const ErrActionTable &other )
+{
+	for ( ErrActionTable::Iter src = other; src.lte(); src++ ) /* rebuild each element from its three fields */
+		insertMulti( ErrActionTableEl( src->action, src->ordering, src->transferPoint ) );
+}
+
+/* Record a priority in this table. When an entry on the same key already
+ * exists, the one with the later ordering is kept. */
+void PriorTable::setPrior( int ordering, PriorDesc *desc )
+{
+	PriorEl *existing = 0;
+	PriorEl *added = insert( PriorEl(ordering, desc), &existing );
+
+	/* A null result from insert() means an entry on desc's key was already
+	 * present, and existing now points at it. Overwrite that entry unless
+	 * its ordering is strictly later than the new one. */
+	if ( added == 0 && ordering >= existing->ordering )
+		*existing = PriorEl( ordering, desc );
+}
+
+/* Merge every priority of another table into this one. */
+void PriorTable::setPriors( const PriorTable &other )
+{
+	/* Each source entry goes through setPrior so that clashes on the same
+	 * key are resolved there. */
+	for ( PriorTable::Iter src = other; src.lte(); src++ )
+		setPrior( src->ordering, src->desc );
+}
+
+/* Give a priority to the transitions leaving the start state. The start state
+ * is isolated first so that nothing else enters it, then each of its out
+ * transitions that has a target state receives the priority.
+ * NOTE(review): this routine was previously documented as also setting the
+ * outPrior of a final start state (for accepting the null word). Nothing in
+ * this body does that -- confirm whether the omission is intentional. */
+void FsmGraph::startFsmPrior( int ordering, PriorDesc *prior )
+{
+	/* The start state must have no other entry points. */
+	isolateStartState();
+
+	/* Transitions without a target state are left alone. */
+	for ( TransList::Iter tr = startState->outList; tr.lte(); tr++ ) {
+		if ( tr->toState != 0 )
+			tr->priorTable.setPrior( ordering, prior );
+	}
+}
+
+/* Give a priority to every transition in the graph that has a target state,
+ * by walking the out list of each state. */
+void FsmGraph::allTransPrior( int ordering, PriorDesc *prior )
+{
+	/* Each state in the graph... */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* ...and each transition leaving it. */
+		for ( TransList::Iter tr = st->outList; tr.lte(); tr++ ) {
+			if ( tr->toState != 0 )
+				tr->priorTable.setPrior( ordering, prior );
+		}
+	}
+}
+
+/* Give a priority to every transition that currently enters a final state.
+ * Only in transitions that exist now are touched: if an entry state is final,
+ * transitions attached into it later will not pick this priority up. Unlike
+ * leaving transitions, the graph keeps no pending data for entering
+ * transitions. */
+void FsmGraph::finishFsmPrior( int ordering, PriorDesc *prior )
+{
+	/* finStateSet holds state pointers, hence the dereference. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ ) {
+		/* Every transition on the final state's in list. */
+		for ( TransInList::Iter tr = (*fin)->inList; tr.lte(); tr++ )
+			tr->priorTable.setPrior( ordering, prior );
+	}
+}
+
+/* Record a priority for any transitions that may later be made leaving this
+ * state machine. */
+void FsmGraph::leaveFsmPrior( int ordering, PriorDesc *prior )
+{
+	/* The pending priority is stored in the out table of each final state. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ )
+		(*fin)->outPriorTable.setPrior( ordering, prior );
+}
+
+
+/* Embed an action on the transitions leaving the start state. The start state
+ * is isolated first so that nothing else enters it, then each of its out
+ * transitions that has a target state receives the action.
+ * NOTE(review): this routine was previously documented as also adding the
+ * action to the out action table of a final start state (so that matching the
+ * null word still runs it). Nothing in this body does that -- confirm whether
+ * the omission is intentional. */
+void FsmGraph::startFsmAction( int ordering, Action *action )
+{
+	/* The start state must have no other entry points. */
+	isolateStartState();
+
+	/* Transitions without a target state are left alone. */
+	for ( TransList::Iter tr = startState->outList; tr.lte(); tr++ ) {
+		if ( tr->toState != 0 )
+			tr->actionTable.setAction( ordering, action );
+	}
+}
+
+/* Embed an action on every transition in the graph that has a target state,
+ * by walking the out list of each state. */
+void FsmGraph::allTransAction( int ordering, Action *action )
+{
+	/* Each state in the graph... */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* ...and each transition leaving it. */
+		for ( TransList::Iter tr = st->outList; tr.lte(); tr++ ) {
+			if ( tr->toState != 0 )
+				tr->actionTable.setAction( ordering, action );
+		}
+	}
+}
+
+/* Embed an action on every transition that enters a final state. A final
+ * start state cannot have an action run on first entering it, so in effect
+ * the action runs whenever a final state is entered from within the same
+ * fsm. */
+void FsmGraph::finishFsmAction( int ordering, Action *action )
+{
+	/* finStateSet holds state pointers, hence the dereference. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ ) {
+		/* Every transition on the final state's in list. */
+		for ( TransInList::Iter tr = (*fin)->inList; tr.lte(); tr++ )
+			tr->actionTable.setAction( ordering, action );
+	}
+}
+
+/* Record an action for any transitions that may later be made leaving this
+ * state machine. */
+void FsmGraph::leaveFsmAction( int ordering, Action *action )
+{
+	/* The pending action is stored in the out action table of each final state. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ )
+		(*fin)->outActionTable.setAction( ordering, action );
+}
+
+/* Add a longest-match entry (used when constructing scanners) to every transition entering a final state. */
+void FsmGraph::longMatchAction( int ordering, TokenDef *lmPart )
+{
+	/* finStateSet holds state pointers, hence the dereference. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ ) {
+		/* Every transition on the final state's in list. */
+		for ( TransInList::Iter tr = (*fin)->inList; tr.lte(); tr++ )
+			tr->lmActionTable.setAction( ordering, lmPart );
+	}
+}
+
+void FsmGraph::fillGaps( FsmState *state ) /* make state->outList cover keyOps->minKey..maxKey with no holes */
+{
+	if ( state->outList.length() == 0 ) {
+		/* No transitions at all: one new transition spans the whole key range. */
+		attachNewTrans( state, 0, keyOps->minKey, keyOps->maxKey );
+	}
+	else {
+		TransList srcList;
+		srcList.transfer( state->outList );
+
+		/* Check for a gap before the first existing transition. */
+		TransList::Iter trans = srcList, next;
+		if ( keyOps->minKey < trans->lowKey ) {
+			/* The filler ends one key below the first transition. */
+			Key highKey = trans->lowKey;
+			highKey.decrement();
+
+			attachNewTrans( state, 0, keyOps->minKey, highKey );
+		}
+
+		/* Put the first transition back; its successor is read before the append. */
+		next = trans.next();
+		state->outList.append( trans );
+
+		/* Keep the last high end. */
+		Key lastHigh = trans->highKey;
+
+		/* Loop over the remaining source ranges. */
+		for ( trans = next; trans.lte(); trans = next ) {
+			/* Make the next key following the last range. */
+			Key nextKey = lastHigh;
+			nextKey.increment();
+
+			/* Check for a gap from last up to here. */
+			if ( nextKey < trans->lowKey ) {
+				/* Make the high end of the range that fills the gap. */
+				Key highKey = trans->lowKey;
+				highKey.decrement();
+
+				attachNewTrans( state, 0, nextKey, highKey );
+			}
+
+			/* Put this transition back; its successor is read before the append. */
+			next = trans.next();
+			state->outList.append( trans );
+
+			/* Keep the last high end. */
+			lastHigh = trans->highKey;
+		}
+
+		/* Now check for a gap on the end to fill. */
+		if ( lastHigh < keyOps->maxKey ) {
+			/* The filler starts one key above the last transition. */
+			lastHigh.increment();
+
+			attachNewTrans( state, 0, lastHigh, keyOps->maxKey );
+		}
+	}
+}
+
+void FsmGraph::setErrorAction( FsmState *state, int ordering, Action *action )
+{
+	/* Attach an action to every error transition of one state. Gaps in the
+	 * out list are filled first so the whole key range has a transition. */
+	fillGaps( state );
+
+	/* A transition with no target state is one that goes to error. */
+	for ( TransList::Iter tr = state->outList; tr.lte(); tr++ )
+		if ( tr->toState == 0 )
+			tr->actionTable.setAction( ordering, action );
+}
+
+void FsmGraph::setErrorActions( FsmState *state, const ActionTable &other )
+{
+	/* Copy a whole action table onto every error transition of one state.
+	 * Gaps in the out list are filled first so the key range is covered. */
+	fillGaps( state );
+
+	/* A transition with no target state is one that goes to error. */
+	for ( TransList::Iter tr = state->outList; tr.lte(); tr++ )
+		if ( tr->toState == 0 )
+			tr->actionTable.setActions( other );
+}
+
+
+/* Give a target state for error transitions. */
+void FsmGraph::setErrorTarget( FsmState *state, FsmState *target, int *orderings, 
+			Action **actions, int nActs )
+{
+	/* Fill any gaps in the out list with an error transition. */
+	fillGaps( state );
+
+	/* Set error target in the transitions that go to error. */
+	for ( TransList::Iter trans = state->outList; trans.lte(); trans++ ) {
+		if ( trans->toState == 0 ) {
+			/* The trans goes to error, redirect it. */
+			redirectErrorTrans( trans->fromState, target, trans );
+			trans->actionTable.setActions( orderings, actions, nActs );
+		}
+	}
+}
+
+void FsmGraph::transferErrorActions( FsmState *state, int transferPoint )
+{
+	/* Move the pending error actions of one transfer point onto the state's error transitions. */
+	for ( int pos = 0; pos < state->errActionTable.length(); ) {
+		ErrActionTableEl *el = state->errActionTable.data + pos;
+		if ( el->transferPoint != transferPoint ) {
+			/* Belongs to another transfer point: keep it and step past. */
+			pos += 1;
+			continue;
+		}
+		/* Apply the action, then remove the entry; pos is deliberately not advanced. */
+		setErrorAction( state, el->ordering, el->action );
+		state->errActionTable.vremove( pos );
+	}
+}
+
+/* Record an error action in the start state. */
+void FsmGraph::startErrorAction( int ordering, Action *action, int transferPoint )
+{
+	/* Isolate first so that the start state has no other entry points. */
+	isolateStartState();
+
+	/* The action goes into the start state's error action table. */
+	startState->errActionTable.setAction( ordering, action, transferPoint );
+}
+
+/* Set error actions in all states where there is a transition out. */
+void FsmGraph::allErrorAction( int ordering, Action *action, int transferPoint )
+{
+	/* Insert actions in the error action table of all states. */
+	for ( StateList::Iter state = stateList; state.lte(); state++ )
+		state->errActionTable.setAction( ordering, action, transferPoint );
+}
+
+/* Set error actions in final states. */
+void FsmGraph::finalErrorAction( int ordering, Action *action, int transferPoint )
+{
+	/* Add the action to the error table of final states. */
+	for ( StateSet::Iter state = finStateSet; state.lte(); state++ )
+		(*state)->errActionTable.setAction( ordering, action, transferPoint );
+}
+
+void FsmGraph::notStartErrorAction( int ordering, Action *action, int transferPoint )
+{
+	/* Record the error action in every state except the start state. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( st != startState )
+			st->errActionTable.setAction( ordering, action, transferPoint );
+}
+
+void FsmGraph::notFinalErrorAction( int ordering, Action *action, int transferPoint )
+{
+	/* Record the error action in every state that is not final. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( ! st->isFinState() )
+			st->errActionTable.setAction( ordering, action, transferPoint );
+}
+
+/* Set error actions in the states that have transitions into a final state. */
+void FsmGraph::middleErrorAction( int ordering, Action *action, int transferPoint )
+{
+	/* Isolate the start state in case it is reachable from in inside the
+	 * machine, in which case we don't want it set. */
+	for ( StateList::Iter state = stateList; state.lte(); state++ ) {
+		if ( state != startState && ! state->isFinState() )
+			state->errActionTable.setAction( ordering, action, transferPoint );
+	}
+}
+
+/* Set an EOF action in the start state. */
+void FsmGraph::startEOFAction( int ordering, Action *action )
+{
+	/* Isolate first so that the start state has no other entry points. */
+	isolateStartState();
+
+	/* The action goes into the start state's EOF action table. */
+	startState->eofActionTable.setAction( ordering, action );
+}
+
+/* Set an EOF action in every state of the graph. */
+void FsmGraph::allEOFAction( int ordering, Action *action )
+{
+	/* The action goes into each state's EOF action table. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		st->eofActionTable.setAction( ordering, action );
+}
+
+/* Set an EOF action in every final state. */
+void FsmGraph::finalEOFAction( int ordering, Action *action )
+{
+	/* The action goes into the EOF action table of each final state. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ )
+		(*fin)->eofActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::notStartEOFAction( int ordering, Action *action )
+{
+	/* Set the EOF action in every state except the start state. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( st != startState )
+			st->eofActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::notFinalEOFAction( int ordering, Action *action )
+{
+	/* Set the EOF action in every state that is not final. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( ! st->isFinState() )
+			st->eofActionTable.setAction( ordering, action );
+}
+
+/* Set an EOF action in the states that are neither start nor final. */
+void FsmGraph::middleEOFAction( int ordering, Action *action )
+{
+	/* The start state is excluded by comparison only; it is not isolated
+	 * here. Final states are excluded through isFinState(). */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( st != startState && ! st->isFinState() )
+			st->eofActionTable.setAction( ordering, action );
+}
+
+/*
+ * Set To State Actions.
+ */
+
+/* Set a to-state action in the start state. */
+void FsmGraph::startToStateAction( int ordering, Action *action )
+{
+	/* Isolate first so that the start state has no other entry points. */
+	isolateStartState();
+	startState->toStateActionTable.setAction( ordering, action );
+}
+
+/* Set a to-state action in every state of the graph. */
+void FsmGraph::allToStateAction( int ordering, Action *action )
+{
+	/* The action goes into each state's to-state action table. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		st->toStateActionTable.setAction( ordering, action );
+}
+
+/* Set a to-state action in every final state. */
+void FsmGraph::finalToStateAction( int ordering, Action *action )
+{
+	/* The action goes into the to-state action table of each final state. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ )
+		(*fin)->toStateActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::notStartToStateAction( int ordering, Action *action )
+{
+	/* Set the to-state action in every state except the start state. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( st != startState )
+			st->toStateActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::notFinalToStateAction( int ordering, Action *action )
+{
+	/* Set the to-state action in every state that is not final. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( ! st->isFinState() )
+			st->toStateActionTable.setAction( ordering, action );
+}
+
+/* Set a to-state action in the states that are neither start nor final. */
+void FsmGraph::middleToStateAction( int ordering, Action *action )
+{
+	/* The start state is excluded by comparison only; it is not isolated
+	 * here. Final states are excluded through isFinState(). */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( st != startState && ! st->isFinState() )
+			st->toStateActionTable.setAction( ordering, action );
+}
+
+/* 
+ * Set From State Actions.
+ */
+
+void FsmGraph::startFromStateAction( int ordering, Action *action )
+{
+	/* Isolate the start state (no other entry points), then set the from-state action in it. */
+	isolateStartState();
+	startState->fromStateActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::allFromStateAction( int ordering, Action *action )
+{
+	/* Set the from-state action in every state of the graph. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		st->fromStateActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::finalFromStateAction( int ordering, Action *action )
+{
+	/* Set the from-state action in the from-state action table of each final state. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ )
+		(*fin)->fromStateActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::notStartFromStateAction( int ordering, Action *action )
+{
+	/* Set the from-state action in every state except the start state. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( st != startState )
+			st->fromStateActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::notFinalFromStateAction( int ordering, Action *action )
+{
+	/* Set the from-state action in every state that is not final. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( ! st->isFinState() )
+			st->fromStateActionTable.setAction( ordering, action );
+}
+
+void FsmGraph::middleFromStateAction( int ordering, Action *action )
+{
+	/* Set the from-state action in the states that are neither start nor
+	 * final. The start state is excluded by comparison only. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		if ( st != startState && ! st->isFinState() )
+			st->fromStateActionTable.setAction( ordering, action );
+}
+
+/* Renumber the action orderings on the start state's transitions so that, on
+ * each transition, they begin at fromOrder and go up by one per action.
+ * Returns the largest number of orderings used by any single transition. */
+int FsmGraph::shiftStartActionOrder( int fromOrder )
+{
+	int widest = 0;
+
+	/* Each transition leaving the start state is renumbered independently. */
+	for ( TransList::Iter tr = startState->outList; tr.lte(); tr++ ) {
+		/* Overwrite the keys in table order with consecutive values, the
+		 * first one being fromOrder. */
+		int nextOrder = fromOrder;
+		for ( ActionTable::Iter act = tr->actionTable; act.lte(); act++ )
+			act->key = nextOrder++;
+
+		/* Remember the highest per-transition count seen so far. */
+		int used = nextOrder - fromOrder;
+		if ( used > widest )
+			widest = used;
+	}
+
+	return widest;
+}
+
+/* Empty every priority table in the graph. */
+void FsmGraph::clearAllPriorities()
+{
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* The state's own pending (out) priorities. */
+		st->outPriorTable.empty();
+
+		/* The priorities on each transition leaving the state. */
+		for ( TransList::Iter tr = st->outList; tr.lte(); tr++ )
+			tr->priorTable.empty();
+	}
+}
+
+/* Set every action ordering in the graph to zero. This may be called before
+ * minimization, once it is known that no more fsm operations will be done:
+ * with the orderings equal, states are no longer kept apart merely because
+ * their action orderings differ, so greater reduction is achieved. */
+void FsmGraph::nullActionKeys( )
+{
+	/* Visit every state. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Tables carried by the state's out transitions. */
+		for ( TransList::Iter tr = st->outList; tr.lte(); tr++ ) {
+			/* The transition's action table. */
+			for ( ActionTable::Iter el = tr->actionTable;
+					el.lte(); el++ )
+				el->key = 0;
+
+			/* The transition's longest-match action table. */
+			for ( LmActionTable::Iter el = tr->lmActionTable;
+					el.lte(); el++ )
+				el->key = 0;
+		}
+
+		/* To-state action table. */
+		for ( ActionTable::Iter el = st->toStateActionTable;
+				el.lte(); el++ )
+			el->key = 0;
+
+		/* From-state action table. */
+		for ( ActionTable::Iter el = st->fromStateActionTable;
+				el.lte(); el++ )
+			el->key = 0;
+
+		/* Out action table (actions pending for leaving transitions). */
+		for ( ActionTable::Iter el = st->outActionTable;
+				el.lte(); el++ )
+			el->key = 0;
+
+		/* Error action table; its elements keep the order in 'ordering'. */
+		for ( ErrActionTable::Iter el = st->errActionTable;
+				el.lte(); el++ )
+			el->ordering = 0;
+
+		/* EOF action table. */
+		for ( ActionTable::Iter el = st->eofActionTable;
+				el.lte(); el++ )
+			el->key = 0;
+	}
+}
+
+/* Consistency check over every state, done with assert(): a state that is not
+ * final must carry no leaving data, the SB_BOTH bits must be clear, and each
+ * state must have at least one foreign in transition. */
+void FsmGraph::verifyStates()
+{
+	for ( StateList::Iter state = stateList; state.lte(); state++ ) {
+		/* Out actions, out conditions and out priorities belong on final states only. */
+		if ( (state->stateBits & SB_ISFINAL) == 0 ) {
+			assert( state->outActionTable.length() == 0 );
+			assert( state->outCondSet.length() == 0 );
+			assert( state->outPriorTable.length() == 0 );
+		}
+
+		/* Bits used by graph algorithms must not be left set. */
+		assert( (state->stateBits & SB_BOTH) == 0 );
+		assert( state->foreignInTrans > 0 );
+	}
+}
+
+/* Compare two priority tables. Only keys present in both tables matter: the
+ * first shared key whose priorities differ decides the result (-1 or 1).
+ * When no shared key has differing priorities the result is 0. */
+int FsmGraph::comparePrior( const PriorTable &priorTable1, const PriorTable &priorTable2 )
+{
+	/* Step through both tables together, pairing entries up by key. The
+	 * scan presumes both tables are ordered by desc->key. */
+	PriorTable::Iter lhs = priorTable1;
+	PriorTable::Iter rhs = priorTable2;
+	while ( lhs.lte() && rhs.lte() ) {
+		/* Unequal keys: advance the side whose key is smaller. */
+		if ( lhs->desc->key < rhs->desc->key )
+			lhs.increment();
+		else if ( lhs->desc->key > rhs->desc->key )
+			rhs.increment();
+		/* Same key: a difference in priority decides the result. */
+		else if ( lhs->desc->priority < rhs->desc->priority )
+			return -1;
+		else if ( lhs->desc->priority > rhs->desc->priority )
+			return 1;
+		else {
+			/* Same key and same priority: step past the pair. */
+			lhs.increment();
+			rhs.increment();
+		}
+	}
+
+	/* Ran out of entries on one side without finding a difference. */
+	return 0;
+}
+
+/* Order two transitions by the data embedded in them: priority table first,
+ * then longest-match action table, then action table. The first table that
+ * differs decides the result; zero means all three compare equal. The
+ * pointers must not be null. The from state and to state of the transitions
+ * play no part in the comparison. */
+int FsmGraph::compareTransData( FsmTrans *trans1, FsmTrans *trans2 )
+{
+	/* Priorities are the most significant part of the ordering. */
+	const int byPrior = CmpPriorTable::compare(
+			trans1->priorTable, trans2->priorTable );
+	if ( byPrior != 0 )
+		return byPrior;
+
+	/* Then the longest-match action tables. */
+	const int byLmAction = CmpLmActionTable::compare(
+			trans1->lmActionTable, trans2->lmActionTable );
+	if ( byLmAction != 0 )
+		return byLmAction;
+
+	/* The ordinary action tables settle whatever is still tied. */
+	return CmpActionTable::compare(
+			trans1->actionTable, trans2->actionTable );
+}
+
+/* Merge-time callback: fold the properties of srcTrans into destTrans. It is
+ * invoked when a new transition is made that duplicates another transition
+ * or combines several of them, once for each transition the new one is to
+ * represent. The source may be the destination itself, in which case only
+ * the action tables are added in (from copies) and the priorities are left
+ * as they are. */
+void FsmGraph::addInTrans( FsmTrans *destTrans, FsmTrans *srcTrans )
+{
+	/* The two cases differ because a table cannot be iterated while it is being added to. */
+	if ( srcTrans != destTrans ) {
+		/* Distinct transitions: take the actions and the priorities. */
+		destTrans->lmActionTable.setActions( srcTrans->lmActionTable );
+		destTrans->actionTable.setActions( srcTrans->actionTable );
+		destTrans->priorTable.setPriors( srcTrans->priorTable );
+	}
+	else {
+		/* Adding in ourselves: insert from temporary copies of the source
+		 * tables. Priorities are skipped as copying them would have no effect. */
+		destTrans->lmActionTable.setActions( LmActionTable(srcTrans->lmActionTable) );
+		destTrans->actionTable.setActions( ActionTable(srcTrans->actionTable) );
+	}
+}
+
+/* Order two states by their user-embedded data. Tables are compared in a fixed
+ * sequence and the first one that differs decides the result. */
+int FsmGraph::compareStateData( const FsmState *state1, const FsmState *state2 )
+{
+	/* 1. Out priority tables. */
+	int order = CmpPriorTable::compare(
+			state1->outPriorTable, state2->outPriorTable );
+	if ( order != 0 )
+		return order;
+
+	/* 2. To-state action tables. */
+	order = CmpActionTable::compare(
+			state1->toStateActionTable, state2->toStateActionTable );
+	if ( order != 0 )
+		return order;
+
+	/* 3. From-state action tables. */
+	order = CmpActionTable::compare(
+			state1->fromStateActionTable, state2->fromStateActionTable );
+	if ( order != 0 )
+		return order;
+
+	/* 4. Out action tables. */
+	order = CmpActionTable::compare(
+			state1->outActionTable, state2->outActionTable );
+	if ( order != 0 )
+		return order;
+
+	/* 5. Out condition sets. */
+	order = CmpActionSet::compare(
+			state1->outCondSet, state2->outCondSet );
+	if ( order != 0 )
+		return order;
+
+	/* 6. Error action tables. */
+	order = CmpErrActionTable::compare(
+			state1->errActionTable, state2->errActionTable );
+	if ( order != 0 )
+		return order;
+
+	/* 7. EOF action tables decide whatever is still tied. */
+	return CmpActionTable::compare(
+			state1->eofActionTable, state2->eofActionTable );
+}
+
+
+/* Invoked when a state loses its final state status and the leaving
+ * transition embedding data should be deleted. */
+void FsmGraph::clearOutData( FsmState *state )
+{
+	/* Empty the out actions, out conditions and out priorities. */
+	state->outActionTable.empty();
+	state->outCondSet.empty();
+	state->outPriorTable.empty();
+}
+
+bool FsmGraph::hasOutData( FsmState *state )
+{
+	/* True when any of the three leaving-data containers is non-empty. */
+	if ( state->outActionTable.length() > 0 || state->outCondSet.length() > 0 )
+		return true;
+	return state->outPriorTable.length() > 0;
+}
+
+/* 
+ * Setting Conditions.
+ */
+
+
+void logNewExpansion( Expansion *exp ); /* declared only; this file neither defines nor calls it */
+void logCondSpace( CondSpace *condSpace ); /* called from addCondSpace when COLM_LOG_CONDS is defined */
+
+CondSpace *FsmGraph::addCondSpace( const CondSet &condSet )
+{
+	/* Find the space for condSet, or create one whose keys start at the current nextCondKey. */
+	CondSpace *space = condData->condSpaceMap.find( condSet );
+	if ( space != 0 )
+		return space;
+
+	Key baseKey = condData->nextCondKey;
+	condData->nextCondKey += (1 << condSet.length() ) * keyOps->alphSize();
+	space = new CondSpace( condSet );
+	space->baseKey = baseKey;
+	condData->condSpaceMap.insert( space );
+	#ifdef COLM_LOG_CONDS
+	cerr << "adding new condition space" << endl;
+	cerr << "  condition set: ";
+	logCondSpace( space );
+	cerr << endl;
+	cerr << "  baseKey: " << baseKey.getVal() << endl;
+	#endif
+	return space;
+}
+
+void FsmGraph::startFsmCondition( Action *condAction )
+{
+	/* Isolate the start state (no other entry points), then embed the condition in it. */
+	isolateStartState();
+	embedCondition( startState, condAction );
+}
+
+void FsmGraph::allTransCondition( Action *condAction )
+{
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) /* embed the condition in every state */
+		embedCondition( st, condAction );
+}
+
+void FsmGraph::leaveFsmCondition( Action *condAction )
+{
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ ) /* add to each final state's out condition set */
+		(*fin)->outCondSet.insert( condAction );
+}
diff --git a/colm/fsmattach.cpp b/colm/fsmattach.cpp
new file mode 100644
index 00000000..201cdd76
--- /dev/null
+++ b/colm/fsmattach.cpp
@@ -0,0 +1,425 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <string.h>
+#include <assert.h>
+#include "fsmgraph.h"
+
+#include <iostream>
+using namespace std;
+
+/* Insert a transition at the front of an inlist. The head must be supplied. */
+void FsmGraph::attachToInList( FsmState *from, FsmState *to, 
+		FsmTrans *&head, FsmTrans *trans )
+{
+	trans->ilnext = head;
+	trans->ilprev = 0;
+
+	/* If in trans list is not empty, set the head->prev to trans. */
+	if ( head != 0 )
+		head->ilprev = trans;
+
+	/* Now insert ourselves at the front of the list. */
+	head = trans;
+
+	/* Only transitions arriving from another state count as foreign. */
+	if ( from != to ) {
+		if ( misfitAccounting ) {
+			/* If the number of foreign in transitions is about to go up to 1 then
+			 * move it from the misfit list to the main list. */
+			if ( to->foreignInTrans == 0 )
+				stateList.append( misfitList.detach( to ) );
+		}
+		
+		to->foreignInTrans += 1;
+	}
+}
+
+/* Detach a transition from an inlist. The head of the inlist must be supplied. */
+void FsmGraph::detachFromInList( FsmState *from, FsmState *to, 
+		FsmTrans *&head, FsmTrans *trans )
+{
+	/* Unlink on the predecessor side: trans is either the head or has a prev. */
+	if ( trans->ilprev == 0 ) 
+		head = trans->ilnext; 
+	else
+		trans->ilprev->ilnext = trans->ilnext; 
+	/* Fix the back pointer of the successor, if there is one. */
+	if ( trans->ilnext != 0 )
+		trans->ilnext->ilprev = trans->ilprev; 
+	
+	/* Only transitions arriving from another state count as foreign. */
+	if ( from != to ) {
+		to->foreignInTrans -= 1;
+		
+		if ( misfitAccounting ) {
+			/* If the number of foreign in transitions goes down to 0 then move it
+			 * from the main list to the misfit list. */
+			if ( to->foreignInTrans == 0 )
+				misfitList.append( stateList.detach( to ) );
+		}
+	}
+}
+
+/* Allocate a new transition covering lowKey..highKey, append it to the end of
+ * from's out list and, when a target is given, link it into to's in list.
+ * A null 'to' leaves the new transition off every in list. */
+FsmTrans *FsmGraph::attachNewTrans( FsmState *from, FsmState *to, Key lowKey, Key highKey )
+{
+	/* Make the new transition. */
+	FsmTrans *retVal = new FsmTrans();
+
+	/* The transition is now attached. Remember the parties involved. */
+	retVal->fromState = from;
+	retVal->toState = to;
+
+	/* Make the entry in the out list for the transitions. */
+	from->outList.append( retVal );
+
+	/* Set the keys of the new trans. */
+	retVal->lowKey = lowKey;
+	retVal->highKey = highKey;
+
+	/* Attach using inList as the head pointer. */
+	if ( to != 0 )
+		attachToInList( from, to, to->inList.head, retVal );
+
+	return retVal;
+}
+
+/* Attach for range lists or for the default transition.  Use this when the
+ * transition object already exists and only needs its endpoints recorded and
+ * its in-list linkage made.  The out list of 'from' is left untouched. */
+void FsmGraph::attachTrans( FsmState *from, FsmState *to, FsmTrans *trans )
+{
+	/* Only a fully detached transition may be attached. */
+	assert( trans->fromState == 0 && trans->toState == 0 );
+	trans->toState = to;
+	trans->fromState = from;
+
+	/* A null target has no in list to join; otherwise to's inList is the head. */
+	if ( to != 0 )
+		attachToInList( from, to, to->inList.head, trans );
+}
+
+/* Redirect a transition away from error and towards some state. This is just
+ * like attachTrans except it requires fromState to be set and does not touch
+ * it. */
+void FsmGraph::redirectErrorTrans( FsmState *from, FsmState *to, FsmTrans *trans )
+{
+	assert( trans->fromState != 0 && trans->toState == 0 );
+	trans->toState = to;
+
+	if ( to != 0 ) { 
+		/* Attach using the inList pointer as the head pointer. */
+		attachToInList( from, to, to->inList.head, trans );
+	}
+}
+
+/* Detach for out/in lists or for default transition. Clears both endpoints. */
+void FsmGraph::detachTrans( FsmState *from, FsmState *to, FsmTrans *trans )
+{
+	/* The caller must name the endpoints the transition really has. */
+	assert( trans->fromState == from && trans->toState == to );
+	trans->toState = 0;
+	trans->fromState = 0;
+	/* A transition with a null target sits on no in list. */
+	if ( to == 0 )
+		return;
+	detachFromInList( from, to, to->inList.head, trans );
+}
+
+
+/* Detach a state from the graph. Detaches and deletes transitions in and out
+ * of the state. Empties inList and outList. Removes the state from the final
+ * state set. A detached state becomes useless and should be deleted. */
+void FsmGraph::detachState( FsmState *state )
+{
+	/* Drain the in list: each pass unlinks and deletes the current head. */
+	while ( state->inList.head != 0 ) {
+		/* Get pointers to the trans and the state it comes from. */
+		FsmTrans *trans = state->inList.head;
+		FsmState *fromState = trans->fromState;
+
+		/* Unlink from this state's in list and clear the trans endpoints. */
+		detachTrans( fromState, state, trans );
+
+		/* Take it off the source's out list too, then it is ok to delete. */
+		fromState->outList.detach( trans );
+		delete trans;
+	}
+
+	/* Remove the entry points; unsetEntry shrinks entryIds on every call. */
+	while ( state->entryIds.length() > 0 )
+		unsetEntry( state->entryIds[0], state );
+
+	/* Detach and delete out transitions; fetch next before deleting. */
+	for ( TransList::Iter trans = state->outList; trans.lte(); ) {
+		TransList::Iter next = trans.next();
+		detachTrans( state, trans->toState, trans );
+		delete trans;
+		trans = next;
+	}
+
+	/* The elements were deleted above, so just abandon the list. */
+	state->outList.abandon();
+
+	/* Leave the final state set. The SB_ISFINAL bit itself is not cleared. */
+	if ( state->stateBits & SB_ISFINAL )
+		finStateSet.remove( state );
+}
+
+
+/* Duplicate a transition. Makes a new transition that is attached to the same
+ * dest as srcTrans. The new transition has functions and priority taken from
+ * srcTrans. Used for merging a transition in to a free spot. The new trans is
+ * not put on any out list and its keys are not set here; that is left to the
+ * caller. Returns the new transition. */
+FsmTrans *FsmGraph::dupTrans( FsmState *from, FsmTrans *srcTrans )
+{
+	/* Make a new transition. */
+	FsmTrans *newTrans = new FsmTrans();
+
+	/* Record the endpoints and join the in list of srcTrans's target. */
+	attachTrans( from, srcTrans->toState, newTrans );
+		
+	/* Call the user callback to add in the original source transition. */
+	addInTrans( newTrans, srcTrans );
+
+	return newTrans;
+}
+
+/* In crossing, src trans and dest trans both go to existing states. Make one
+ * state from the sets of states that src and dest trans go to. */
+FsmTrans *FsmGraph::fsmAttachStates( MergeData &md, FsmState *from,
+			FsmTrans *destTrans, FsmTrans *srcTrans )
+{
+	/* The priorities are equal. We must merge the transitions. Does the
+	 * existing trans go to the state we are to attach to? ie, are we to
+	 * simply double up the transition? */
+	FsmState *toState = srcTrans->toState;
+	FsmState *existingState = destTrans->toState;
+
+	if ( existingState == toState ) {
+		/* The transition is a double up to the same state.  Copy the src
+		 * trans into dest. We don't need to merge in the from out trans
+		 * data, that was done already. */
+		addInTrans( destTrans, srcTrans );
+	}
+	else {
+		/* The trans is not a double up. Dest trans cannot be the same as src
+		 * trans. Set up the state set. */
+		StateSet stateSet;
+
+		/* We go to all the states the existing trans goes to, plus... */
+		if ( existingState->stateDictEl == 0 )
+			stateSet.insert( existingState );
+		else
+			stateSet.insert( existingState->stateDictEl->stateSet );
+
+		/* ... all the states that we have been told to go to. */
+		if ( toState->stateDictEl == 0 )
+			stateSet.insert( toState );
+		else
+			stateSet.insert( toState->stateDictEl->stateSet );
+
+		/* Look for the state. If it is not there already, make it. */
+		StateDictEl *lastFound;
+		if ( md.stateDict.insert( stateSet, &lastFound ) ) {
+			/* Make a new state representing the combination of states in
+			 * stateSet. It gets added to the fill list.  This means that we
+			 * need to fill in its transitions sometime in the future.  We
+			 * don't do that now (ie, do not recurse). */
+			FsmState *combinState = addState();
+
+			/* Link up the dict element and the state. */
+			lastFound->targState = combinState;
+			combinState->stateDictEl = lastFound;
+
+			/* Add to the fill list. */
+			md.fillListAppend( combinState );
+		}
+
+		/* Get the state that was just inserted or was already present. */
+		FsmState *targ = lastFound->targState;
+
+		/* Detach dest trans from the state it currently goes to. */
+		detachTrans( from, existingState, destTrans );
+
+		/* Re-attach to the new target. */
+		attachTrans( from, targ, destTrans );
+
+		/* Add in src trans to the existing transition that we redirected to
+		 * the new state. We don't need to merge in the from out trans data,
+		 * that was done already. */
+		addInTrans( destTrans, srcTrans );
+	}
+
+	return destTrans;
+}
+
+/* Two transitions are to be crossed, handle the possibility of either going
+ * to the error state. Whenever at least one side is an error transition the
+ * source is simply folded into dest; otherwise the real cross is run. */
+FsmTrans *FsmGraph::mergeTrans( MergeData &md, FsmState *from,
+			FsmTrans *destTrans, FsmTrans *srcTrans )
+{
+	/* Read both targets once; a null target means "goes to error". */
+	FsmState *destTarg = destTrans->toState;
+	FsmState *srcTarg = srcTrans->toState;
+
+	/* Both go somewhere, run the actual cross. */
+	if ( destTarg != 0 && srcTarg != 0 )
+		return fsmAttachStates( md, from, destTrans, srcTrans );
+
+	/* From here on at least one side is an error transition. The only
+	 * difference between the remaining cases is whether dest must first be
+	 * pointed at the state src goes to. */
+	if ( destTarg == 0 && srcTarg != 0 ) {
+		/* Non error added into error: detach dest from the null target and
+		 * reattach it to src's target. */
+		detachTrans( from, destTarg, destTrans );
+		attachTrans( from, srcTarg, destTrans );
+	}
+
+	/* Covers error into error, non error into error (after the redirect
+	 * above) and error into non error. */
+	addInTrans( destTrans, srcTrans );
+
+	return destTrans;
+}
+
+/* Find the trans with the higher priority. If src is lower priority than dest then
+ * src is ignored. If src is higher priority than dest, then src overwrites dest. If
+ * the priorities are equal, then they are merged. */
+FsmTrans *FsmGraph::crossTransitions( MergeData &md, FsmState *from,
+		FsmTrans *destTrans, FsmTrans *srcTrans )
+{
+	FsmTrans *retTrans;
+
+	/* Compare the priority of the dest and src transitions. */
+	int compareRes = comparePrior( destTrans->priorTable, srcTrans->priorTable );
+	if ( compareRes < 0 ) {
+		/* Src trans has a higher priority than dest, src overwrites dest.
+		 * Detach dest and return a copy of src. NOTE(review): dest is only
+		 * detached here, not deleted -- confirm who releases it. */
+		detachTrans( from, destTrans->toState, destTrans );
+		retTrans = dupTrans( from, srcTrans );
+	}
+	else if ( compareRes > 0 ) {
+		/* The dest trans has a higher priority, use dest. */
+		retTrans = destTrans;
+	}
+	else {
+		/* Src trans and dest trans have the same priority, they must be merged. */
+		retTrans = mergeTrans( md, from, destTrans, srcTrans );
+	}
+
+	return retTrans;
+}
+
+/* Copy the transitions in srcList to the outlist of dest. The srcList should
+ * not be the outList of dest, otherwise you would be copying the contents of
+ * srcList into itself as it's iterated: bad news. */
+void FsmGraph::outTransCopy( MergeData &md, FsmState *dest, FsmTrans *srcList )
+{
+	/* The result is built in a fresh list and swapped in at the end. */
+	TransList destList;
+
+	/* Walk dest's out list (s1) and srcList (s2) together, stopping at breaks. */
+	PairIter<FsmTrans> outPair( dest->outList.head, srcList );
+	for ( ; !outPair.end(); outPair++ ) {
+		switch ( outPair.userState ) {
+		case RangeInS1: {
+			/* The pair iter is the authority on the keys. It may have needed
+			 * to break the dest range. */
+			FsmTrans *destTrans = outPair.s1Tel.trans;
+			destTrans->lowKey = outPair.s1Tel.lowKey;
+			destTrans->highKey = outPair.s1Tel.highKey;
+			destList.append( destTrans );
+			break;
+		}
+		case RangeInS2: {
+			/* Range only in src: give dest its own copy of the src trans. */
+			FsmTrans *newTrans = dupTrans( dest, outPair.s2Tel.trans );
+
+			/* Set up the transition's keys and append to the dest list. */
+			newTrans->lowKey = outPair.s2Tel.lowKey;
+			newTrans->highKey = outPair.s2Tel.highKey;
+			destList.append( newTrans );
+			break;
+		}
+		case RangeOverlap: {
+			/* Exact overlap, cross them. */
+			FsmTrans *newTrans = crossTransitions( md, dest,
+				outPair.s1Tel.trans, outPair.s2Tel.trans );
+
+			/* Set up the transition's keys and append to the dest list. */
+			newTrans->lowKey = outPair.s1Tel.lowKey;
+			newTrans->highKey = outPair.s1Tel.highKey;
+			destList.append( newTrans );
+			break;
+		}
+		case BreakS1: {
+			/* Since we are always writing to the dest trans, the dest needs
+			 * to be copied when it is broken. The copy goes into the first
+			 * half of the break to "break it off". */
+			outPair.s1Tel.trans = dupTrans( dest, outPair.s1Tel.trans );
+			break;
+		}
+		case BreakS2:
+			break;
+		}
+	}
+
+	/* Abandon the old outList and transfer destList into it. */
+	dest->outList.transfer( destList );
+}
+
+
+/* Move all the transitions that go into src so that they go into dest.  */
+void FsmGraph::inTransMove( FsmState *dest, FsmState *src )
+{
+	/* Do not try to move in trans to and from the same state. */
+	assert( dest != src );
+
+	/* If src is the start state, dest becomes the start state. */
+	if ( src == startState ) {
+		unsetStartState();
+		setStartState( dest );
+	}
+
+	/* Retarget src's entry points at dest. changeEntry removes the id from
+	 * src->entryIds, so take the first id each pass instead of iterating. */
+	while ( src->entryIds.length() > 0 )
+		changeEntry( src->entryIds[0], dest, src );
+
+	/* Move the transitions in inList. */
+	while ( src->inList.head != 0 ) {
+		/* Get trans and from state. */
+		FsmTrans *trans = src->inList.head;
+		FsmState *fromState = trans->fromState;
+
+		/* Detach from src, reattach to dest. */
+		detachTrans( fromState, src, trans );
+		attachTrans( fromState, dest, trans );
+	}
+}
diff --git a/colm/fsmbase.cpp b/colm/fsmbase.cpp
new file mode 100644
index 00000000..6db6e8da
--- /dev/null
+++ b/colm/fsmbase.cpp
@@ -0,0 +1,602 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <string.h>
+#include <assert.h>
+#include "fsmgraph.h"
+
+/* Append a state to the end of the singly linked fill list, which is threaded
+ * through alg.next and tracked by stfillHead and stfillTail. */
+void MergeData::fillListAppend( FsmState *state )
+{
+	/* The new element is last, so it has no successor. */
+	state->alg.next = 0;
+
+	/* Hook the state in after the current tail or, for an empty list, make it
+	 * the head. */
+	if ( stfillHead != 0 )
+		stfillTail->alg.next = state;
+	else
+		stfillHead = state;
+
+	/* Either way the state is the new tail. */
+	stfillTail = state;
+}
+
+/* Graph constructor. Builds a graph with no start state and no error state. */
+FsmGraph::FsmGraph()
+:
+	/* No start state and no error state. */
+	startState(0),
+	errState(0),
+
+	/* Misfit accounting is a switch, turned on only at specific times. It
+	 * controls what happens when states have no way in from the outside
+	 * world. */
+	misfitAccounting(false),
+
+	lmRequiresErrorState(false)
+{
+}
+
+/* Copy all graph data including transitions. errState is not carried over. */
+FsmGraph::FsmGraph( const FsmGraph &graph )
+:
+	/* Lists start empty. Will be filled by copy. */
+	stateList(),
+	misfitList(),
+
+	/* Copy in the entry points and start state; they still point into the
+	 * source graph here and are resolved to the duplicates below. */
+	entryPoints(graph.entryPoints),
+	startState(graph.startState),
+	errState(0),
+
+	/* Will be filled by copy. */
+	finStateSet(),
+	
+	/* Misfit accounting is only on during merging. */
+	misfitAccounting(false),
+
+	lmRequiresErrorState(graph.lmRequiresErrorState)
+{
+	/* Create the states and record their map in the original state. */
+	StateList::Iter origState = graph.stateList;
+	for ( ; origState.lte(); origState++ ) {
+		/* Make the new state. */
+		FsmState *newState = new FsmState( *origState );
+
+		/* Add the state to the list.  */
+		stateList.append( newState );
+
+		/* Remember the duplicate in the original's alg.stateMap. */
+		origState->alg.stateMap = newState;
+	}
+	
+	/* Dereference all the state maps. */
+	for ( StateList::Iter state = stateList; state.lte(); state++ ) {
+		for ( TransList::Iter trans = state->outList; trans.lte(); trans++ ) {
+			/* toState still points to the original in the src machine. The
+			 * target's duplicate is in the statemap. */
+			FsmState *toState = trans->toState != 0 ? trans->toState->alg.stateMap : 0;
+
+			/* Attach the transition to the duplicate. */
+			trans->toState = 0;
+			attachTrans( state, toState, trans );
+		}
+	}
+
+	/* Fix the state pointers in the entry points array. */
+	EntryMapEl *eel = entryPoints.data;
+	for ( int e = 0; e < entryPoints.length(); e++, eel++ ) {
+		/* Get the duplicate of the state. */
+		eel->value = eel->value->alg.stateMap;
+
+		/* Foreign in transitions must be built up when duping machines so
+		 * increment it here. */
+		eel->value->foreignInTrans += 1;
+	}
+
+	/* Fix the start state pointer and its count of in transitions.
+	 * NOTE(review): dereferences graph.startState -- assumes it is non-null. */
+	startState = startState->alg.stateMap;
+	startState->foreignInTrans += 1;
+
+	/* Build the final state set. */
+	StateSet::Iter st = graph.finStateSet; 
+	for ( ; st.lte(); st++ ) 
+		finStateSet.insert((*st)->alg.stateMap);
+}
+
+/* Deletes all transition data then deletes each state on stateList. */
+FsmGraph::~FsmGraph()
+{
+	/* Delete all the transitions. Only stateList is walked here. */
+	for ( StateList::Iter state = stateList; state.lte(); state++ ) {
+		/* Empty the state's out list, deleting its transitions. */
+		state->outList.empty();
+	}
+
+	/* Delete all the states. */
+	stateList.empty();
+}
+
+/* Set a state final. The SB_ISFINAL bit is set in the state's stateBits and
+ * the state is added to the finStateSet. */
+void FsmGraph::setFinState( FsmState *state )
+{
+	/* States that are already final need no work. */
+	if ( ! (state->stateBits & SB_ISFINAL) ) {
+		/* Flag the state and record it in the set of final states. */
+		state->stateBits |= SB_ISFINAL;
+		finStateSet.insert( state );
+	}
+}
+
+/* Set a state non-final. The SB_ISFINAL bit is cleared and the state is
+ * removed from the final state set. */
+void FsmGraph::unsetFinState( FsmState *state )
+{
+	/* Only a state that is currently final has anything to give up. */
+	if ( state->stateBits & SB_ISFINAL ) {
+		/* When a state loses its final state status it must relinquish all
+		 * the properties that are allowed only for final states. */
+		clearOutData( state );
+
+		/* Drop the flag and the set membership together. */
+		state->stateBits &= ~ SB_ISFINAL;
+		finStateSet.remove( state );
+	}
+}
+
+/* Set a state as the start state. Counts as one foreign in transition. */
+void FsmGraph::setStartState( FsmState *state )
+{
+	/* Should change from unset to set. */
+	assert( startState == 0 );
+	startState = state;
+
+	if ( misfitAccounting ) {
+		/* If the number of foreign in transitions is about to go up to 1 then
+		 * take it off the misfit list and put it on the head list. */
+		if ( state->foreignInTrans == 0 )
+			stateList.append( misfitList.detach( state ) );
+	}
+
+	/* Up the foreign in transitions to the state. */
+	state->foreignInTrans += 1;
+}
+
+void FsmGraph::unsetStartState()
+{
+	/* Should change from set to unset. */
+	assert( startState != 0 );
+
+	/* Give back the foreign in transition that setStartState counted. */
+	startState->foreignInTrans -= 1;
+
+	if ( misfitAccounting ) {
+		/* If the number of foreign in transitions just went down to 0 then take
+		 * it off the main list and put it on the misfit list. */
+		if ( startState->foreignInTrans == 0 )
+			misfitList.append( stateList.detach( startState ) );
+	}
+
+	startState = 0;
+}
+
+/* Associate an id with a state. Makes the state a named entry point. Has no
+ * effect if the entry point is already mapped to the state. */
+void FsmGraph::setEntry( int id, FsmState *state )
+{
+	/* Insert the id into the state. If the state is already labelled with id,
+	 * nothing to do. */
+	if ( state->entryIds.insert( id ) ) {
+		/* Add to the entry map; multi because one id may name several states. */
+		entryPoints.insertMulti( id, state );
+
+		if ( misfitAccounting ) {
+			/* If the number of foreign in transitions is about to go up to 1 then
+			 * take it off the misfit list and put it on the head list. */
+			if ( state->foreignInTrans == 0 )
+				stateList.append( misfitList.detach( state ) );
+		}
+
+		/* Up the foreign in transitions to the state. */
+		state->foreignInTrans += 1;
+	}
+}
+
+/* Remove the association of an id with a state. The state loses its entry
+ * point status. Assumes that the id is indeed mapped to state. */
+void FsmGraph::unsetEntry( int id, FsmState *state )
+{
+	/* Find the records for id, then scan forward (unbounded) to state's. */
+	EntryMapEl *enLow = 0, *enHigh = 0;
+	entryPoints.findMulti( id, enLow, enHigh );
+	while ( enLow->value != state )
+		enLow += 1;
+
+	/* Remove the record from the map. */
+	entryPoints.remove( enLow );
+
+	/* Remove the state's sense of the link. */
+	state->entryIds.remove( id );
+	state->foreignInTrans -= 1;
+	if ( misfitAccounting ) {
+		/* If the number of foreign in transitions just went down to 0 then take
+		 * it off the main list and put it on the misfit list. */
+		if ( state->foreignInTrans == 0 )
+			misfitList.append( stateList.detach( state ) );
+	}
+}
+
+/* Remove all association of an id with states. Assumes that the id is indeed
+ * mapped to a state; the result of findMulti is not checked. */
+void FsmGraph::unsetEntry( int id )
+{
+	/* Find the inclusive range of records for id. */
+	EntryMapEl *enLow = 0, *enHigh = 0;
+	entryPoints.findMulti( id, enLow, enHigh );
+	for ( EntryMapEl *mel = enLow; mel <= enHigh; mel++ ) {
+		/* Remove the state's sense of the link. */
+		mel->value->entryIds.remove( id );
+		mel->value->foreignInTrans -= 1;
+		if ( misfitAccounting ) {
+			/* If the number of foreign in transitions just went down to 0
+			 * then take it off the main list and put it on the misfit list. */
+			if ( mel->value->foreignInTrans == 0 )
+				misfitList.append( stateList.detach( mel->value ) );
+		}
+	}
+
+	/* Remove the records from the entry points map. */
+	entryPoints.removeMulti( enLow, enHigh );
+}
+
+/* Repoint the entry 'id' that currently maps to 'from' so it maps to 'to'. */
+void FsmGraph::changeEntry( int id, FsmState *to, FsmState *from )
+{
+	/* Find the records for id, then scan forward (unbounded) to from's. */
+	EntryMapEl *enLow = 0, *enHigh = 0;
+	entryPoints.findMulti( id, enLow, enHigh );
+	while ( enLow->value != from )
+		enLow += 1;
+	
+	/* Change it to the new target. */
+	enLow->value = to;
+
+	/* Remove from's sense of the link. */
+	from->entryIds.remove( id );
+	from->foreignInTrans -= 1;
+	if ( misfitAccounting ) {
+		/* If the number of foreign in transitions just went down to 0 then take
+		 * it off the main list and put it on the misfit list. */
+		if ( from->foreignInTrans == 0 )
+			misfitList.append( stateList.detach( from ) );
+	}
+
+	/* Add to's sense of the link; skipped when to already carries the id. */
+	if ( to->entryIds.insert( id ) != 0 ) {
+		if ( misfitAccounting ) {
+			/* If the number of foreign in transitions is about to go up to 1 then
+			 * take it off the misfit list and put it on the head list. */
+			if ( to->foreignInTrans == 0 )
+				stateList.append( misfitList.detach( to ) );
+		}
+
+		/* Up the foreign in transitions to the state. */
+		to->foreignInTrans += 1;
+	}
+}
+
+
+/* Clear all entry points from a machine. */
+void FsmGraph::unsetAllEntryPoints()
+{
+	for ( EntryMap::Iter en = entryPoints; en.lte(); en++ ) {
+		/* Kill all the state's entry points at once; later records that
+		 * name the same state find its id set empty and skip it. */
+		if ( en->value->entryIds.length() > 0 ) {
+			en->value->foreignInTrans -= en->value->entryIds.length();
+			if ( misfitAccounting ) {
+				/* If the number of foreign in transitions just went down to 0
+				 * then take it off the main list and put it on the misfit
+				 * list. */
+				if ( en->value->foreignInTrans == 0 )
+					misfitList.append( stateList.detach( en->value ) );
+			}
+
+			/* Clear the set of ids out all at once. */
+			en->value->entryIds.empty();
+		}
+	}
+
+	/* Now clear out the entry map all at once. */
+	entryPoints.empty();
+}
+
+/* Append id to the epsilon transition list of every final state. */
+void FsmGraph::epsilonTrans( int id )
+{
+	for ( StateSet::Iter fs = finStateSet; fs.lte(); fs++ )
+		(*fs)->epsilonTrans.append( id );
+}
+
+/* Mark all states reachable from state. Traverses transitions forward. Used
+ * for removing states that have no path into them. */
+void FsmGraph::markReachableFromHere( FsmState *state )
+{
+	/* A state that is already marked has been visited: the recursion stops
+	 * there, which also keeps cycles from looping forever. */
+	if ( ! (state->stateBits & SB_ISMARKED) ) {
+		/* Mark before descending so the state counts as processed. */
+		state->stateBits |= SB_ISMARKED;
+
+		/* Follow every out transition that has a real target. */
+		for ( TransList::Iter out = state->outList; out.lte(); out++ ) {
+			FsmState *target = out->toState;
+			if ( target != 0 )
+				markReachableFromHere( target );
+		}
+	}
+}
+
+void FsmGraph::markReachableFromHereStopFinal( FsmState *state )
+{
+	/* Base case: already marked, nothing more to do. */
+	if ( state->stateBits & SB_ISMARKED )
+		return;
+	
+	/* Set this state as processed. We are going to visit the non-final
+	 * states that this state has a transition to. */
+	state->stateBits |= SB_ISMARKED;
+
+	/* Recurse on out transitions, but neither mark nor enter final states. */
+	for ( TransList::Iter trans = state->outList; trans.lte(); trans++ ) {
+		FsmState *toState = trans->toState;
+		if ( toState != 0 && !toState->isFinState() )
+			markReachableFromHereStopFinal( toState );
+	}
+}
+
+/* Mark all states that can reach state. Traverses transitions backwards. Used
+ * for removing dead end paths in graphs. */
+void FsmGraph::markReachableFromHereReverse( FsmState *state )
+{
+	/* Base case: already marked, nothing more to do. */
+	if ( state->stateBits & SB_ISMARKED )
+		return;
+	
+	/* Set this state as processed. We are going to visit all states with
+	 * transitions into this state. */
+	state->stateBits |= SB_ISMARKED;
+
+	/* Recurse on the source state of every transition on the in list. */
+	for ( TransInList::Iter trans = state->inList; trans.lte(); trans++ ) 
+		markReachableFromHereReverse( trans->fromState );
+}
+
+/* Determine if there are any entry points into a start state other than the
+ * start state. Setting starting transitions requires that the start state be
+ * isolated. In most cases a start state will already be isolated. */
+bool FsmGraph::isStartStateIsolated()
+{
+	/* Besides being the start state, two things can lead into it:
+	 * transitions on its in list and named entry points. */
+	const bool noInTrans = startState->inList.head == 0;
+	const bool noEntryIds = !( startState->entryIds.length() > 0 );
+
+	/* If there are any in transitions or any entry points then the state is
+	 * not isolated. */
+	return noInTrans && noEntryIds;
+
+}
+
+/* Bring in other's entry points. Assumes other's states are going to be
+ * copied into this machine. Only the entry map is touched here. */
+void FsmGraph::copyInEntryPoints( FsmGraph *other )
+{
+	/* Use insert multi because names are not unique. */
+	for ( EntryMap::Iter en = other->entryPoints; en.lte(); en++ )
+		entryPoints.insertMulti( en->key, en->value );
+}
+
+/* Clear SB_ISFINAL on every final state and empty the final state set. */
+void FsmGraph::unsetAllFinStates()
+{
+	for ( StateSet::Iter st = finStateSet; st.lte(); st++ )
+		(*st)->stateBits &= ~ SB_ISFINAL;
+	finStateSet.empty();
+}
+
+void FsmGraph::setFinBits( int finStateBits )
+{
+	/* OR the given bits into the stateBits of every final state. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ ) (*fin)->stateBits |= finStateBits;
+}
+
+
+/* Asserts that out-list and in-list membership agree with from/toState. */
+void FsmGraph::verifyIntegrity()
+{
+	for ( StateList::Iter state = stateList; state.lte(); state++ ) {
+		/* Every transition on the out list must name this state as its source. */
+		for ( TransList::Iter trans = state->outList; trans.lte(); trans++ )
+			assert( trans->fromState == state );
+
+		/* Every transition on the in list must name this state as its target. */
+		for ( TransInList::Iter trans = state->inList; trans.lte(); trans++ ) 
+			assert( trans->toState == state );
+	}
+}
+
+void FsmGraph::verifyReachability()
+{
+	/* Mark all the states that can be reached from the start state and
+	 * through the set of entry points. */
+	markReachableFromHere( startState );
+	for ( EntryMap::Iter en = entryPoints; en.lte(); en++ )
+		markReachableFromHere( en->value );
+
+	/* Check that everything on the state list got marked. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Assert it got marked and then clear the mark. */
+		assert( st->stateBits & SB_ISMARKED );
+		st->stateBits &= ~ SB_ISMARKED;
+	}
+}
+
+void FsmGraph::verifyNoDeadEndStates()
+{
+	/* Mark all states that have paths to the final states. */
+	for ( StateSet::Iter pst = finStateSet; pst.lte(); pst++ )
+		markReachableFromHereReverse( *pst );
+
+	/* Start state gets honorary marking. Must be done AFTER recursive call. */
+	startState->stateBits |= SB_ISMARKED;
+
+	/* Make sure everything on the state list got marked. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Assert the state got marked and unmark it. */
+		assert( st->stateBits & SB_ISMARKED );
+		st->stateBits &= ~ SB_ISMARKED;
+	}
+}
+
+void FsmGraph::depthFirstOrdering( FsmState *state )
+{
+	/* Nothing to do if the state is already on the list. */
+	if ( state->stateBits & SB_ONLIST )
+		return;
+
+	/* Doing depth first, put state on the list before its successors. */
+	state->stateBits |= SB_ONLIST;
+	stateList.append( state );
+	
+	/* Recurse on the target of every out transition that has one. */
+	for ( TransList::Iter tel = state->outList; tel.lte(); tel++ ) {
+		if ( tel->toState != 0 )
+			depthFirstOrdering( tel->toState );
+	}
+}
+
+/* Reorder stateList depth first by transition connections. */
+void FsmGraph::depthFirstOrdering()
+{
+	/* Clear the on-list flag of every state. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		st->stateBits &= ~SB_ONLIST;
+	
+	/* Remember the length, then abandon the state list; we will rebuild it. */
+	int stateListLen = stateList.length();
+	stateList.abandon();
+
+	/* Add back to the state list from the error state (if any), the start
+	 * state and all other entry points, in that order. */
+	if ( errState != 0 )
+		depthFirstOrdering( errState );
+	depthFirstOrdering( startState );
+	for ( EntryMap::Iter en = entryPoints; en.lte(); en++ )
+		depthFirstOrdering( en->value );
+	
+	/* Make sure we put everything back on. */
+	assert( stateListLen == stateList.length() );
+}
+
+/* Stable sort the states by final state status. */
+void FsmGraph::sortStatesByFinal()
+{
+	/* Move forward through the list and throw final states onto the end. */
+	FsmState *state = 0;
+	FsmState *next = stateList.head;
+	FsmState *last = stateList.tail;
+	while ( state != last ) {
+		/* Load next before state can be moved; stop after the original tail. */
+		state = next;
+		next = state->next;
+
+		/* Throw to the end? */
+		if ( state->isFinState() ) {
+			stateList.detach( state );
+			stateList.append( state );
+		}
+	}
+}
+
+void FsmGraph::setStateNumbers( int base )
+{
+	/* Number the states consecutively in list order, starting at base. */
+	for ( StateList::Iter st = stateList; st.lte(); st++, base++ ) st->alg.stateNum = base;
+}
+
+
+bool FsmGraph::checkErrTrans( FsmState *state, FsmTrans *trans )
+{
+	/* Might go directly to error state. */
+	if ( trans->toState == 0 )
+		return true;
+
+	if ( trans->prev == 0 ) {
+		/* If this is the first transition. */
+		if ( keyOps->minKey < trans->lowKey )
+			return true;
+	}
+	else {
+		/* Not the first transition. Compare against the prev. */
+		FsmTrans *prev = trans->prev;
+		Key nextKey = prev->highKey;
+		nextKey.increment();
+		if ( nextKey < trans->lowKey )
+			return true; 
+	}
+	return false;
+}
+
+bool FsmGraph::checkErrTransFinish( FsmState *state )
+{
+	/* No ranges at all: nothing in the key space is covered. */
+	if ( state->outList.length() == 0 )
+		return true;
+	else {
+		/* Get the last and check for a gap between it and the maximum key. */
+		FsmTrans *last = state->outList.tail;
+		if ( last->highKey < keyOps->maxKey )
+			return true;
+	}
+	return false;
+}
+
+bool FsmGraph::hasErrorTrans()
+{
+	/* A state has an error transition when one of its ranges goes to error
+	 * or leaves a gap before it, or when keys remain after its last range.
+	 * Stop at the first hit. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		for ( TransList::Iter tr = st->outList; tr.lte(); tr++ ) {
+			if ( checkErrTrans( st, tr ) )
+				return true;
+		}
+		if ( checkErrTransFinish( st ) )
+			return true;
+	}
+	return false;
+}
diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
new file mode 100644
index 00000000..025c6dce
--- /dev/null
+++ b/colm/fsmcodegen.cpp
@@ -0,0 +1,1089 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "parsedata.h"
+#include "fsmcodegen.h"
+#include "redfsm.h"
+#include "dotgen.h"
+#include "bstmap.h"
+#include "fsmrun.h"
+#include <sstream>
+#include <string>
+#include <assert.h>
+
+
+using std::ostream;
+using std::ostringstream;
+using std::string;
+using std::cerr;
+using std::endl;
+
+
+/* Keep the given names, stream, machine and tables; error count 0, flags true. */
+FsmCodeGen::FsmCodeGen( const char *sourceFileName, const char *fsmName, ostream &out, 
+		RedFsm *redFsm, FsmTables *fsmTables )
+:
+	sourceFileName(sourceFileName),
+	fsmName(fsmName), 
+	out(out),
+	redFsm(redFsm), 
+	fsmTables(fsmTables),
+	codeGenErrCount(0),
+	dataPrefix(true),
+	writeFirstFinal(true),
+	writeErr(true)
+{
+}
+
+unsigned int FsmCodeGen::arrayTypeSize( unsigned long maxVal )
+{
+	/* The size field of the host type keyOps->typeSubsumes picks for maxVal. */
+	HostType *fit = keyOps->typeSubsumes( (long long) maxVal );
+	assert( fit != 0 );
+	return fit->size;
+}
+
+string FsmCodeGen::ARRAY_TYPE( unsigned long maxVal )
+{
+	/* Name of the host type keyOps->typeSubsumes picks for maxVal. The
+	 * name is data1, followed by a space and data2 when data2 is set. */
+	HostType *fit = keyOps->typeSubsumes( (long long) maxVal );
+	assert( fit != 0 );
+	string name = fit->data1;
+	if ( fit->data2 == 0 )
+		return name;
+	name += " ";
+	name += fit->data2;
+	return name;
+}
+
+
+/* The machine name given at construction, as a string. */
+string FsmCodeGen::FSM_NAME()
+{
+	return string( fsmName );
+}
+
+/* Return the id of the start state formatted as a decimal integer. */
+string FsmCodeGen::START_STATE_ID()
+{
+	ostringstream ret;
+	ret << redFsm->startState->id;
+	return ret.str();
+}
+
+/* Write the actions array: a leading 0, then per table its length and ids. */
+std::ostream &FsmCodeGen::ACTIONS_ARRAY()
+{
+	out << "\t0, ";
+	int totalActions = 1;	/* values written so far, counting the leading 0 */
+	for ( GenActionTableMap::Iter act = redFsm->actionMap; act.lte(); act++ ) {
+		/* Write out the length. It is always followed by a comma, which
+		 * presumes the last table is never empty -- TODO confirm. */
+		out << act->key.length() << ", ";
+		/* Put in a line break every 8 */
+		if ( totalActions++ % 8 == 7 )
+			out << "\n\t";
+		/* Then the id of every action in this table, in table order. */
+		for ( GenActionTable::Iter item = act->key; item.lte(); item++ ) {
+			out << item->value->actionId;
+			if ( ! (act.last() && item.last()) )	/* no comma after the very last id */
+				out << ", ";
+			/* Put in a line break every 8 */
+			if ( totalActions++ % 8 == 7 )
+				out << "\n\t";
+		}
+	}
+	out << "\n";
+	return out;
+}
+
+
+string FsmCodeGen::CS()
+{
+	/* Expression naming the current state variable: ACCESS() then "cs". */
+	ostringstream expr;
+	expr << ACCESS() << "cs";
+	return expr.str();
+}
+
+string FsmCodeGen::GET_WIDE_KEY()
+{
+	/* "_widec" if the machine has any conditions, else the plain key. */
+	if ( !redFsm->anyConditions() )
+		return GET_KEY();
+	return "_widec";
+}
+
+string FsmCodeGen::GET_WIDE_KEY( RedState *state )
+{
+	/* Per-state variant: "_widec" only if this state's cond list is non-empty. */
+	if ( !(state->stateCondList.length() > 0) )
+		return GET_KEY();
+	return "_widec";
+}
+
+string FsmCodeGen::GET_KEY()
+{
+	/* The current key: a parenthesised dereference of the P() expression. */
+	ostringstream expr;
+	expr << "(*" << P() << ")";
+	return expr.str();
+}
+
+/* Build a string of level tab characters (empty when level <= 0). Makes the
+ * nested binary search nice looking. */
+string FsmCodeGen::TABS( int level )
+{
+	string indent;
+	for ( int depth = 0; depth < level; depth++ )
+		indent += "\t";
+	return indent;
+}
+
+/* Format a key as a literal. An unsigned alphabet gets the value cast to
+ * unsigned long with a 'u' suffix when hostLang->explicitUnsigned is set. */
+string FsmCodeGen::KEY( Key key )
+{
+	ostringstream lit;
+	if ( !keyOps->isSigned && hostLang->explicitUnsigned )
+		lit << (unsigned long) key.getVal() << 'u';
+	else
+		lit << key.getVal();
+	return lit.str();
+}
+/* Emit "<ACT()> = <longestMatchId of the item's longest-match part>;". */
+void FsmCodeGen::SET_ACT( ostream &ret, InlineItem *item )
+{
+	ret << ACT() << " = " << item->longestMatchPart->longestMatchId << ";";
+}
+
+void FsmCodeGen::SET_TOKEND( ostream &ret, InlineItem *item )
+{
+	/* Emit "<TOKEND()> = <P()>+1;". The item argument is not consulted. */
+	ret << TOKEND() << " = " << P() << "+1;";
+}
+/* Emit "<TOKSTART()> = 0;". The item argument is not consulted. */
+void FsmCodeGen::INIT_TOKSTART( ostream &ret, InlineItem *item )
+{
+	ret << TOKSTART() << " = 0;";
+}
+/* Emit "<ACT()> = 0;". The item argument is not consulted. */
+void FsmCodeGen::INIT_ACT( ostream &ret, InlineItem *item )
+{
+	ret << ACT() << " = 0;";
+}
+/* Emit "<TOKSTART()> = <P()>;". The item argument is not consulted. */
+void FsmCodeGen::SET_TOKSTART( ostream &ret, InlineItem *item )
+{
+	ret << TOKSTART() << " = " << P() << ";";
+}
+void FsmCodeGen::EMIT_TOKEN( ostream &ret, KlangEl *token )
+{
+	/* Emit the call that passes on the token's id: sendIgnore() when the
+	 * token's ignore flag is set, sendToken() otherwise. */
+	const char *call = token->ignore ? "	sendIgnore( " : "	sendToken( ";
+	ret << call << token->id << " );\n";
+}
+
+void FsmCodeGen::LM_SWITCH( ostream &ret, InlineItem *item, 
+		int targState, int inFinish )
+{
+	/* Emits code that sets p back to the token end and then switches on
+	 * act to send the token whose longest-match id was stored there.
+	 * targState and inFinish are not used here. */
+	ret << "	" << P() << " = " << TOKEND() << ";\n";
+	ret << "	switch( " << ACT() << " ) {\n";
+
+	/* If the switch handles error then we also forced the error state, so
+	 * it will exist. Case 0 rewinds p to the token start and goes there. */
+	if ( item->tokenRegion->lmSwitchHandlesError ) {
+		ret << "	case 0: " << P() << " = " << TOKSTART();
+		ret << "; goto st" << redFsm->errState->id << ";\n";
+	}
+
+	/* One case per token definition flagged as part of the selection. */
+	TokenDefList::Iter lmi = item->tokenRegion->tokenDefList;
+	for ( ; lmi.lte(); lmi++ ) {
+		if ( !lmi->inLmSelect )
+			continue;
+		assert( lmi->token != 0 );
+		ret << "	case " << lmi->longestMatchId << ":\n";
+		EMIT_TOKEN( ret, lmi->token );
+		ret << "	break;\n";
+	}
+	ret << "	}\n" "\t" " goto _resume;\n";
+}
+
+void FsmCodeGen::LM_ON_LAST( ostream &ret, InlineItem *item )
+{
+	assert( item->longestMatchPart->token != 0 );
+	/* Emit: advance P() by one, send the token, then jump to _resume. */
+	ret << "	" << P() << " += 1;\n";
+	EMIT_TOKEN( ret, item->longestMatchPart->token );
+	ret << "	goto _resume;\n";
+}
+
+void FsmCodeGen::LM_ON_NEXT( ostream &ret, InlineItem *item )
+{
+	assert( item->longestMatchPart->token != 0 );
+	/* Emit: send the token, then jump to _resume. P() is left untouched. */
+	EMIT_TOKEN( ret, item->longestMatchPart->token );
+	ret << "	goto _resume;\n";
+}
+
+void FsmCodeGen::LM_ON_LAG_BEHIND( ostream &ret, InlineItem *item )
+{
+	assert( item->longestMatchPart->token != 0 );
+	/* Emit: set P() back to TOKEND(), send the token, jump to _resume. */
+	ret << "	" << P() << " = " << TOKEND() << ";\n";
+	EMIT_TOKEN( ret, item->longestMatchPart->token );
+	ret << "	goto _resume;\n";
+}
+
+
+/* Write out an inline list. Walks the items in order and calls the emitter
+ * that handles each item type. There is no default case in the switch. */
+void FsmCodeGen::INLINE_LIST( ostream &ret, InlineList *inlineList, 
+		int targState, bool inFinish )
+{
+	for ( InlineList::Iter item = *inlineList; item.lte(); item++ ) {
+		switch ( item->type ) {
+		case InlineItem::Text:
+			assert( false );	/* text items are not expected to reach this generator */
+			break;
+		case InlineItem::LmSetActId:
+			SET_ACT( ret, item );
+			break;
+		case InlineItem::LmSetTokEnd:
+			SET_TOKEND( ret, item );
+			break;
+		case InlineItem::LmInitTokStart:
+			assert( false );	/* NOTE(review): INIT_TOKSTART exists but is not called here -- confirm intended */
+			break;
+		case InlineItem::LmInitAct:
+			INIT_ACT( ret, item );
+			break;
+		case InlineItem::LmSetTokStart:
+			SET_TOKSTART( ret, item );
+			break;
+		case InlineItem::LmSwitch:
+			LM_SWITCH( ret, item, targState, inFinish );
+			break;
+		case InlineItem::LmOnLast:
+			LM_ON_LAST( ret, item );
+			break;
+		case InlineItem::LmOnNext:
+			LM_ON_NEXT( ret, item );
+			break;
+		case InlineItem::LmOnLagBehind:
+			LM_ON_LAG_BEHIND( ret, item );
+			break;
+		}
+	}
+}
+
+/* Escape a path for use in a line directive. Each backslash is doubled,
+ * every other character passes through unchanged. */
+string FsmCodeGen::LDIR_PATH( char *path )
+{
+	string escaped;
+	for ( const char *pc = path; *pc != 0; pc++ ) {
+		if ( *pc == '\\' )
+			escaped += '\\';
+		escaped += *pc;
+	}
+	return escaped;
+}
+
+void FsmCodeGen::ACTION( ostream &ret, GenAction *action, int targState, bool inFinish )
+{
+	/* Emit the action as a brace-delimited block: its inline items first,
+	 * then, for an action with an object field, the store of P() into the
+	 * mark_enter or mark_leave slot at the field's offset. */
+	ret << "\t{";
+	INLINE_LIST( ret, action->inlineList, targState, inFinish );
+
+	ObjField *field = action->objField;
+	if ( field != 0 ) {
+		if ( action->markType == MarkEnter )
+			ret << "mark_enter[" << field->offset << "] = " << P() << ";\n";
+		else if ( action->markType == MarkLeave )
+			ret << "mark_leave[" << field->offset << "] = " << P() << ";\n";
+	}
+	ret << "}\n";
+}
+/* Emit a newline, then the condition's inline items (target state 0). */
+void FsmCodeGen::CONDITION( ostream &ret, GenAction *condition )
+{
+	ret << "\n";
+	INLINE_LIST( ret, condition->inlineList, 0, false );
+}
+
+string FsmCodeGen::ERROR_STATE()
+{
+	/* Id of the error state as text, or "-1" when the machine has none. */
+	if ( redFsm->errState == 0 )
+		return "-1";
+	ostringstream idText;
+	idText << redFsm->errState->id;
+	return idText.str();
+}
+
+string FsmCodeGen::FIRST_FINAL_STATE()
+{
+	ostringstream idText;	/* first final state's id, or nextStateId if none */
+	if ( redFsm->firstFinState == 0 )
+		idText << redFsm->nextStateId;
+	else
+		idText << redFsm->firstFinState->id;
+	return idText.str();
+}
+
+string FsmCodeGen::DATA_PREFIX()
+{
+	/* "<fsm name>_" when the dataPrefix flag is set, otherwise empty. */
+	string prefix = dataPrefix ? FSM_NAME() + "_" : string();
+	return prefix;
+}
+
+/* Name of the alphabet data type: data1, then a space and data2 when set. */
+string FsmCodeGen::ALPH_TYPE()
+{
+	string ret = keyOps->alphType->data1;
+	if ( keyOps->alphType->data2 != 0 ) {
+		ret += " ";
+		ret += keyOps->alphType->data2;
+	}
+	return ret;
+}
+
+/* Name of the data type for widened keys: the alphabet type itself when
+ * redFsm->maxKey fits in it, otherwise a host type that subsumes maxKey. */
+string FsmCodeGen::WIDE_ALPH_TYPE()
+{
+	if ( redFsm->maxKey <= keyOps->maxKey )
+		return ALPH_TYPE();
+
+	long long widest = redFsm->maxKey.getLongLong();
+	HostType *wideType = keyOps->typeSubsumes( keyOps->isSigned, widest );
+	assert( wideType != 0 );
+
+	/* The name is data1, then a space and data2 when data2 is set. */
+	string name = wideType->data1;
+	if ( wideType->data2 != 0 ) {
+		name += " ";
+		name += wideType->data2;
+	}
+	return name;
+}
+
+/* Returns the text "const " (note the trailing space). */
+string FsmCodeGen::PTR_CONST()
+{
+	return "const ";
+}
+
+std::ostream &FsmCodeGen::OPEN_ARRAY( string type, string name )
+{
+	/* Begin an array definition: "static const <type> <name>[] = {". */
+	return out << "static const " << type << " " << name << "[] = {\n";
+}
+/* Emit the "};" line that ends an array definition; returns out. */
+std::ostream &FsmCodeGen::CLOSE_ARRAY()
+{
+	return out << "};\n";
+}
+
+std::ostream &FsmCodeGen::STATIC_VAR( string type, string name )
+{
+	/* Emit "static const <type> <name>"; the caller writes the rest. */
+	return out << "static const " << type << " " << name;
+}
+/* Returns the type name "unsigned int". */
+string FsmCodeGen::UINT( )
+{
+	return "unsigned int";
+}
+/* Returns the expression text "<ptr> + <offset>". */
+string FsmCodeGen::ARR_OFF( string ptr, string offset )
+{
+	return ptr + " + " + offset;
+}
+/* Returns type wrapped in parentheses, i.e. the text of a cast to it. */
+string FsmCodeGen::CAST( string type )
+{
+	return "(" + type + ")";
+}
+
+std::ostream &FsmCodeGen::TO_STATE_ACTION_SWITCH()
+{
+	/* One "case <actionId>:" per action that has to-state references,
+	 * holding the action's code and closed with a break. */
+	for ( GenActionList::Iter act = redFsm->actionList; act.lte(); act++ ) {
+		/* Actions without such references get no case. */
+		if ( act->numToStateRefs <= 0 )
+			continue;
+		out << "\tcase " << act->actionId << ":\n";
+		ACTION( out, act, 0, false );
+		out << "\tbreak;\n";
+	}
+
+	return out;
+}
+
+std::ostream &FsmCodeGen::FROM_STATE_ACTION_SWITCH()
+{
+	/* One "case <actionId>:" per action that has from-state references,
+	 * holding the action's code and closed with a break. */
+	for ( GenActionList::Iter act = redFsm->actionList; act.lte(); act++ ) {
+		/* Actions without such references get no case. */
+		if ( act->numFromStateRefs <= 0 )
+			continue;
+		out << "\tcase " << act->actionId << ":\n";
+		ACTION( out, act, 0, false );
+		out << "\tbreak;\n";
+	}
+
+	return out;
+}
+
+std::ostream &FsmCodeGen::ACTION_SWITCH()
+{
+	/* One "case <actionId>:" per action that has transition references,
+	 * holding the action's code and closed with a break. */
+	for ( GenActionList::Iter act = redFsm->actionList; act.lte(); act++ ) {
+		/* Actions without such references get no case. */
+		if ( act->numTransRefs <= 0 )
+			continue;
+		out << "\tcase " << act->actionId << ":\n";
+		ACTION( out, act, 0, false );
+		out << "\tbreak;\n";
+	}
+
+	return out;
+}
+
+void FsmCodeGen::emitSingleSwitch( RedState *state )
+{
+	/* Emit the tests for the state's single-key transitions: nothing for
+	 * none, an if for exactly one, a switch for several. */
+	const int count = state->outSingle.length();
+	RedTransEl *singles = state->outSingle.data;
+	if ( count < 1 )
+		return;
+
+	if ( count == 1 ) {
+		/* A lone key is compared directly; its goto is the if body. */
+		out << "\tif ( " << GET_WIDE_KEY(state) << " == " << 
+				KEY(singles[0].lowKey) << " )\n\t\t"; 
+		/* Write the target of the transition. */
+		TRANS_GOTO(singles[0].value, 0) << "\n";
+		return;
+	}
+
+	/* Several keys: one case label per key, each followed by its goto. */
+	out << "\tswitch( " << GET_WIDE_KEY(state) << " ) {\n";
+	for ( int k = 0; k < count; k++ ) {
+		out << "\t\tcase " << KEY(singles[k].lowKey) << ": ";
+		TRANS_GOTO(singles[k].value, 0) << "\n";
+	}
+
+	/* Close off the transition switch. */
+	out << "\t}\n";
+}
+
+void FsmCodeGen::emitRangeBSearch( RedState *state, int level, int low, int high )
+{
+	/* Emit nested if/else tests that binary search outRange[low..high] for
+	 * the key, indented by level. Mid stays on the lower end of the range. */
+	int mid = (low + high) >> 1;
+	RedTransEl *data = state->outRange.data;
+	/* Determine if we need to look higher or lower. */
+	bool anyLower = mid > low;
+	bool anyHigher = mid < high;
+
+	/* Determine if the keys at mid are the limits of the alphabet. */
+	bool limitLow = data[mid].lowKey == keyOps->minKey;
+	bool limitHigh = data[mid].highKey == keyOps->maxKey;
+
+	if ( anyLower && anyHigher ) {
+		/* Can go lower and higher than mid. */
+		out << TABS(level) << "if ( " << GET_WIDE_KEY(state) << " < " << 
+				KEY(data[mid].lowKey) << " ) {\n";
+		emitRangeBSearch( state, level+1, low, mid-1 );
+		out << TABS(level) << "} else if ( " << GET_WIDE_KEY(state) << " > " << 
+				KEY(data[mid].highKey) << " ) {\n";
+		emitRangeBSearch( state, level+1, mid+1, high );
+		out << TABS(level) << "} else\n";
+		TRANS_GOTO(data[mid].value, level+1) << "\n";
+	}
+	else if ( anyLower && !anyHigher ) {
+		/* Can go lower than mid but not higher. */
+		out << TABS(level) << "if ( " << GET_WIDE_KEY(state) << " < " << 
+				KEY(data[mid].lowKey) << " ) {\n";
+		emitRangeBSearch( state, level+1, low, mid-1 );
+
+		/* If the higher is the highest in the alphabet then there is no
+		 * sense testing it. */
+		if ( limitHigh ) {
+			out << TABS(level) << "} else\n";
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+		else {
+			out << TABS(level) << "} else if ( " << GET_WIDE_KEY(state) << " <= " << 
+					KEY(data[mid].highKey) << " )\n";
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+	}
+	else if ( !anyLower && anyHigher ) {
+		/* Can go higher than mid but not lower. */
+		out << TABS(level) << "if ( " << GET_WIDE_KEY(state) << " > " << 
+				KEY(data[mid].highKey) << " ) {\n";
+		emitRangeBSearch( state, level+1, mid+1, high );
+
+		/* If the lower end is the lowest in the alphabet then there is no
+		 * sense testing it. */
+		if ( limitLow ) {
+			out << TABS(level) << "} else\n";
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+		else {
+			out << TABS(level) << "} else if ( " << GET_WIDE_KEY(state) << " >= " << 
+					KEY(data[mid].lowKey) << " )\n";
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+	}
+	else {
+		/* Cannot go higher or lower than mid. It's mid or bust. What
+		 * tests to do depends on limits of alphabet. */
+		if ( !limitLow && !limitHigh ) {
+			out << TABS(level) << "if ( " << KEY(data[mid].lowKey) << " <= " << 
+					GET_WIDE_KEY(state) << " && " << GET_WIDE_KEY(state) << " <= " << 
+					KEY(data[mid].highKey) << " )\n";
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+		else if ( limitLow && !limitHigh ) {
+			out << TABS(level) << "if ( " << GET_WIDE_KEY(state) << " <= " << 
+					KEY(data[mid].highKey) << " )\n";
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+		else if ( !limitLow && limitHigh ) {
+			out << TABS(level) << "if ( " << KEY(data[mid].lowKey) << " <= " << 
+					GET_WIDE_KEY(state) << " )\n";
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+		else {
+			/* Both high and low are at the limit. No tests to do. */
+			TRANS_GOTO(data[mid].value, level+1) << "\n";
+		}
+	}
+}
+
+void FsmCodeGen::COND_TRANSLATE( GenStateCond *stateCond, int level )
+{
+	/* Emit the rebasing of the key onto baseKey, then one bump per condition. */
+	GenCondSpace *space = stateCond->condSpace;
+	out << TABS(level) << "_widec = " << CAST(WIDE_ALPH_TYPE()) << "(" <<
+			KEY(space->baseKey) << " + (" << GET_KEY() << 
+			" - " << KEY(keyOps->minKey) << "));\n";
+	for ( GenCondSet::Iter csi = space->condSet; csi.lte(); csi++ ) {
+		out << TABS(level) << "if ( ";
+		CONDITION( out, *csi );
+		Size bump = ((1 << csi.pos()) * keyOps->alphSize());
+		out << " ) _widec += " << bump << ";\n";
+	}
+}
+
+void FsmCodeGen::emitCondBSearch( RedState *state, int level, int low, int high )
+{
+	/* Emit nested if/else tests that binary search stateCondVect[low..high]
+	 * on the plain key; the matching range translates the key to _widec. */
+	int mid = (low + high) >> 1;
+	GenStateCond **data = state->stateCondVect.data;
+	/* Determine if we need to look higher or lower. */
+	bool anyLower = mid > low;
+	bool anyHigher = mid < high;
+
+	/* Determine if the keys at mid are the limits of the alphabet. */
+	bool limitLow = data[mid]->lowKey == keyOps->minKey;
+	bool limitHigh = data[mid]->highKey == keyOps->maxKey;
+
+	if ( anyLower && anyHigher ) {
+		/* Can go lower and higher than mid. */
+		out << TABS(level) << "if ( " << GET_KEY() << " < " << 
+				KEY(data[mid]->lowKey) << " ) {\n";
+		emitCondBSearch( state, level+1, low, mid-1 );
+		out << TABS(level) << "} else if ( " << GET_KEY() << " > " << 
+				KEY(data[mid]->highKey) << " ) {\n";
+		emitCondBSearch( state, level+1, mid+1, high );
+		out << TABS(level) << "} else {\n";
+		COND_TRANSLATE(data[mid], level+1);
+		out << TABS(level) << "}\n";
+	}
+	else if ( anyLower && !anyHigher ) {
+		/* Can go lower than mid but not higher. */
+		out << TABS(level) << "if ( " << GET_KEY() << " < " << 
+				KEY(data[mid]->lowKey) << " ) {\n";
+		emitCondBSearch( state, level+1, low, mid-1 );
+
+		/* If the higher is the highest in the alphabet then there is no
+		 * sense testing it. */
+		if ( limitHigh ) {
+			out << TABS(level) << "} else {\n";
+			COND_TRANSLATE(data[mid], level+1);
+			out << TABS(level) << "}\n";
+		}
+		else {
+			out << TABS(level) << "} else if ( " << GET_KEY() << " <= " << 
+					KEY(data[mid]->highKey) << " ) {\n";
+			COND_TRANSLATE(data[mid], level+1);
+			out << TABS(level) << "}\n";
+		}
+	}
+	else if ( !anyLower && anyHigher ) {
+		/* Can go higher than mid but not lower. */
+		out << TABS(level) << "if ( " << GET_KEY() << " > " << 
+				KEY(data[mid]->highKey) << " ) {\n";
+		emitCondBSearch( state, level+1, mid+1, high );
+
+		/* If the lower end is the lowest in the alphabet then there is no
+		 * sense testing it. */
+		if ( limitLow ) {
+			out << TABS(level) << "} else {\n";
+			COND_TRANSLATE(data[mid], level+1);
+			out << TABS(level) << "}\n";
+		}
+		else {
+			out << TABS(level) << "} else if ( " << GET_KEY() << " >= " << 
+					KEY(data[mid]->lowKey) << " ) {\n";
+			COND_TRANSLATE(data[mid], level+1);
+			out << TABS(level) << "}\n";
+		}
+	}
+	else {
+		/* Cannot go higher or lower than mid. It's mid or bust. What
+		 * tests to do depends on limits of alphabet. */
+		if ( !limitLow && !limitHigh ) {
+			out << TABS(level) << "if ( " << KEY(data[mid]->lowKey) << " <= " << 
+					GET_KEY() << " && " << GET_KEY() << " <= " << 
+					KEY(data[mid]->highKey) << " ) {\n";
+			COND_TRANSLATE(data[mid], level+1);
+			out << TABS(level) << "}\n";
+		}
+		else if ( limitLow && !limitHigh ) {
+			out << TABS(level) << "if ( " << GET_KEY() << " <= " << 
+					KEY(data[mid]->highKey) << " ) {\n";
+			COND_TRANSLATE(data[mid], level+1);
+			out << TABS(level) << "}\n";
+		}
+		else if ( !limitLow && limitHigh ) {
+			/* Brace then newline, the same layout as every other branch. */
+			out << TABS(level) << "if ( " << KEY(data[mid]->lowKey) << " <= " << 
+					GET_KEY() << " ) {\n";
+			COND_TRANSLATE(data[mid], level+1);
+			out << TABS(level) << "}\n";
+		}
+		else {
+			COND_TRANSLATE(data[mid], level);	/* both ends at the limits: no test */
+		}
+	}
+}
+
+std::ostream &FsmCodeGen::STATE_GOTOS()
+{
+	/* Emit the transition code of every state, in state list order. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		/* The error state is written by its own emitter. */
+		if ( st == redFsm->errState ) {
+			STATE_GOTO_ERROR();
+			continue;
+		}
+		/* Writing code above state gotos. */
+		GOTO_HEADER( st );
+
+		/* A state with conditions first translates the key into _widec. */
+		if ( st->stateCondVect.length() > 0 ) {
+			out << "	_widec = " << GET_KEY() << ";\n";
+			emitCondBSearch( st, 1, 0, st->stateCondVect.length() - 1 );
+		}
+
+		/* Single keys are tried first, then the ranges by binary search,
+		 * and last comes the goto for the default transition. */
+		if ( st->outSingle.length() > 0 )
+			emitSingleSwitch( st );
+		if ( st->outRange.length() > 0 )
+			emitRangeBSearch( st, 1, 0, st->outRange.length() - 1 );
+		TRANS_GOTO( st->defTrans, 1 ) << "\n";
+	}
+	return out;
+}
+
+unsigned int FsmCodeGen::TO_STATE_ACTION( RedState *state )
+{
+	/* Zero when there is no to-state action, else its location plus one. */
+	if ( state->toStateAction == 0 )
+		return 0;
+	int act = state->toStateAction->location+1;
+	return act;
+}
+
+unsigned int FsmCodeGen::FROM_STATE_ACTION( RedState *state )
+{
+	/* Zero when there is no from-state action, else its location plus one. */
+	if ( state->fromStateAction == 0 )
+		return 0;
+	int act = state->fromStateAction->location+1;
+	return act;
+}
+
+std::ostream &FsmCodeGen::TO_STATE_ACTIONS()
+{
+	/* One to-state value per state id, IALL per line; sized by nextStateId. */
+	int numStates = redFsm->nextStateId;
+	unsigned int *vals = new unsigned int[numStates];
+	memset( vals, 0, sizeof(unsigned int)*numStates );
+
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ )
+		vals[st->id] = TO_STATE_ACTION(st);
+
+	out << "\t";
+	for ( int st = 0; st < numStates; st++ ) {
+		/* An id no state carries keeps the zero from the memset. */
+		out << vals[st];
+		if ( st < numStates-1 ) {
+			out << ", ";
+			if ( (st+1) % IALL == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n";
+	delete[] vals;
+	return out;
+}
+
+std::ostream &FsmCodeGen::FROM_STATE_ACTIONS()
+{
+	/* One from-state value per state id, IALL per line; sized by nextStateId. */
+	int numStates = redFsm->nextStateId;
+	unsigned int *vals = new unsigned int[numStates];
+	memset( vals, 0, sizeof(unsigned int)*numStates );
+
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ )
+		vals[st->id] = FROM_STATE_ACTION(st);
+
+	out << "\t";
+	for ( int st = 0; st < numStates; st++ ) {
+		/* An id no state carries keeps the zero from the memset. */
+		out << vals[st];
+		if ( st < numStates-1 ) {
+			out << ", ";
+			if ( (st+1) % IALL == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n";
+	delete[] vals;
+	return out;
+}
+
+bool FsmCodeGen::IN_TRANS_ACTIONS( RedState *state )
+{
+	/* Emit a "tr<id>:" block for each in-transition of the state that has
+	 * an action and needs a label. Always returns false. */
+	for ( int it = 0; it < state->numInTrans; it++ ) {
+		RedTrans *trans = state->inTrans[it];
+		if ( trans->action == 0 || !trans->labelNeeded )
+			continue;
+
+		/* Write the label for the transition so it can be jumped to. */
+		out << "tr" << trans->id << ":\n";
+
+		/* If the action contains a next, then we must preload the current
+		 * state since the action may or may not set it. */
+		if ( trans->action->anyNextStmt() )
+			out << "	" << CS() << " = " << trans->targ->id << ";\n";
+
+		/* Write the actions in table order, then go on to the target. */
+		for ( GenActionTable::Iter item = trans->action->key; item.lte(); item++ )
+			ACTION( out, item->value, trans->targ->id, false );
+		out << "\tgoto st" << trans->targ->id << ";\n";
+	}
+	return false;
+}
+
+/* Called from FsmCodeGen::STATE_GOTOS just before writing the gotos for each
+ * state. Emits everything that precedes the state's key tests. */
+void FsmCodeGen::GOTO_HEADER( RedState *state )
+{
+	IN_TRANS_ACTIONS( state );
+	/* The st<id> label, written only when the state was flagged as needing one. */
+	if ( state->labelNeeded ) 
+		out << "st" << state->id << ":\n";
+
+	if ( state->toStateAction != 0 ) {
+		/* Write every to-state action in the list, ahead of the case label. */
+		for ( GenActionTable::Iter item = state->toStateAction->key; item.lte(); item++ )
+			ACTION( out, item->value, state->id, false );
+	}
+
+	/* Give the state a switch case. */
+	out << "case " << state->id << ":\n";
+
+	/* Advance and test buffer pos: at PE() control goes to out<id>. */
+	out <<
+		"	if ( ++" << P() << " == " << PE() << " )\n"
+		"		goto out" << state->id << ";\n";
+
+	if ( state->fromStateAction != 0 ) {
+		/* Write every from-state action in the list, after the advance. */
+		for ( GenActionTable::Iter item = state->fromStateAction->key; item.lte(); item++ )
+			ACTION( out, item->value, state->id, false );
+	}
+
+	/* Record the prev state if necessary. */
+	if ( state->anyRegCurStateRef() )
+		out << "	_ps = " << state->id << ";\n";
+}
+
+void FsmCodeGen::STATE_GOTO_ERROR()
+{
+	/* STATE_GOTOS skips GOTO_HEADER for the error state, so the parts of
+	 * the header it still needs are emitted here directly. */
+	RedState *err = redFsm->errState;
+	IN_TRANS_ACTIONS( err );
+
+	/* Its label, when the state was flagged as needing one. */
+	if ( err->labelNeeded ) 
+		out << "st" << err->id << ":\n";
+
+	/* We do not need a case label here because the error state is checked
+	 * at the head of the loop. All the state does is leave through its
+	 * exit label. */
+	out << "	goto out" << err->id << ";\n";
+}
+
+
+/* Emit the goto to take for a given transition, indented by level tabs.
+ * Returns out so the caller can append to the same line. */
+std::ostream &FsmCodeGen::TRANS_GOTO( RedTrans *trans, int level )
+{
+	out << TABS(level);
+	/* Without an action go directly to the target state; with one go to
+	 * the transition's own label first. */
+	if ( trans->action == 0 )
+		out << "goto st" << trans->targ->id << ";";
+	else
+		out << "goto tr" << trans->id << ";";
+	return out;
+}
+
+std::ostream &FsmCodeGen::EXIT_STATES()
+{
+	/* For every state emit "case N: outN:". A state with an eof transition
+	 * takes it when PE() equals PEOF(); otherwise N is stored in cs. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		out << "	case " << st->id << ": out" << st->id << ": ";
+		if ( st->eofTrans != 0 ) {
+			out << "if ( " << PE() << " == " << PEOF() << " ) {";
+			TRANS_GOTO( st->eofTrans, 0 ) << "\n" << "}";
+		}
+
+		/* Exit. */
+		out << CS() << " = " << st->id << "; goto out; \n";
+	}
+	return out;
+}
+
+/* Set up the labelNeeded flag of each state, and outNeeded to match it. */
+void FsmCodeGen::setLabelsNeeded()
+{
+	/* Start from no labels at all. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ )
+		st->labelNeeded = false;
+
+	/* The error state gets one when anyLmSwitchError() reports true. */
+	if ( redFsm->errState != 0 && redFsm->anyLmSwitchError() )
+		redFsm->errState->labelNeeded = true;
+
+	/* A transition's target needs its label unless the transition has an
+	 * action that contains a next statement. */
+	for ( RedTransSet::Iter trans = redFsm->transSet; trans.lte(); trans++ ) {
+		if ( trans->action != 0 && trans->action->anyNextStmt() )
+			continue;
+		trans->targ->labelNeeded = true;
+	}
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ )
+		st->outNeeded = st->labelNeeded;
+}
+
+void FsmCodeGen::writeData()
+{
+	/* Emit the static data: state constants, entry table, FsmTables record. */
+	out << "static const int " << START() << " = " << START_STATE_ID() << ";\n";
+	out << "static const int " << FIRST_FINAL() << " = " << FIRST_FINAL_STATE() << ";\n";
+	out << "static const int " << ERROR() << " = " << ERROR_STATE() << ";\n";
+	out << "\n";
+	out << "long " << entryByRegion() << "[] = {\n\t";
+	for ( int i = 0; i < fsmTables->numRegions; i++ ) {
+		out << fsmTables->entryByRegion[i];
+
+		if ( i < fsmTables->numRegions-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+	/* Initializer values are positional; the comments name each field. */
+	out <<
+		"FsmTables fsmTables_start =\n"
+		"{\n"
+		"	0, "       /* actions */
+		" 0, "         /* keyOffsets */
+		" 0, "         /* transKeys */
+		" 0, "         /* singleLengths */
+		" 0, "         /* rangeLengths */
+		" 0, "         /* indexOffsets */
+		" 0, "         /* transTargsWI */
+		" 0, "         /* transActionsWI */
+		" 0, "         /* toStateActions */
+		" 0, "         /* fromStateActions */
+		" 0, "         /* eofActions */
+		" 0,\n"        /* eofTargs */
+		"	" << entryByRegion() << ",\n"
+
+		"\n"
+		"	0, "       /* numStates */
+		" 0, "         /* numActions */
+		" 0, "         /* numTransKeys */
+		" 0, "         /* numSingleLengths */
+		" 0, "         /* numRangeLengths */
+		" 0, "         /* numIndexOffsets */
+		" 0, "         /* numTransTargsWI */
+		" 0,\n"        /* numTransActionsWI */
+		"	" << redFsm->regionToEntry.length() << ",\n"
+		"\n"
+		"	" << START() << ",\n"
+		"	" << FIRST_FINAL() << ",\n"
+		"	" << ERROR() << ",\n"
+		"\n"
+		"	0,\n"      /* actionSwitch */
+		"	0\n"       /* numActionSwitch */
+		"};\n"
+		"\n";
+}
+
+void FsmCodeGen::writeInit()
+{
+	/* Emit the initialisation of the run variables. The current state
+	 * begins at the start state. */
+	out << "	" << CS() << " = " << START() << ";\n";
+	
+	/* If there are any calls, then the stack top needs initialization. */
+	if ( redFsm->anyActionCalls() || redFsm->anyActionRets() )
+		out << "\t" << TOP() << " = 0;\n";
+
+	/* Token start, token end and act all begin at zero. */
+	out << "	" << TOKSTART() << " = 0;\n";
+	out << "	" << TOKEND() << " = 0;\n";
+	out << "	" << ACT() << " = 0;\n";
+	out << "\n";
+}
+
+void FsmCodeGen::writeExec()
+{
+	setLabelsNeeded();
+	/* Emit the definition of FsmRun::execute(), beginning at _resume. */
+	out <<
+		"void FsmRun::execute()\n"
+		"{\n"
+		"_resume:\n";
+	/* With an error state present, being in it leaves the function at once. */
+	if ( redFsm->errState != 0 ) {
+		out <<
+			"	if ( " << CS() << " == " << redFsm->errState->id << " )\n"
+			"		goto out;\n";
+	}
+	/* P() is backed up by one since the code GOTO_HEADER emits starts with "++". */
+	out <<
+		"	if ( p == pe )\n"	/* NOTE(review): literal p/pe here, not P()/PE() */
+		"		goto out_switch;\n"
+		"	--" << P() << ";\n"
+		"\n"
+		"	switch ( " << CS() << " )\n	{\n";
+		STATE_GOTOS() << 	/* a new statement: the ';' above ended the previous one */
+		"	}\n";
+
+	out << 
+		"out_switch:\n"
+		"	switch ( " << CS() << " )\n	{\n";
+	EXIT_STATES() <<
+		"	}\n";
+
+	out <<
+		"	out: {}\n"
+		"}\n"
+		"\n";
+}
+
+void FsmCodeGen::writeCode()
+{
+	/* Produce the complete generated file: the includes, the data, the
+	 * execute function and a main() that runs the program. */
+	redFsm->depthFirstOrdering();
+
+	out << "#include <stdio.h>\n";
+	out << "#include <stdlib.h>\n";
+	out << "#include <string.h>\n";
+	out << "#include \"config.h\"\n";
+	out << "\n" "\n";
+
+	writeData();
+	writeExec();
+
+	out << "int main( int argc, char **argv )\n";
+	out << "{\n";
+	out << "	Program program( true, &main_runtimeData );\n";
+	out << "	program.freshGlobal();\n";
+	out << "	program.run();\n";
+	out << "	program.clear();\n";
+	out << "	return 0;\n";
+	out << "}\n";
+	out << "\n";
+
+	/* Flush what has been written to the stream. */
+	out.flush();
+}
+
+ostream &FsmCodeGen::source_warning( const InputLoc &loc )
+{
+	/* Start a "<file>:<line>:<col>: warning: " message on cerr. */
+	return cerr << sourceFileName << ":" << loc.line << ":" << loc.col << ": warning: ";
+}
+
+ostream &FsmCodeGen::source_error( const InputLoc &loc )
+{
+	/* Count the error, then start a "<file>:<line>:<col>: " message on cerr. */
+	codeGenErrCount += 1;
+	assert( sourceFileName != 0 );
+	return cerr << sourceFileName << ":" << loc.line << ":" << loc.col << ": ";
+}
+
+
diff --git a/colm/fsmcodegen.h b/colm/fsmcodegen.h
new file mode 100644
index 00000000..ff804e88
--- /dev/null
+++ b/colm/fsmcodegen.h
@@ -0,0 +1,214 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _FSMCODEGEN_H
+#define _FSMCODEGEN_H
+
+#include <iostream>
+#include <string>
+#include <stdio.h>
+#include "common.h"
+#include "parsedata.h"
+#include "redfsm.h"
+
+using std::string;
+using std::ostream;
+
+/* Integer array line length. */
+#define IALL 8
+
+/* Forwards. */
+struct RedFsm;
+struct RedState;
+struct GenAction;
+struct NameInst;
+struct RedAction;
+struct LongestMatch;
+struct TokenDef;
+struct InlineList;
+struct InlineItem;
+struct FsmRun;
+struct NameInst;
+struct FsmCodeGen;
+
+typedef unsigned long ulong;
+typedef unsigned char uchar;
+
+
+/*
+ * The interface to the parser
+ */
+
+std::ostream *openOutput( char *inputFile );
+
+inline string itoa( int i )
+{
+	char buf[32]; /* room for a 64-bit value with sign and terminator */
+	snprintf( buf, sizeof(buf), "%i", i ); /* bounded: cannot write past buf */
+	return buf;
+}
+
+/*
+ * class FsmCodeGen
+ */
+class FsmCodeGen
+{
+public:
+	FsmCodeGen( const char *sourceFileName, const char *fsmName, ostream &out, 
+			RedFsm *redFsm, FsmTables *fsmTables );
+
+protected:
+	string FSM_NAME();
+	string START_STATE_ID();
+	ostream &ACTIONS_ARRAY();
+	string GET_WIDE_KEY();
+	string GET_WIDE_KEY( RedState *state );
+	string TABS( int level );
+	string KEY( Key key );
+	string LDIR_PATH( char *path );
+	void ACTION( ostream &ret, GenAction *action, int targState, bool inFinish );
+	void CONDITION( ostream &ret, GenAction *condition );
+	string ALPH_TYPE();
+	string WIDE_ALPH_TYPE();
+	string ARRAY_TYPE( unsigned long maxVal );
+
+	string ARR_OFF( string ptr, string offset );
+	string CAST( string type );
+	string UINT();
+	string GET_KEY();
+	/* Prefix for every run-time variable name below; currently empty. */
+	string ACCESS() { return ""; }
+
+	string P() { return ACCESS() + "p"; }
+	string PE() { return ACCESS() + "pe"; }
+	string PEOF() { return ACCESS() + "peof"; }
+
+	string BUF() { return ACCESS() + "buf"; }
+	string HAVE() { return ACCESS() + "have"; }
+	string IGNLEN() { return ACCESS() + "ignlen"; }
+
+	string CS();
+	string STACK() { return ACCESS() + "stack"; }
+	string TOP() { return ACCESS() + "top"; }
+	string TOKSTART() { return ACCESS() + "tokstart"; }
+	string TOKEND() { return ACCESS() + "tokend"; }
+	string ACT() { return ACCESS() + "act"; }
+
+	string DATA_PREFIX();
+	/* Names of generated data items, each built on DATA_PREFIX(). */
+	string START() { return DATA_PREFIX() + "start"; }
+	string ERROR() { return DATA_PREFIX() + "error"; }
+	string FIRST_FINAL() { return DATA_PREFIX() + "first_final"; }
+
+	string entryByRegion() { return DATA_PREFIX() + "entryByRegion"; }
+
+	/* Emitters that take a stream as ret (definitions not in this header). */
+	void INLINE_LIST( ostream &ret, InlineList *inlineList, 
+		int targState, bool inFinish );
+	void EXEC_TOKEND( ostream &ret, InlineItem *item, int targState, int inFinish );
+	void EXECTE( ostream &ret, InlineItem *item, int targState, int inFinish );
+	void LM_SWITCH( ostream &ret, InlineItem *item, int targState, int inFinish );
+	void SET_ACT( ostream &ret, InlineItem *item );
+	void INIT_TOKSTART( ostream &ret, InlineItem *item );
+	void INIT_ACT( ostream &ret, InlineItem *item );
+	void SET_TOKSTART( ostream &ret, InlineItem *item );
+	void SET_TOKEND( ostream &ret, InlineItem *item );
+	void GET_TOKEND( ostream &ret, InlineItem *item );
+	void SUB_ACTION( ostream &ret, InlineItem *item, int targState, bool inFinish );
+	void LM_ON_LAST( ostream &ret, InlineItem *item );
+	void LM_ON_NEXT( ostream &ret, InlineItem *item );
+	void LM_ON_LAG_BEHIND( ostream &ret, InlineItem *item );
+	void EXEC_TOKEND( ostream &ret );
+	void EMIT_TOKEN( ostream &ret, KlangEl *token );
+
+	string ERROR_STATE();
+	string FIRST_FINAL_STATE();
+
+	string PTR_CONST();
+	ostream &OPEN_ARRAY( string type, string name );
+	ostream &CLOSE_ARRAY();
+	ostream &STATIC_VAR( string type, string name );
+
+	string CTRL_FLOW();
+
+	ostream &source_warning(const InputLoc &loc);
+	ostream &source_error(const InputLoc &loc);
+
+	unsigned int arrayTypeSize( unsigned long maxVal );
+
+/* subclass */
+
+public:
+	const char *sourceFileName;
+	const char *fsmName;
+	ostream &out;
+	RedFsm *redFsm;
+	FsmTables *fsmTables;
+	int codeGenErrCount; /* incremented by source_error() */
+
+	/* Write options. */
+	bool dataPrefix;
+	bool writeFirstFinal;
+	bool writeErr;
+
+	std::ostream &TO_STATE_ACTION_SWITCH();
+	std::ostream &FROM_STATE_ACTION_SWITCH();
+	std::ostream &ACTION_SWITCH();
+	std::ostream &STATE_GOTOS();
+	std::ostream &TRANSITIONS();
+	std::ostream &EXEC_FUNCS();
+
+	unsigned int TO_STATE_ACTION( RedState *state );
+	unsigned int FROM_STATE_ACTION( RedState *state );
+
+	std::ostream &TO_STATE_ACTIONS();
+	std::ostream &FROM_STATE_ACTIONS();
+
+	void COND_TRANSLATE( GenStateCond *stateCond, int level );
+	void emitCondBSearch( RedState *state, int level, int low, int high );
+	void STATE_CONDS( RedState *state, bool genDefault ); 
+
+	void emitSingleSwitch( RedState *state );
+	void emitRangeBSearch( RedState *state, int level, int low, int high );
+
+	std::ostream &EXIT_STATES();
+	std::ostream &TRANS_GOTO( RedTrans *trans, int level );
+	std::ostream &FINISH_CASES();
+
+	void writeData();
+	void writeInit();
+	void writeExec();
+	void writeCode();
+
+protected:
+	bool useAgainLabel();
+
+	/* Called from GotoCodeGen::STATE_GOTOS just before writing the gotos for
+	 * each state. */
+	bool IN_TRANS_ACTIONS( RedState *state );
+	void GOTO_HEADER( RedState *state );
+	void STATE_GOTO_ERROR();
+
+	/* Set up labelNeeded flag for each state. */
+	void setLabelsNeeded();
+};
+
+#endif /* _FSMCODEGEN_H */
diff --git a/colm/fsmexec.cpp b/colm/fsmexec.cpp
new file mode 100644
index 00000000..80370890
--- /dev/null
+++ b/colm/fsmexec.cpp
@@ -0,0 +1,209 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <string.h>
+#include <iostream>
+
+#include "config.h"
+#include "fsmrun.h"
+#include "redfsm.h"
+#include "parsedata.h"
+#include "parsetree.h"
+#include "pdarun.h"
+#include "colm.h"
+
+void FsmRun::execAction( GenAction *genAction )
+{
+	for ( InlineList::Iter item = *genAction->inlineList; item.lte(); item++ ) {
+		switch ( item->type ) {
+		case InlineItem::Text:
+			assert(false); /* this item type is not expected here */
+			break;
+		case InlineItem::LmSetActId:
+			act = item->longestMatchPart->longestMatchId;
+			break;
+		case InlineItem::LmSetTokEnd:
+			tokend = p + 1;
+			break;
+		case InlineItem::LmInitTokStart:
+			assert(false); /* this item type is not expected here */
+			break;
+		case InlineItem::LmInitAct:
+			act = 0;
+			break;
+		case InlineItem::LmSetTokStart:
+			tokstart = p;
+			break;
+		case InlineItem::LmSwitch:
+			/* If the switch handles error then we also forced the error state. It
+			 * will exist. */
+			p = tokend;
+			if ( item->tokenRegion->lmSwitchHandlesError && act == 0 ) {
+				p = tokstart;
+				cs = tables->errorState;
+			}
+			else {
+				for ( TokenDefList::Iter lmi = item->tokenRegion->tokenDefList; 
+						lmi.lte(); lmi++ )
+				{
+					if ( lmi->inLmSelect && act == lmi->longestMatchId )
+						emitToken( lmi->token );
+				}
+			}
+			gotoResume = true; /* execute() jumps to _resume when this is set */
+			break;
+		case InlineItem::LmOnLast:
+			p += 1;
+			emitToken( item->longestMatchPart->token );
+			gotoResume = true;
+			break;
+		case InlineItem::LmOnNext:
+			emitToken( item->longestMatchPart->token );
+			gotoResume = true;
+			break;
+		case InlineItem::LmOnLagBehind:
+			p = tokend;
+			emitToken( item->longestMatchPart->token );
+			gotoResume = true;
+			break;
+		}
+	}
+	/* An action with an object field also records p as an enter or leave mark. */
+	if ( genAction->objField ) {
+		ObjField *field = genAction->objField;
+		if ( genAction->markType == MarkEnter )
+			mark_enter[field->offset] = p;
+		else if ( genAction->markType == MarkLeave )
+			mark_leave[field->offset] = p;
+	}
+}
+
+void FsmRun::execute()
+{
+	int _klen;
+	unsigned int _trans;
+	const long *_acts;
+	unsigned int _nacts;
+	const char *_keys;
+	/* Leave at once when in the error state or when p has reached pe. */
+_resume:
+	if ( cs == tables->errorState )
+		goto out;
+
+	if ( p == pe )
+		goto out;
+	/* Run the from-state actions; the first entry of an action list is its length. */
+_loop_head:
+	_acts = tables->actions + tables->fromStateActions[cs];
+	_nacts = (unsigned int) *_acts++;
+	while ( _nacts-- > 0 )
+		execAction( tables->actionSwitch[*_acts++] );
+	/* Locate this state's keys and the index of its first transition. */
+	_keys = tables->transKeys + tables->keyOffsets[cs];
+	_trans = tables->indexOffsets[cs];
+	/* Binary search the state's single keys for *p. */
+	_klen = tables->singleLengths[cs];
+	if ( _klen > 0 ) {
+		const char *_lower = _keys;
+		const char *_mid;
+		const char *_upper = _keys + _klen - 1;
+		while (1) {
+			if ( _upper < _lower )
+				break;
+
+			_mid = _lower + ((_upper-_lower) >> 1);
+			if ( (*p) < *_mid )
+				_upper = _mid - 1;
+			else if ( (*p) > *_mid )
+				_lower = _mid + 1;
+			else {
+				_trans += (_mid - _keys);
+				goto _match;
+			}
+		}
+		_keys += _klen;
+		_trans += _klen;
+	}
+	/* No single key matched: binary search the (low, high) range pairs. */
+	_klen = tables->rangeLengths[cs];
+	if ( _klen > 0 ) {
+		const char *_lower = _keys;
+		const char *_mid;
+		const char *_upper = _keys + (_klen<<1) - 2;
+		while (1) {
+			if ( _upper < _lower )
+				break;
+
+			_mid = _lower + (((_upper-_lower) >> 1) & ~1);
+			if ( (*p) < _mid[0] )
+				_upper = _mid - 2;
+			else if ( (*p) > _mid[1] )
+				_lower = _mid + 2;
+			else {
+				_trans += ((_mid - _keys)>>1);
+				goto _match;
+			}
+		}
+		_trans += _klen;
+	}
+	/* On a miss _trans has been advanced past every single and range entry. */
+_match:
+	cs = tables->transTargsWI[_trans];
+
+	if ( tables->transActionsWI[_trans] == 0 )
+		goto _again;
+	/* Transition actions may set gotoResume, which restarts at _resume. */
+	gotoResume = false;
+	_acts = tables->actions + tables->transActionsWI[_trans];
+	_nacts = (unsigned int) *_acts++;
+	while ( _nacts-- > 0 )
+		execAction( tables->actionSwitch[*_acts++] );
+	if ( gotoResume )
+		goto _resume;
+	/* Run the to-state actions of the state just entered. */
+_again:
+	_acts = tables->actions + tables->toStateActions[cs];
+	_nacts = (unsigned int) *_acts++;
+	while ( _nacts-- > 0 )
+		execAction( tables->actionSwitch[*_acts++] );
+
+	if ( cs == tables->errorState )
+		goto out;
+	/* Advance p and keep looping until it reaches pe. */
+	if ( ++p != pe )
+		goto _loop_head;
+out:
+	if ( p == peof ) {
+		gotoResume = false;
+		_acts = tables->actions + tables->eofActions[cs];
+		_nacts = (unsigned int) *_acts++;
+		/* cs moves to the eof target, if any, before the eof actions run. */
+		if ( tables->eofTargs[cs] >= 0 )
+			cs = tables->eofTargs[cs];
+
+		while ( _nacts-- > 0 )
+			execAction( tables->actionSwitch[*_acts++] );
+		if ( gotoResume )
+			goto _resume;
+	}
+}
+
+
diff --git a/colm/fsmgraph.cpp b/colm/fsmgraph.cpp
new file mode 100644
index 00000000..6b955ad6
--- /dev/null
+++ b/colm/fsmgraph.cpp
@@ -0,0 +1,1399 @@
+/*
+ *  Copyright 2001, 2002, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <assert.h>
+#include <iostream>
+
+#include "config.h"
+#include "fsmgraph.h"
+#include "mergesort.h"
+
+using std::cerr;
+using std::endl;
+
+/* Make a new state. It is appended to the misfit list when misfit accounting
+ * is enabled, otherwise to the graph's list of states. */
+FsmState *FsmGraph::addState()
+{
+	FsmState *fresh = new FsmState();
+
+	/* A brand-new state has no foreign in transitions, so while misfit
+	 * accounting is on it is placed on the misfit list; otherwise it goes
+	 * straight onto the main state list. */
+	if ( !misfitAccounting ) {
+		stateList.append( fresh );
+	}
+	else {
+		misfitList.append( fresh );
+	}
+
+	/* The caller gets the state already linked into one of the lists. */
+	return fresh;
+}
+
+/* Construct an FSM that is the concatenation of an array of characters. A new
+ * machine will be made that has len+1 states with one transition between each
+ * state for each integer in str. IsSigned determines if the integers are to
+ * be considered as signed or unsigned ints. */
+void FsmGraph::concatFsm( Key *str, int len )
+{
+	/* The chain begins at a fresh state, which becomes the start state. */
+	FsmState *tail = addState();
+	setStartState( tail );
+
+	/* Extend the chain by one state per key, linked on exactly that key. */
+	for ( int pos = 0; pos < len; pos++ ) {
+		FsmState *next = addState();
+		attachNewTrans( tail, next, str[pos], str[pos] );
+		tail = next;
+	}
+
+	/* Whichever state ends the chain is made final. */
+	setFinState( tail );
+}
+
+/* Case insensitive version of concatFsm. */
+void FsmGraph::concatFsmCI( Key *str, int len )
+{
+	/* Make the first state and set it as the start state. */
+	FsmState *last = addState();
+	setStartState( last );
+
+	/* Attach subsequent states, one per position in str. */
+	for ( int i = 0; i < len; i++ ) {
+		FsmState *newState = addState();
+		/* Collect the key itself plus its other-case counterpart, if any. */
+		KeySet keySet;
+		if ( str[i].isLower() )
+			keySet.insert( str[i].toUpper() );
+		if ( str[i].isUpper() )
+			keySet.insert( str[i].toLower() );
+		keySet.insert( str[i] );
+		/* Separate index: reusing `i` here would shadow the position in str. */
+		for ( int k = 0; k < keySet.length(); k++ )
+			attachNewTrans( last, newState, keySet[k], keySet[k] );
+
+		last = newState;
+	}
+
+	/* Make the last state the final state. */
+	setFinState( last );
+}
+
+/* Construct a machine that matches one character.  A new machine will be made
+ * that has two states with a single transition between the states. IsSigned
+ * determines if the integers are to be considered as signed or unsigned ints. */
+void FsmGraph::concatFsm( Key chr )
+{
+	/* First state: the start state. Second state: the final state. */
+	FsmState *begin = addState();
+	setStartState( begin );
+	FsmState *accept = addState();
+	setFinState( accept );
+
+	/* A single transition on chr joins the two. */
+	attachNewTrans( startState, accept, chr, chr );
+}
+
+/* Construct a machine that matches any character in set.  A new machine will
+ * be made that has two states and len transitions between them. The set
+ * should be ordered correctly according to KeyOps and should not contain
+ * any duplicates. */
+void FsmGraph::orFsm( Key *set, int len )
+{
+	/* A start state and a distinct final state. */
+	setStartState( addState() );
+	FsmState *accept = addState();
+	setFinState( accept );
+
+	/* Callers must pass strictly increasing keys; checked by assert. */
+	for ( int next = 1; next < len; next++ )
+		assert( set[next-1] < set[next] );
+
+	/* One single-key transition from start to final per set member. */
+	for ( int pos = 0; pos < len; pos++ )
+		attachNewTrans( startState, accept, set[pos], set[pos] );
+}
+
+/* Construct a machine that matches a range of characters.  A new machine will
+ * be made with two states and a range transition between them. The range will
+ * match any characters from low to high inclusive. Low should be less than or
+ * equal to high otherwise undefined behaviour results.  IsSigned determines
+ * if the integers are to be considered as signed or unsigned ints. */
+void FsmGraph::rangeFsm( Key low, Key high )
+{
+	/* A start state and a distinct final state. */
+	FsmState *begin = addState();
+	setStartState( begin );
+	FsmState *accept = addState();
+	setFinState( accept );
+
+	/* One transition covering low through high joins them. */
+	attachNewTrans( startState, accept, low, high );
+}
+
+/* Construct a machine that matches a repeated range of characters.  */
+void FsmGraph::rangeStarFsm( Key low, Key high)
+{
+	/* A lone state serves as both the start state and a final state. */
+	FsmState *only = addState();
+	setStartState( only );
+	setFinState( startState );
+	/* Loop from the start state back to itself on low through high. */
+	attachNewTrans( startState, startState, low, high );
+}
+
+/* Construct a machine that matches the empty string.  A new machine will be
+ * made with only one state. The new state will be both a start and final
+ * state. IsSigned determines if the machine has a signed or unsigned
+ * alphabet. Fsm operations must be done on machines with the same alphabet
+ * signedness. */
+void FsmGraph::lambdaFsm( )
+{
+	/* One state, no transitions: it is both the start and a final state. */
+	FsmState *only = addState();
+	setStartState( only );
+	setFinState( startState );
+}
+
+/* Construct a machine that matches nothing at all. A new machine will be
+ * made with only one state. It will not be final. */
+void FsmGraph::emptyFsm( )
+{
+	/* One start state, no transitions; this function does not mark it final. */
+	FsmState *only = addState();
+	setStartState( only );
+}
+
+void FsmGraph::transferOutData( FsmState *destState, FsmState *srcState )
+{
+	/* Apply src's out actions and out priorities to dest's transitions. */
+	for ( TransList::Iter tr = destState->outList; tr.lte(); tr++ ) {
+		/* A transition without a target state is left untouched. */
+		if ( tr->toState == 0 )
+			continue;
+
+		tr->actionTable.setActions( srcState->outActionTable );
+		tr->priorTable.setPriors( srcState->outPriorTable );
+	}
+}
+
+/* Kleene star operator. Makes this machine the kleene star of itself. Any
+ * transitions made going out of the machine and back into itself will be
+ * notified that they are leaving transitions by having the leavingFromState
+ * callback invoked. */
+void FsmGraph::starOp( )
+{
+	/* Scratch data shared by every merge below. */
+	MergeData md;
+
+	/* The old start state may end up a misfit, so account for misfits. */
+	setMisfitAccounting( true );
+
+	/* Install a fresh start state. It is only marked final once the final
+	 * states have been merged with it. */
+	FsmState *oldStart = startState;
+	unsetStartState();
+	setStartState( addState() );
+
+	/* Merge the new start state with the old one so that it is isolated. */
+	mergeStates( md, startState, oldStart );
+
+	/* First pass: merge the start state into every final state other than
+	 * the start state itself. Were a final start state merged with itself
+	 * here, its transitions would be doubled up and then transferred to
+	 * whichever final states follow it in the final state set, making the
+	 * result depend on the order of that set. The self merge is therefore
+	 * left for a second pass. */
+	for ( StateSet::Iter fin = finStateSet; fin.lte(); fin++ ) {
+		if ( *fin != startState )
+			mergeStatesLeaving( md, *fin, startState );
+	}
+
+	/* Second pass: the self merge is safe now, and is only done when the
+	 * start state is final. */
+	if ( startState->isFinState() )
+		mergeStatesLeaving( md, startState, startState );
+
+	/* In every case the start state ends up final. */
+	setFinState( startState );
+
+	/* Fill in the states that were created as combinations of others. */
+	fillInStates( md );
+
+	/* Drop the misfits, then switch the accounting back off. */
+	removeMisfits();
+	setMisfitAccounting( false );
+}
+
+void FsmGraph::repeatOp( int times )
+{
+	/* Zero repeats would be the null machine, which needs this deleted. */
+	assert( times > 0 );
+
+	/* One repetition is the machine exactly as it stands. */
+	if ( times == 1 )
+		return;
+
+	/* Pristine copy of this machine, taken before anything is appended. */
+	FsmGraph *pristine = new FsmGraph( *this );
+
+	/* Append times-2 fresh duplicates; doConcat deletes each one. */
+	for ( int copyNo = 2; copyNo < times; copyNo++ ) {
+		FsmGraph *dup = new FsmGraph( *pristine );
+		doConcat( dup, 0, false );
+	}
+
+	/* The pristine copy itself supplies the last repetition. */
+	doConcat( pristine, 0, false );
+}
+
+void FsmGraph::optionalRepeatOp( int times )
+{
+	/* Must be 1 and up. 0 produces null machine and requires deleting this. */
+	assert( times > 0 );
+
+	/* A repeat of one optional merely allows zero string. */
+	if ( times == 1 ) {
+		setFinState( startState );
+		return;
+	}
+
+	/* Make a machine to make copies from. */
+	FsmGraph *copyFrom = new FsmGraph( *this );
+
+	/* The state set used in the from end of the concatenation. Starts with
+	 * the initial final state set, then after each concatenation, gets set to
+	 * the final states that come from the duplicate. */
+	StateSet lastFinSet( finStateSet );
+
+	/* Set the start state final to allow zero copies. */
+	setFinState( startState );
+
+	/* Concatenate duplicates onto the end up until before the last. */
+	for ( int i = 1; i < times-1; i++ ) {
+		/* Make a duplicate for concating and set the fin bits to graph 2 so we
+		 * can pick out its final states after the optional style concat. */
+		FsmGraph *dup = new FsmGraph( *copyFrom );
+		dup->setFinBits( SB_GRAPH2 );
+		doConcat( dup, &lastFinSet, true );
+
+		/* Clear the last final state set and make the new one by taking only
+		 * the final states that come from graph 2. Uses f, not a second i. */
+		lastFinSet.empty();
+		for ( int f = 0; f < finStateSet.length(); f++ ) {
+			/* If the state came from graph 2, add it to the last set and clear
+			 * the bits. */
+			FsmState *fs = finStateSet[f];
+			if ( fs->stateBits & SB_GRAPH2 ) {
+				lastFinSet.insert( fs );
+				fs->stateBits &= ~SB_GRAPH2;
+			}
+		}
+	}
+
+	/* Now use the copyFrom on the end, no bits set, no bits to clear. */
+	doConcat( copyFrom, &lastFinSet, true );
+}
+
+
+/* Fsm concatenation worker. Supports treating the concatenation as optional,
+ * which essentially leaves the final states of machine one as final. */
+void FsmGraph::doConcat( FsmGraph *other, StateSet *fromStates, bool optional )
+{
+	/* For the merging process. Only used when fromStates is not given. */
+	StateSet finStateSetCopy;
+	MergeData md;
+
+	/* Turn on misfit accounting for both graphs. */
+	setMisfitAccounting( true );
+	other->setMisfitAccounting( true );
+
+	/* Get the other's start state. */
+	FsmState *otherStartState = other->startState;
+
+	/* Unset other's start state before bringing in the entry points. */
+	other->unsetStartState();
+
+	/* Bring in the rest of other's entry points. */
+	copyInEntryPoints( other );
+	other->entryPoints.empty();
+
+	/* Bring in other's states into our state lists. */
+	stateList.append( other->stateList );
+	misfitList.append( other->misfitList );
+
+	/* If from states is not set, then get a copy of our final state set before
+	 * we clobber it and use it instead. */
+	if ( fromStates == 0 ) {
+		finStateSetCopy = finStateSet;
+		fromStates = &finStateSetCopy;
+	}
+
+	/* Unset all of our final states, unless the concatenation is optional,
+	 * and get the final states from other. */
+	if ( !optional )
+		unsetAllFinStates();
+	finStateSet.insert( other->finStateSet );
+	/* Since other's lists are empty, we can delete the fsm without
+	 * affecting any states. */
+	delete other;
+
+	/* Merge our former final states with the start state of other. */
+	for ( int i = 0; i < fromStates->length(); i++ ) {
+		FsmState *state = fromStates->data[i];
+
+		/* Merge the former final state with other's start state. */
+		mergeStatesLeaving( md, state, otherStartState );
+
+		/* If the former final state was not reset final then we must clear
+		 * the state's out trans data. If it got reset final then it gets to
+		 * keep its out trans data. This must be done before fillInStates gets
+		 * called to prevent the data from being sourced. */
+		if ( ! state->isFinState() )
+			clearOutData( state );
+	}
+
+	/* Fill in any new states made from merging. */
+	fillInStates( md );
+
+	/* Remove the misfits and turn off misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+}
+
+/* Concatenates other to the end of this machine. Other is deleted.  Any
+ * transitions made leaving this machine and entering into other are notified
+ * that they are leaving transitions by having the leavingFromState callback
+ * invoked. */
+void FsmGraph::concatOp( FsmGraph *other )
+{
+	/* Plain concatenation: no explicit from states, and not optional. */
+	doConcat( other, 0, false );
+}
+
+
+void FsmGraph::doOr( FsmGraph *other )
+{
+	/* Scratch data for the merge at the end. */
+	MergeData md;
+
+	/* Remember both original start states before they are unset. */
+	StateSet oldStarts;
+	oldStarts.insert( startState );
+	oldStarts.insert( other->startState );
+
+	/* Neither graph keeps its start state. */
+	unsetStartState();
+	other->unsetStartState();
+
+	/* Take over other's remaining entry points. */
+	copyInEntryPoints( other );
+	other->entryPoints.empty();
+
+	/* Move every state of other, misfits included, onto our own lists.
+	 * Nothing is deleted by this. */
+	stateList.append( other->stateList );
+	misfitList.append( other->misfitList );
+
+	/* Take over other's final states as well. */
+	finStateSet.insert(other->finStateSet);
+	other->finStateSet.empty();
+
+	/* With its lists emptied, other can be deleted without affecting
+	 * any of the states it used to hold. */
+	delete other;
+
+	/* A brand-new state becomes the start state of the result. */
+	setStartState( addState() );
+
+	/* Merge the two remembered start states into it. */
+	mergeStates( md, startState, oldStarts.data, oldStarts.length() );
+
+	/* Fill in any states the merge created. */
+	fillInStates( md );
+}
+
+/* Unions other with this machine. Other is deleted. */
+void FsmGraph::unionOp( FsmGraph *other )
+{
+	/* Turn on misfit accounting for both graphs. */
+	setMisfitAccounting( true );
+	other->setMisfitAccounting( true );
+
+	/* doOr() merges the graphs and deletes other; do not use it afterwards. */
+	doOr( other );
+
+	/* Remove the misfits and turn off misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+}
+
+/* Intersects other with this machine. Other is deleted. */
+void FsmGraph::intersectOp( FsmGraph *other )
+{
+	/* Turn on misfit accounting for both graphs. */
+	setMisfitAccounting( true );
+	other->setMisfitAccounting( true );
+
+	/* Tag our final states with SB_GRAPH1 and other's with SB_GRAPH2. */
+	setFinBits( SB_GRAPH1 );
+	other->setFinBits( SB_GRAPH2 );
+
+	/* doOr() merges the graphs and deletes other; do not use it afterwards. */
+	doOr( other );
+
+	/* Unset any final states that are no longer to 
+	 * be final due to final bits. */
+	unsetIncompleteFinals();
+
+	/* Remove the misfits and turn off misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+
+	/* Remove states that have no path to a final state. */
+	removeDeadEndStates();
+}
+
+/* Set subtracts other machine from this machine. Other is deleted. */
+void FsmGraph::subtractOp( FsmGraph *other )
+{
+	/* Turn on misfit accounting for both graphs. */
+	setMisfitAccounting( true );
+	other->setMisfitAccounting( true );
+
+	/* Tag only other's final states, with SB_GRAPH1, to act as killers. */
+	other->setFinBits( SB_GRAPH1 );
+
+	/* doOr() merges the graphs and deletes other; do not use it afterwards. */
+	doOr( other );
+
+	/* Unset any final states that are no longer to 
+	 * be final due to final bits. */
+	unsetKilledFinals();
+
+	/* Remove the misfits and turn off misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+
+	/* Remove states that have no path to a final state. */
+	removeDeadEndStates();
+}
+
+bool FsmGraph::inEptVect( EptVect *eptVect, FsmState *state )
+{
+	/* A vector that was never allocated contains nothing. */
+	if ( eptVect == 0 )
+		return false;
+	/* Linear scan for an element whose target is state. */
+	for ( int pos = 0; pos < eptVect->length(); pos++ )
+		if ( eptVect->data[pos].targ == state )
+			return true;
+	return false;
+}
+
+/* Fill epsilon vectors in a root state from a given starting point. Employs
+ * a depth first search through the graph of epsilon transitions. */
+void FsmGraph::epsilonFillEptVectFrom( FsmState *root, FsmState *from, bool parentLeaving )
+{
+	/* Walk the epsilon transitions out of the state. */
+	for ( EpsilonTrans::Iter ep = from->epsilonTrans; ep.lte(); ep++ ) {
+		/* Find the entry point, if it does not resolve, ignore it. */
+		EntryMapEl *enLow, *enHigh;
+		if ( entryPoints.findMulti( *ep, enLow, enHigh ) ) {
+			/* Loop the targets. */
+			for ( EntryMapEl *en = enLow; en <= enHigh; en++ ) {
+				/* Skip from itself and states already in root's eptVect. */
+				FsmState *targ = en->value;
+				if ( targ != from && !inEptVect(root->eptVect, targ) ) {
+					/* Maybe need to create the eptVect. */
+					if ( root->eptVect == 0 )
+						root->eptVect = new EptVect();
+
+					/* If moving to a different graph or if any parent is
+					 * leaving then we are leaving. */
+					bool leaving = parentLeaving || 
+							root->owningGraph != targ->owningGraph;
+
+					/* All ok, add the target epsilon and recurse. */
+					root->eptVect->append( EptVectEl(targ, leaving) );
+					epsilonFillEptVectFrom( root, targ, leaving );
+				}
+			}
+		}
+	}
+}
+
+void FsmGraph::shadowReadWriteStates( MergeData &md )
+{
+	/* Init isolatedShadow algorithm data. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		st->isolatedShadow = 0;
+
+	/* Any states that may be both read from and written to must 
+	 * be shadowed. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Find such states by looping through the eptVect lists, which give
+		 * us the states that will be read from. May cause us to visit the
+		 * states that we are interested in more than once. */
+		if ( st->eptVect != 0 ) {
+			/* For all states that will be read from. */
+			for ( EptVect::Iter ept = *st->eptVect; ept.lte(); ept++ ) {
+				/* A target with an eptVect of its own is read and written. */
+				FsmState *targ = ept->targ;
+				if ( targ->eptVect != 0 ) {
+					/* State is to be written to, if the shadow is not already
+					 * there, create it. */
+					if ( targ->isolatedShadow == 0 ) {
+						FsmState *shadow = addState();
+						mergeStates( md, shadow, targ );
+						targ->isolatedShadow = shadow;
+					}
+
+					/* Write shadow into the state vector so that it is the
+					 * state that the epsilon transition will read from. */
+					ept->targ = targ->isolatedShadow;
+				}
+			}
+		}
+	}
+}
+
+void FsmGraph::resolveEpsilonTrans( MergeData &md )
+{
+	/* Walk the state list and invoke recursive worker on each state. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		epsilonFillEptVectFrom( st, st, false );
+
+	/* Prevent reading from and writing to the same state. */
+	shadowReadWriteStates( md );
+
+	/* For all states that have epsilon transitions out, draw the transitions,
+	 * clear the epsilon transitions. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Only states that collected epsilon targets have anything to merge. */
+		if ( st->eptVect != 0 ) {
+			/* Merge all the epsilon targets into the state. */
+			for ( EptVect::Iter ept = *st->eptVect; ept.lte(); ept++ ) {
+				if ( ept->leaving )
+					mergeStatesLeaving( md, st, ept->targ );
+				else
+					mergeStates( md, st, ept->targ );
+			}
+
+			/* Clean up the target list. */
+			delete st->eptVect;
+			st->eptVect = 0;
+		}
+
+		/* Clear the epsilon transitions vector. */
+		st->epsilonTrans.empty();
+	}
+}
+
+void FsmGraph::epsilonOp()
+{
+	/* For merging process. */
+	MergeData md;
+
+	setMisfitAccounting( true );
+	/* Every state gets owning graph 0, so no epsilon counts as leaving. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		st->owningGraph = 0;
+
+	/* Perform merges. */
+	resolveEpsilonTrans( md );
+
+	/* Epsilons can cause merges which leave behind unreachable states. */
+	fillInStates( md );
+
+	/* Remove the misfits and turn off misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+}
+
+/* Make a new machine by joining together a bunch of machines without making
+ * any transitions between them. A negative finalId results in there being no
+ * final id. */
+void FsmGraph::joinOp( int startId, int finalId, FsmGraph **others, int numOthers )
+{
+	/* For the merging process. */
+	MergeData md;
+
+	/* Set the owning machines. Start at one. Zero is reserved for the start
+	 * and final states. */
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		st->owningGraph = 1;
+	for ( int m = 0; m < numOthers; m++ ) {
+		for ( StateList::Iter st = others[m]->stateList; st.lte(); st++ )
+			st->owningGraph = 2+m;
+	}
+
+	/* All machines loose start state status. */
+	unsetStartState();
+	for ( int m = 0; m < numOthers; m++ )
+		others[m]->unsetStartState();
+	
+	/* Bring the other machines into this. */
+	for ( int m = 0; m < numOthers; m++ ) {
+		/* Bring in the rest of other's entry points. */
+		copyInEntryPoints( others[m] );
+		others[m]->entryPoints.empty();
+
+		/* Merge the lists. This will move all the states from other into
+		 * this. No states will be deleted. */
+		stateList.append( others[m]->stateList );
+		assert( others[m]->misfitList.length() == 0 );
+
+		/* Move the final set data from other into this. */
+		finStateSet.insert( others[m]->finStateSet );
+		others[m]->finStateSet.empty();
+
+		/* Since other's list is empty, we can delete the fsm without
+		 * affecting any states. */
+		delete others[m];
+	}
+
+	/* Look up the start entry point. */
+	EntryMapEl *enLow = 0, *enHigh = 0;
+	bool findRes = entryPoints.findMulti( startId, enLow, enHigh );
+	if ( ! findRes ) {
+		/* No start state. Set a default one and proceed with the join. Note
+		 * that the result of the join will be a very uninteresting machine. */
+		setStartState( addState() );
+	}
+	else {
+		/* There is at least one start state, create a state that will become
+		 * the new start state. */
+		FsmState *newStart = addState();
+		setStartState( newStart );
+
+		/* The start state is in an owning machine class all it's own. */
+		newStart->owningGraph = 0;
+
+		/* Create the set of states to merge from. */
+		StateSet stateSet;
+		for ( EntryMapEl *en = enLow; en <= enHigh; en++ )
+			stateSet.insert( en->value );
+
+		/* Merge in the set of start states into the new start state. */
+		mergeStates( md, newStart, stateSet.data, stateSet.length() );
+	}
+
+	/* Take a copy of the final state set, before unsetting them all. This
+	 * will allow us to call clearOutData on the states that don't get
+	 * final state status back back. */
+	StateSet finStateSetCopy = finStateSet;
+
+	/* Now all final states are unset. */
+	unsetAllFinStates();
+
+	if ( finalId >= 0 ) {
+		/* Create the implicit final state. */
+		FsmState *finState = addState();
+		setFinState( finState );
+
+		/* Assign an entry into the final state on the final state entry id. Note
+		 * that there may already be an entry on this id. That's ok. Also set the
+		 * final state owning machine id. It's in a class all it's own. */
+		setEntry( finalId, finState );
+		finState->owningGraph = 0;
+	}
+
+	/* Hand over to workers for resolving epsilon trans. This will merge states
+	 * with the targets of their epsilon transitions. */
+	resolveEpsilonTrans( md );
+
+	/* Invoke the relinquish final callback on any states that did not get
+	 * final state status back. */
+	for ( StateSet::Iter st = finStateSetCopy; st.lte(); st++ ) {
+		if ( !((*st)->stateBits & SB_ISFINAL) )
+			clearOutData( *st );
+	}
+
+	/* Fill in any new states made from merging. */
+	fillInStates( md );
+
+	/* Joining can be messy. Instead of having misfit accounting on (which is
+	 * tricky here) do a full cleaning. */
+	removeUnreachableStates();
+}
+
+void FsmGraph::globOp( FsmGraph **others, int numOthers )
+{
+	/* All other machines lose start state status; this machine's is untouched. */
+	for ( int m = 0; m < numOthers; m++ )
+		others[m]->unsetStartState();
+	
+	/* Bring the other machines into this. Nothing is merged or connected here. */
+	for ( int m = 0; m < numOthers; m++ ) {
+		/* Bring in the rest of other's entry points. */
+		copyInEntryPoints( others[m] );
+		others[m]->entryPoints.empty();
+
+		/* Merge the lists. This will move all the states from other into
+		 * this. No states will be deleted. */
+		stateList.append( others[m]->stateList );
+		assert( others[m]->misfitList.length() == 0 );
+
+		/* Move the final set data from other into this. */
+		finStateSet.insert( others[m]->finStateSet );
+		others[m]->finStateSet.empty();
+
+		/* Since other's list is empty, we can delete the fsm without
+		 * affecting any states. The caller's pointer is dangling afterwards. */
+		delete others[m];
+	}
+}
+
+void FsmGraph::deterministicEntry()
+{
+	/* For the merging process. */
+	MergeData md;
+
+	/* States may lose their entry points, turn on misfit accounting. */
+	setMisfitAccounting( true );
+
+	/* Get a copy of the entry map then clear all the entry points. As we
+	 * iterate the old entry map finding duplicates we will add the entry
+	 * points for the new states that we create. */
+	EntryMap prevEntry = entryPoints;
+	unsetAllEntryPoints();
+
+	for ( int enId = 0; enId < prevEntry.length(); ) {
+		/* Count the number of states on this entry key. Entries with the same
+		 * key are adjacent, highId ends one past the last of them. */
+		int highId = enId;
+		while ( highId < prevEntry.length() && prevEntry[enId].key == prevEntry[highId].key )
+			highId += 1;
+
+		int numIds = highId - enId;
+		if ( numIds == 1 ) {
+			/* Only a single entry point, just set the entry. */
+			setEntry( prevEntry[enId].key, prevEntry[enId].value );
+		}
+		else {
+			/* Multiple entry points, need to create a new state and merge in
+			 * all the targets of entry points. */
+			FsmState *newEntry = addState();
+			for ( int en = enId; en < highId; en++ )
+				mergeStates( md, newEntry, prevEntry[en].value );
+
+			/* Add the new state as the single entry point. */
+			setEntry( prevEntry[enId].key, newEntry );
+		}
+
+		enId += numIds;	/* advance to the first entry of the next key */
+	}
+
+	/* States that lost their entry points may now be unreachable. Remove the
+	 * misfits and turn off misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+}
+
+/* Strip final status from final states that carry the SB_GRAPH1 killer bit. */
+void FsmGraph::unsetKilledFinals()
+{
+	/* Walk a copy of the final state set because the set is modified below. */
+	StateSet snapshot( finStateSet );
+
+	for ( StateSet::Iter fs = snapshot; fs.lte(); fs++ ) {
+		FsmState *cur = *fs;
+
+		/* A set killer bit means this state must give up being final. */
+		bool killed = ( cur->stateBits & SB_GRAPH1 ) != 0;
+		if ( killed )
+			unsetFinState( cur );
+
+		/* Clear the killer bit regardless. Non final states should never
+		 * have had it set in the first place. */
+		cur->stateBits &= ~SB_GRAPH1;
+	}
+}
+
+/* Strip final status from final states that carry only one of the two graph
+ * bits (SB_GRAPH1, SB_GRAPH2) instead of both or neither. */
+void FsmGraph::unsetIncompleteFinals()
+{
+	/* Walk a copy of the final state set because the set is modified below. */
+	StateSet snapshot( finStateSet );
+
+	for ( StateSet::Iter fs = snapshot; fs.lte(); fs++ ) {
+		FsmState *cur = *fs;
+
+		/* Some but not all of the bits are set: one state wants the other
+		 * but it is not there. */
+		int wanting = cur->stateBits & SB_BOTH;
+		if ( wanting != 0 && wanting != SB_BOTH )
+			unsetFinState( cur );
+
+		/* Clear the wanting bits regardless. Non final states should never
+		 * have had them set in the first place. */
+		cur->stateBits &= ~SB_BOTH;
+	}
+}
+
+/* Ensure that the start state is free of entry points (aside from the fact
+ * that it is the start state). If the start state has entry points then make a
+ * new start state by merging with the old one. Useful before modifying start
+ * transitions. If the existing start state has any entry points other than the
+ * start state entry then modifying its transitions changes more than the start
+ * transitions. So isolate the start state by separating it out such that it
+ * only has start stateness as its entry point. */
+void FsmGraph::isolateStartState( )
+{
+	/* For the merging process. */
+	MergeData md;
+
+	/* Bail out if the start state is already isolated. */
+	if ( isStartStateIsolated() )
+		return;
+
+	/* Turn on misfit accounting to possibly catch the old start state. */
+	setMisfitAccounting( true );
+
+	/* This will be the new start state. The existing start
+	 * state is merged with it. */
+	FsmState *prevStartState = startState;
+	unsetStartState();
+	setStartState( addState() );
+
+	/* Merge the old start state into the new one to isolate it. */
+	mergeStates( md, startState, prevStartState );
+
+	/* The stfill list and stateDict will be empty because the merging of the
+	 * old start state into the new one will not have any conflicting transitions. */
+	assert( md.stateDict.treeSize == 0 );
+	assert( md.stfillHead == 0 );
+
+	/* The old start state may be unreachable. Remove the misfits and turn off
+	 * misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+}
+
+#ifdef COLM_LOG_CONDS
+void logCondSpace( CondSpace *condSpace )
+{
+	if ( condSpace == 0 ) {
+		cerr << "<empty>";	/* no condition space at all */
+		return;
+	}
+	for ( CondSet::Iter it = condSpace->condSet.last(); it.gtb(); it-- ) {	/* last to first */
+		if ( ! it.last() )
+			cerr << ',';
+		(*it)->actionName( cerr );
+	}
+}
+
+void logNewExpansion( Expansion *exp )
+{
+	cerr << "created expansion:" << endl;	/* debug dump, COLM_LOG_CONDS builds only */
+	cerr << "  range: " << exp->lowKey.getVal() << " .. " << 
+			exp->highKey.getVal() << endl;
+
+	cerr << "  fromCondSpace: ";	/* prints "<empty>" when the pointer is null */
+	logCondSpace( exp->fromCondSpace );
+	cerr << endl;
+	cerr << "  fromVals: " << exp->fromVals << endl;
+
+	cerr << "  toCondSpace: ";
+	logCondSpace( exp->toCondSpace );
+	cerr << endl;
+	cerr << "  toValsList: ";	/* one space-prefixed value per list entry */
+	for ( LongVect::Iter to = exp->toValsList; to.lte(); to++ )
+		cerr << " " << *to;
+	cerr << endl;
+}
+#endif
+
+
+void FsmGraph::findTransExpansions( ExpansionList &expansionList, 
+		FsmState *destState, FsmState *srcState )
+{
+	PairIter<FsmTrans, StateCond> transCond( destState->outList.head,
+			srcState->stateCondList.head );	/* s1: dest transitions, s2: src conditions */
+	for ( ; !transCond.end(); transCond++ ) {
+		if ( transCond.userState == RangeOverlap ) {	/* dest transition under a src condition */
+			Expansion *expansion = new Expansion( transCond.s1Tel.lowKey, 
+					transCond.s1Tel.highKey );
+			expansion->fromTrans = new FsmTrans(*transCond.s1Tel.trans);	/* private copy, reused by doExpand */
+			expansion->fromTrans->fromState = 0;
+			expansion->fromTrans->toState = transCond.s1Tel.trans->toState;
+			expansion->fromCondSpace = 0;	/* expanding from outside any condition space */
+			expansion->fromVals = 0;
+			CondSpace *srcCS = transCond.s2Tel.trans->condSpace;
+			expansion->toCondSpace = srcCS;
+			/* Expand to every combination of values of the src conditions. */
+			long numTargVals = (1 << srcCS->condSet.length());
+			for ( long targVals = 0; targVals < numTargVals; targVals++ )
+				expansion->toValsList.append( targVals );
+
+			#ifdef COLM_LOG_CONDS
+			logNewExpansion( expansion );
+			#endif
+			expansionList.append( expansion );
+		}
+	}
+}
+
+void FsmGraph::findCondExpInTrans( ExpansionList &expansionList, FsmState *state, 
+		Key lowKey, Key highKey, CondSpace *fromCondSpace, CondSpace *toCondSpace,
+		long fromVals, LongVect &toValsList )
+{
+	FsmTrans searchTrans;	/* local probe: lowKey..highKey mapped into fromCondSpace at fromVals */
+	searchTrans.lowKey = fromCondSpace->baseKey + fromVals * keyOps->alphSize() + 
+			(lowKey - keyOps->minKey);
+	searchTrans.highKey = fromCondSpace->baseKey + fromVals * keyOps->alphSize() + 
+			(highKey - keyOps->minKey);
+	searchTrans.prev = searchTrans.next = 0;	/* the probe is a list of one */
+
+	PairIter<FsmTrans> pairIter( state->outList.head, &searchTrans );
+	for ( ; !pairIter.end(); pairIter++ ) {
+		if ( pairIter.userState == RangeOverlap ) {	/* state has a transition inside the probe range */
+			Expansion *expansion = new Expansion( lowKey, highKey );
+			expansion->fromTrans = new FsmTrans(*pairIter.s1Tel.trans);	/* private copy, reused by doExpand */
+			expansion->fromTrans->fromState = 0;
+			expansion->fromTrans->toState = pairIter.s1Tel.trans->toState;
+			expansion->fromCondSpace = fromCondSpace;
+			expansion->fromVals = fromVals;
+			expansion->toCondSpace = toCondSpace;
+			expansion->toValsList = toValsList;
+
+			expansionList.append( expansion );
+			#ifdef COLM_LOG_CONDS
+			logNewExpansion( expansion );
+			#endif
+		}
+	}
+}
+
+void FsmGraph::findCondExpansions( ExpansionList &expansionList, 
+		FsmState *destState, FsmState *srcState )
+{
+	PairIter<StateCond, StateCond> condCond( destState->stateCondList.head,
+			srcState->stateCondList.head );
+	for ( ; !condCond.end(); condCond++ ) {
+		if ( condCond.userState == RangeOverlap ) {
+			/* The conditions dest already has on this range. */
+			CondSet &destCS = condCond.s1Tel.trans->condSpace->condSet;
+			long destLen = destCS.length();
+
+			/* Find the items in src cond set that are not in dest
+			 * cond set. These are the items that we must expand. */
+			CondSet srcOnlyCS = condCond.s2Tel.trans->condSpace->condSet;
+			for ( CondSet::Iter dcsi = destCS; dcsi.lte(); dcsi++ )
+				srcOnlyCS.remove( *dcsi );
+			long srcOnlyLen = srcOnlyCS.length();
+
+			if ( srcOnlyCS.length() > 0 ) {
+				#ifdef COLM_LOG_CONDS
+				cerr << "there are " << srcOnlyCS.length() << " item(s) that are "
+							"only in the srcCS" << endl;
+				#endif
+
+				CondSet mergedCS = destCS;
+				mergedCS.insert( condCond.s2Tel.trans->condSpace->condSet );
+
+				CondSpace *fromCondSpace = addCondSpace( destCS );
+				CondSpace *toCondSpace = addCondSpace( mergedCS );
+
+				/* Loop all values in the dest space. */
+				for ( long destVals = 0; destVals < (1 << destLen); destVals++ ) {
+					long basicVals = 0;	/* destVals re-expressed with merged set bit positions */
+					for ( CondSet::Iter csi = destCS; csi.lte(); csi++ ) {
+						if ( destVals & (1 << csi.pos()) ) {
+							Action **cim = mergedCS.find( *csi );
+							long bitPos = (cim - mergedCS.data);	/* index of the condition in the merged set */
+							basicVals |= 1 << bitPos;
+						}
+					}
+
+					/* Loop all new values: every combination of the src-only conditions. */
+					LongVect expandToVals;
+					for ( long soVals = 0; soVals < (1 << srcOnlyLen); soVals++ ) {
+						long targVals = basicVals;
+						for ( CondSet::Iter csi = srcOnlyCS; csi.lte(); csi++ ) {
+							if ( soVals & (1 << csi.pos()) ) {
+								Action **cim = mergedCS.find( *csi );
+								long bitPos = (cim - mergedCS.data);
+								targVals |= 1 << bitPos;
+							}
+						}
+						expandToVals.append( targVals );
+					}
+
+					findCondExpInTrans( expansionList, destState, 
+							condCond.s1Tel.lowKey, condCond.s1Tel.highKey, 
+							fromCondSpace, toCondSpace, destVals, expandToVals );
+				}
+			}
+		}
+	}
+}
+
+void FsmGraph::doExpand( MergeData &md, FsmState *destState, ExpansionList &expList1 )
+{
+	for ( ExpansionList::Iter exp = expList1; exp.lte(); exp++ ) {
+		for ( LongVect::Iter to = exp->toValsList; to.lte(); to++ ) {
+			long targVals = *to;
+
+			/* We will use the copy of the transition that was made when the
+			 * expansion was created. It will get used multiple times. Each
+			 * time we must set up the keys, everything else is constant and
+			 * already prepared. */
+			FsmTrans *srcTrans = exp->fromTrans;
+			/* Place the range in the target condition space at value targVals. */
+			srcTrans->lowKey = exp->toCondSpace->baseKey +
+					targVals * keyOps->alphSize() + (exp->lowKey - keyOps->minKey);
+			srcTrans->highKey = exp->toCondSpace->baseKey +
+					targVals * keyOps->alphSize() + (exp->highKey - keyOps->minKey);
+			/* Copy into dest by way of a temporary one element list. */
+			TransList srcList;
+			srcList.append( srcTrans );
+			outTransCopy( md, destState, srcList.head );
+			srcList.abandon();	/* presumably releases srcTrans without deleting it; it is reused above */
+		}
+	}
+}
+
+
+void FsmGraph::doRemove( MergeData &md, FsmState *destState, ExpansionList &expList1 )
+{
+	for ( ExpansionList::Iter exp = expList1; exp.lte(); exp++ ) {
+		Removal removal;	/* the key range this expansion was made from */
+		if ( exp->fromCondSpace == 0 ) {
+			removal.lowKey = exp->lowKey;
+			removal.highKey = exp->highKey;
+		}
+		else {
+			removal.lowKey = exp->fromCondSpace->baseKey + 
+				exp->fromVals * keyOps->alphSize() + (exp->lowKey - keyOps->minKey);
+			removal.highKey = exp->fromCondSpace->baseKey + 
+				exp->fromVals * keyOps->alphSize() + (exp->highKey - keyOps->minKey);
+		}
+		removal.next = 0;	/* the removal is a list of one */
+
+		TransList destList;	/* collects the transitions that survive */
+		PairIter<FsmTrans, Removal> pairIter( destState->outList.head, &removal );
+		for ( ; !pairIter.end(); pairIter++ ) {
+			switch ( pairIter.userState ) {
+			case RangeInS1: {	/* outside the removal: keep, using the split keys */
+				FsmTrans *destTrans = pairIter.s1Tel.trans;
+				destTrans->lowKey = pairIter.s1Tel.lowKey;
+				destTrans->highKey = pairIter.s1Tel.highKey;
+				destList.append( destTrans );
+				break;
+			}
+			case RangeInS2:	/* removal range with no dest transition: nothing to do */
+				break;
+			case RangeOverlap: {	/* inside the removal: unhook and free */
+				FsmTrans *trans = pairIter.s1Tel.trans;
+				detachTrans( trans->fromState, trans->toState, trans );
+				delete trans;
+				break;
+			}
+			case BreakS1: {	/* dest transition is being split: carry on with a duplicate */
+				pairIter.s1Tel.trans = dupTrans( destState, 
+						pairIter.s1Tel.trans );
+				break;
+			}
+			case BreakS2:
+				break;
+			}
+		}
+		destState->outList.transfer( destList );	/* presumably takes over destList's elements -- confirm */
+	}
+}
+
+void FsmGraph::mergeStateConds( FsmState *destState, FsmState *srcState )
+{
+	StateCondList destList;	/* the merged list, built up range by range */
+	PairIter<StateCond> pairIter( destState->stateCondList.head,
+			srcState->stateCondList.head );
+	for ( ; !pairIter.end(); pairIter++ ) {
+		switch ( pairIter.userState ) {
+		case RangeInS1: {	/* only dest has conditions here: keep dest's element */
+			StateCond *destCond = pairIter.s1Tel.trans;
+			destCond->lowKey = pairIter.s1Tel.lowKey;
+			destCond->highKey = pairIter.s1Tel.highKey;
+			destList.append( destCond );
+			break;
+		}
+		case RangeInS2: {	/* only src has conditions here: dest gets its own copy */
+			StateCond *newCond = new StateCond( *pairIter.s2Tel.trans );
+			newCond->lowKey = pairIter.s2Tel.lowKey;
+			newCond->highKey = pairIter.s2Tel.highKey;
+			destList.append( newCond );
+			break;
+		}
+		case RangeOverlap: {	/* both have conditions: dest moves to the union cond space */
+			StateCond *destCond = pairIter.s1Tel.trans;
+			StateCond *srcCond = pairIter.s2Tel.trans;
+			CondSet mergedCondSet;
+			mergedCondSet.insert( destCond->condSpace->condSet );
+			mergedCondSet.insert( srcCond->condSpace->condSet );
+			destCond->condSpace = addCondSpace( mergedCondSet );
+
+			destCond->lowKey = pairIter.s1Tel.lowKey;
+			destCond->highKey = pairIter.s1Tel.highKey;
+			destList.append( destCond );
+			break;
+		}
+		case BreakS1:	/* dest element is being split: carry on with a copy */
+			pairIter.s1Tel.trans = new StateCond( *pairIter.s1Tel.trans );
+			break;
+
+		case BreakS2:
+			break;
+		}
+	}
+	destState->stateCondList.transfer( destList );	/* presumably takes over destList's elements -- confirm */
+}
+
+/* A state merge which represents the drawing in of leaving transitions.  If
+ * destState has any out data then we duplicate the source state, transfer the
+ * out data, then merge in the duplicate. The new state will be reaped because
+ * it will not be given any in transitions. */
+void FsmGraph::mergeStatesLeaving( MergeData &md, FsmState *destState, FsmState *srcState )
+{
+	if ( !hasOutData( destState ) )
+		mergeStates( md, destState, srcState );	/* no out data: a plain merge will do */
+	else {
+		FsmState *ssMutable = addState();	/* scratch duplicate of srcState */
+		mergeStates( md, ssMutable, srcState );
+		transferOutData( ssMutable, destState );
+
+		for ( ActionSet::Iter cond = destState->outCondSet; cond.lte(); cond++ )
+			embedCondition( md, ssMutable, *cond );	/* dest's out conditions go onto the duplicate */
+
+		mergeStates( md, destState, ssMutable );
+	}
+}
+
+void FsmGraph::mergeStates( MergeData &md, FsmState *destState, 
+		FsmState **srcStates, int numSrc )
+{
+	for ( FsmState **src = srcStates; src < srcStates + numSrc; src++ )
+		mergeStates( md, destState, *src );	/* one source at a time, in array order */
+}
+
+void FsmGraph::mergeStates( MergeData &md, FsmState *destState, FsmState *srcState )
+{
+	ExpansionList expList1;	/* dest transitions to expand because of src's conditions */
+	ExpansionList expList2;	/* src transitions to expand because of dest's conditions */
+	/* Find the expansions in both directions before the states are changed. */
+	findTransExpansions( expList1, destState, srcState );
+	findCondExpansions( expList1, destState, srcState );
+	findTransExpansions( expList2, srcState, destState );
+	findCondExpansions( expList2, srcState, destState );
+
+	mergeStateConds( destState, srcState );
+	
+	outTransCopy( md, destState, srcState->outList.head );
+	/* Both sets of expanded transitions are drawn into destState. */
+	doExpand( md, destState, expList1 );
+	doExpand( md, destState, expList2 );
+	/* Then the ranges they were expanded from are removed from destState. */
+	doRemove( md, destState, expList1 );
+	doRemove( md, destState, expList2 );
+
+	expList1.empty();
+	expList2.empty();
+
+	/* Get its bits and final state status. The final bit itself is not
+	 * copied, final status goes through setFinState. */
+	destState->stateBits |= ( srcState->stateBits & ~SB_ISFINAL );
+	if ( srcState->isFinState() )
+		setFinState( destState );
+
+	/* Draw in any properties of srcState into destState. */
+	if ( srcState == destState ) {
+		/* Duplicate the list to protect against write to source. The
+		 * priorities sets are not copied in because that would have no
+		 * effect. */
+		destState->epsilonTrans.append( EpsilonTrans( srcState->epsilonTrans ) );
+
+		/* Get all actions, duplicating to protect against write to source. */
+		destState->toStateActionTable.setActions( 
+				ActionTable( srcState->toStateActionTable ) );
+		destState->fromStateActionTable.setActions( 
+				ActionTable( srcState->fromStateActionTable ) );
+		destState->outActionTable.setActions( ActionTable( srcState->outActionTable ) );
+		destState->outCondSet.insert( ActionSet( srcState->outCondSet ) );
+		destState->errActionTable.setActions( ErrActionTable( srcState->errActionTable ) );
+		destState->eofActionTable.setActions( ActionTable( srcState->eofActionTable ) );
+	}
+	else {
+		/* Get the epsilons, out priorities. */
+		destState->epsilonTrans.append( srcState->epsilonTrans );
+		destState->outPriorTable.setPriors( srcState->outPriorTable );
+
+		/* Get all actions. */
+		destState->toStateActionTable.setActions( srcState->toStateActionTable );
+		destState->fromStateActionTable.setActions( srcState->fromStateActionTable );
+		destState->outActionTable.setActions( srcState->outActionTable );
+		destState->outCondSet.insert( srcState->outCondSet );
+		destState->errActionTable.setActions( srcState->errActionTable );
+		destState->eofActionTable.setActions( srcState->eofActionTable );
+	}
+}
+
+void FsmGraph::fillInStates( MergeData &md )
+{
+	FsmState *fill;
+
+	/* First pass over the stfill list: merge into each listed state the
+	 * set of states recorded in its state dict element. This will likely
+	 * cause other states to be added to the list, so the next pointer is
+	 * only read once the merge has completed. */
+	for ( fill = md.stfillHead; fill != 0; fill = fill->alg.next ) {
+		StateSet *pending = &fill->stateDictEl->stateSet;
+		mergeStates( md, fill, pending->data, pending->length() );
+	}
+
+	/* Second pass, again from the head: every state on the fill list
+	 * gives up its state set. */
+	for ( fill = md.stfillHead; fill != 0; fill = fill->alg.next ) {
+		/* Delete and reset the state dict element. */
+		delete fill->stateDictEl;
+		fill->stateDictEl = 0;
+	}
+
+	/* StateDict will still have its ptrs/size set but all of its elements
+	 * will be deleted so we don't need to clean it up. Neither the dict
+	 * nor the fill list head in md is reset here. */
+}
+
+void FsmGraph::findEmbedExpansions( ExpansionList &expansionList, 
+		FsmState *destState, Action *condAction )
+{
+	StateCondList destList;	/* the state's new condition list, built range by range */
+	PairIter<FsmTrans, StateCond> transCond( destState->outList.head,
+			destState->stateCondList.head );	/* the state's transitions against its own conditions */
+	for ( ; !transCond.end(); transCond++ ) {
+		switch ( transCond.userState ) {
+			case RangeInS1: {
+				if ( transCond.s1Tel.lowKey <= keyOps->maxKey ) {	/* transitions above maxKey are skipped */
+					assert( transCond.s1Tel.highKey <= keyOps->maxKey );
+
+					/* Make a new state cond holding only the new condition. */
+					StateCond *newStateCond = new StateCond( transCond.s1Tel.lowKey,
+							transCond.s1Tel.highKey );
+					newStateCond->condSpace = addCondSpace( CondSet( condAction ) );
+					destList.append( newStateCond );
+
+					/* Create the expansion. */
+					Expansion *expansion = new Expansion( transCond.s1Tel.lowKey,
+							transCond.s1Tel.highKey );
+					expansion->fromTrans = new FsmTrans(*transCond.s1Tel.trans);
+					expansion->fromTrans->fromState = 0;
+					expansion->fromTrans->toState = transCond.s1Tel.trans->toState;
+					expansion->fromCondSpace = 0;
+					expansion->fromVals = 0;
+					expansion->toCondSpace = newStateCond->condSpace;
+					expansion->toValsList.append( 1 );	/* only the value with the single condition bit set */
+					#ifdef COLM_LOG_CONDS
+					logNewExpansion( expansion );
+					#endif
+					expansionList.append( expansion );
+				}
+				break;
+			}
+			case RangeInS2: {
+				/* Enhance state cond and find the expansion. */
+				StateCond *stateCond = transCond.s2Tel.trans;
+				stateCond->lowKey = transCond.s2Tel.lowKey;
+				stateCond->highKey = transCond.s2Tel.highKey;
+
+				CondSet &destCS = stateCond->condSpace->condSet;	/* still refers to the old space's set below */
+				long destLen = destCS.length();
+				CondSpace *fromCondSpace = stateCond->condSpace;
+
+				CondSet mergedCS = destCS;
+				mergedCS.insert( condAction );
+				CondSpace *toCondSpace = addCondSpace( mergedCS );
+				stateCond->condSpace = toCondSpace;
+				destList.append( stateCond );
+
+				/* Loop all values in the dest space. */
+				for ( long destVals = 0; destVals < (1 << destLen); destVals++ ) {
+					long basicVals = 0;	/* destVals re-expressed with merged set bit positions */
+					for ( CondSet::Iter csi = destCS; csi.lte(); csi++ ) {
+						if ( destVals & (1 << csi.pos()) ) {
+							Action **cim = mergedCS.find( *csi );
+							long bitPos = (cim - mergedCS.data);
+							basicVals |= 1 << bitPos;
+						}
+					}
+
+					long targVals = basicVals;	/* same values plus the new condition's bit */
+					Action **cim = mergedCS.find( condAction );
+					long bitPos = (cim - mergedCS.data);
+					targVals |= 1 << bitPos;
+					
+					LongVect expandToVals( targVals );
+					findCondExpInTrans( expansionList, destState, 
+						transCond.s2Tel.lowKey, transCond.s2Tel.highKey, 
+						fromCondSpace, toCondSpace, destVals, expandToVals );
+				}
+				break;
+			}
+
+
+			case RangeOverlap:	/* the three remaining pair states are not expected here */
+			case BreakS1:
+			case BreakS2:
+				assert( false );
+				break;
+		}
+	}
+
+	destState->stateCondList.transfer( destList );
+}
+
+void FsmGraph::embedCondition( FsmState *state, Action *condAction )
+{
+	/* For the merging process. The worker keeps its own expansion list, so
+	 * none is needed here. */
+	MergeData md;
+
+	/* Turn on misfit accounting for the duration of the embedding. */
+	setMisfitAccounting( true );
+
+	/* Worker: expand the state's transitions onto the condition. */
+	embedCondition( md, state, condAction );
+
+	/* Fill in any states that were newed up as combinations of others. */
+	fillInStates( md );
+
+	/* Remove the misfits and turn off misfit accounting. */
+	removeMisfits();
+	setMisfitAccounting( false );
+}
+
+void FsmGraph::embedCondition( MergeData &md, FsmState *state, Action *condAction )
+{
+	ExpansionList embedExps;	/* expansions required by the new condition */
+	findEmbedExpansions( embedExps, state, condAction );
+	/* Draw in the expanded transitions first, then drop the ranges they replace. */
+	doExpand( md, state, embedExps );
+	doRemove( md, state, embedExps );
+	embedExps.empty();
+}
diff --git a/colm/fsmgraph.h b/colm/fsmgraph.h
new file mode 100644
index 00000000..9c002077
--- /dev/null
+++ b/colm/fsmgraph.h
@@ -0,0 +1,1392 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _FSMGRAPH_H
+#define _FSMGRAPH_H
+
+#include <assert.h>
+#include "common.h"
+#include "vector.h"
+#include "bstset.h"
+#include "compare.h"
+#include "avltree.h"
+#include "dlist.h"
+#include "bstmap.h"
+#include "sbstmap.h"
+#include "sbstset.h"
+#include "sbsttable.h"
+#include "avlset.h"
+#include "avlmap.h"
+
+/* Flags that control merging. */
+#define SB_GRAPH1     0x01
+#define SB_GRAPH2     0x02
+#define SB_BOTH       0x03
+#define SB_ISFINAL    0x04
+#define SB_ISMARKED   0x08
+#define SB_ONLIST     0x10
+
+struct FsmTrans;
+struct FsmState;
+struct FsmGraph;
+struct Action;
+struct TokenDef;
+struct NameInst;
+
+/* State list element for unambiguous access to list element. */
+struct FsmListEl 
+{
+	FsmState *prev, *next;	/* links to the neighbouring states in the list */
+};
+
+/* This is the marked index for a state pair. Used in minimization. It keeps
+ * track of whether or not the state pair is marked. */
+struct MarkIndex
+{
+	MarkIndex(int states);	/* states: presumably the number of states to index -- confirm */
+	~MarkIndex();
+
+	void markPair(int state1, int state2);
+	bool isPairMarked(int state1, int state2);
+
+private:
+	int numStates;
+	bool *array;	/* NOTE(review): raw pointer plus destructor, no copy control declared here -- confirm copies are never made */
+};
+
+extern KeyOps *keyOps;
+
+/* Transition Action Element. */
+typedef SBstMapEl< int, Action* > ActionTableEl;
+
+/* Transition Action Table. Maps an int ordering to an Action pointer. */
+struct ActionTable 
+	: public SBstMap< int, Action*, CmpOrd<int> >
+{
+	void setAction( int ordering, Action *action );
+	void setActions( int *orderings, Action **actions, int nActs );	/* parallel arrays of nActs entries, going by the signature */
+	void setActions( const ActionTable &other );
+
+	bool hasAction( Action *action );
+};
+
+typedef SBstSet< Action*, CmpOrd<Action*> > ActionSet;
+typedef CmpSTable< Action*, CmpOrd<Action*> > CmpActionSet;
+
+/* Transition Lm Action Element. */
+typedef SBstMapEl< int, TokenDef* > LmActionTableEl;
+
+/* Transition Lm Action Table. Maps an int ordering to a TokenDef pointer. */
+struct LmActionTable 
+	: public SBstMap< int, TokenDef*, CmpOrd<int> >
+{
+	void setAction( int ordering, TokenDef *action );
+	void setActions( const LmActionTable &other );
+};
+
+/* Three-way compare of whole action table elements: key first, then value. */
+struct CmpActionTableEl
+{
+	static int compare( const ActionTableEl &action1, 
+			const ActionTableEl &action2 )
+	{
+		/* The ordering keys are compared first. */
+		int byKey = ( action1.key > action2.key ) - ( action1.key < action2.key );
+		if ( byKey != 0 )
+			return byKey;
+
+		/* Equal keys: fall back to comparing the action pointers. */
+		if ( action1.value < action2.value )
+			return -1;
+		return action1.value > action2.value ? 1 : 0;
+	}
+};
+
+/* Compare for ActionTable. */
+typedef CmpSTable< ActionTableEl, CmpActionTableEl > CmpActionTable;
+
+/* Three-way compare of whole lm action table elements: key first, then value. */
+struct CmpLmActionTableEl
+{
+	static int compare( const LmActionTableEl &lmAction1, 
+			const LmActionTableEl &lmAction2 )
+	{
+		/* The ordering keys are compared first. */
+		int byKey = ( lmAction1.key > lmAction2.key ) - ( lmAction1.key < lmAction2.key );
+		if ( byKey != 0 )
+			return byKey;
+
+		/* Equal keys: fall back to comparing the token def pointers. */
+		if ( lmAction1.value < lmAction2.value )
+			return -1;
+		return lmAction1.value > lmAction2.value ? 1 : 0;
+	}
+};
+
+/* Compare for LmActionTable. */
+typedef CmpSTable< LmActionTableEl, CmpLmActionTableEl > CmpLmActionTable;
+
+/* Action table element for error action tables. Adds the encoding of transfer
+ * point. */
+struct ErrActionTableEl
+{
+	ErrActionTableEl( Action *action, int ordering, int transferPoint )
+		: ordering(ordering), action(action), transferPoint(transferPoint) { }
+
+	/* Ordering and id of the action embedding. */
+	int ordering;
+	Action *action;
+
+	/* Id of point of transfer from Error action table to transitions and
+	 * eofActionTable. */
+	int transferPoint;
+
+	int getKey() const { return ordering; }	/* the element's key is its ordering */
+};
+
+struct ErrActionTable	/* table of ErrActionTableEl with int keys compared by CmpOrd<int> */
+	: public SBstTable< ErrActionTableEl, int, CmpOrd<int> >
+{
+	void setAction( int ordering, Action *action, int transferPoint );
+	void setActions( const ErrActionTable &other );
+};
+
+/* Compare of an error action table element (key & value). */
+struct CmpErrActionTableEl
+{
+	static int compare( const ErrActionTableEl &action1, 
+			const ErrActionTableEl &action2 )
+	{
+		if ( action1.ordering < action2.ordering )
+			return -1;
+		else if ( action1.ordering > action2.ordering )
+			return 1;
+		else if ( action1.action < action2.action )
+			return -1;
+		else if ( action1.action > action2.action )
+			return 1;
+		else if ( action1.transferPoint < action2.transferPoint )
+			return -1;
+		else if ( action1.transferPoint > action2.transferPoint )
+			return 1;
+		return 0;
+	}
+};
+
+/* Compare for ErrActionTable. */
+typedef CmpSTable< ErrActionTableEl, CmpErrActionTableEl > CmpErrActionTable;
+
+
+/* Describe a priority, shared among PriorEls. 
+ * Holds the priority's key and its value. */
+struct PriorDesc
+{
+	int key;
+	int priority;
+};
+
+/* Element in the arrays of priorities for transitions and states. Ordering is
+ * unique among instantiations of machines, desc is shared. */
+struct PriorEl
+{
+	PriorEl( int ordering, PriorDesc *desc ) 
+		: ordering(ordering), desc(desc) { }
+
+	int ordering;
+	PriorDesc *desc;	/* shared descriptor; nothing in this struct deletes it */
+};
+
+/* Three-way compare of priority elements by the key of their priority
+ * descriptor. */
+struct PriorElCmp
+{
+	static inline int compare( const PriorEl &pel1, const PriorEl &pel2 ) 
+	{
+		/* Only the descriptor keys take part, the orderings are ignored. */
+		int key1 = pel1.desc->key;
+		int key2 = pel2.desc->key;
+		if ( key1 == key2 )
+			return 0;
+		return key1 < key2 ? -1 : 1;
+	}
+};
+
+
+/* Priority Table. A set of PriorEl ordered by descriptor key (PriorElCmp). */
+struct PriorTable 
+	: public SBstSet< PriorEl, PriorElCmp >
+{
+	void setPrior( int ordering, PriorDesc *desc );
+	void setPriors( const PriorTable &other );
+};
+
+/* Compare of prior table elements for distinguishing state data. */
+struct CmpPriorEl
+{
+	static inline int compare( const PriorEl &pel1, const PriorEl &pel2 )
+	{
+		/* Descriptors are compared by address, not by what they hold. */
+		if ( pel1.desc < pel2.desc )
+			return -1;
+		if ( pel1.desc > pel2.desc )
+			return 1;
+
+		/* Same descriptor: the ordering decides. */
+		return ( pel1.ordering > pel2.ordering ) -
+				( pel1.ordering < pel2.ordering );
+	}
+};
+
+/* Compare of PriorTable distinguishing state data. Using a compare of the
+ * pointers is a little more strict than it needs be. It requires that
+ * priority tables have the exact same set of priority assignment operators
+ * (from the input lang) to be considered equal.
+ *
+ * Really only key-value pairs need be tested and ordering be merged. However
+ * this would require that in the fusing of states, priority descriptors be
+ * chosen for the new fused state based on priority. Since the out transition
+ * lists and ranges aren't necessarily going to line up, this is more work for
+ * little gain. Final compression resets all priorities first, so this would
+ * only be useful for compression at every operator, which is only an
+ * undocumented test feature.
+ */
+typedef CmpSTable<PriorEl, CmpPriorEl> CmpPriorTable;
+
+/* Plain action list that imposes no ordering. */
+typedef Vector<int> TransFuncList;
+
+/* Comparison for TransFuncList. */
+typedef CmpTable< int, CmpOrd<int> > TransFuncListCompare;
+
+/* Transition class that implements actions and priorities. */
+struct FsmTrans 
+{
+	FsmTrans() : fromState(0), toState(0) {}
+	FsmTrans( const FsmTrans &other ) : /* Copies the keys, actionTable and priorTable only. */
+		lowKey(other.lowKey),
+		highKey(other.highKey),
+		fromState(0), toState(0), /* The copy starts with null endpoints. */
+		actionTable(other.actionTable),
+		priorTable(other.priorTable)
+	{ /* lmActionTable is not copied; the source's is asserted to be empty. */
+		assert( lmActionTable.length() == 0 && other.lmActionTable.length() == 0 );
+	}
+
+	Key lowKey, highKey;
+	FsmState *fromState;
+	FsmState *toState;
+
+	/* Pointers for outlist. Not initialized by the constructors. */
+	FsmTrans *prev, *next;
+
+	/* Pointers for in-list. Not initialized by the constructors. */
+	FsmTrans *ilprev, *ilnext;
+
+	/* The action table and priority table for the transition. */
+	ActionTable actionTable;
+	PriorTable priorTable;
+
+	LmActionTable lmActionTable;
+};
+
+/* In transition list. Like DList except only has a head pointer, which is all
+ * that is required. Insertion and deletion are handled by the graph. This
+ * class provides the iterator of a single list. */
+struct TransInList
+{
+	TransInList() : head(0) { }
+
+	FsmTrans *head;
+
+	struct Iter
+	{
+		/* Default construct. */
+		Iter() : ptr(0) { }
+
+		/* Construct, assign from a list. */
+		Iter( const TransInList &il )  : ptr(il.head) { }
+		Iter &operator=( const TransInList &dl ) { ptr = dl.head; return *this; }
+
+		/* lte() is true while on an element, end() is true once ptr is null. */
+		bool lte() const    { return ptr != 0; }
+		bool end() const    { return ptr == 0; }
+
+		/* At the first, last element. */
+		bool first() const { return ptr && ptr->ilprev == 0; }
+		bool last() const  { return ptr && ptr->ilnext == 0; }
+
+		/* Cast, dereference, arrow ops. */
+		operator FsmTrans*() const   { return ptr; }
+		FsmTrans &operator *() const { return *ptr; }
+		FsmTrans *operator->() const { return ptr; }
+
+		/* Postfix increment, decrement along ilnext, ilprev. No null check on ptr. */
+		inline void operator++(int)   { ptr = ptr->ilnext; }
+		inline void operator--(int)   { ptr = ptr->ilprev; }
+
+		/* The iterator is simply a pointer. */
+		FsmTrans *ptr;
+	};
+};
+
+typedef DList<FsmTrans> TransList;
+
+/* Set of states, list of states. */
+typedef BstSet<FsmState*> StateSet;
+typedef DList<FsmState> StateList;
+
+/* An element in a state dict: a set of states (the key) and its target state. */
+struct StateDictEl 
+:
+	public AvlTreeEl<StateDictEl>
+{
+	StateDictEl(const StateSet &stateSet) 
+		: stateSet(stateSet), targState(0) { } /* targState is null until assigned. */
+
+	const StateSet &getKey() { return stateSet; }
+	StateSet stateSet;
+	FsmState *targState;
+};
+
+/* Dictionary mapping a set of states to a target state. */
+typedef AvlTree< StateDictEl, StateSet, CmpTable<FsmState*> > StateDict;
+
+/* Data needed for a merge operation. */
+struct MergeData
+{
+	MergeData() 
+		: stfillHead(0), stfillTail(0) { }
+
+	StateDict stateDict;
+
+	FsmState *stfillHead;
+	FsmState *stfillTail;
+
+	void fillListAppend( FsmState *state );
+};
+
+struct TransEl
+{
+	/* Constructors. value is null unless one is supplied. */
+	TransEl() : value(0) { }
+	TransEl( Key lowKey, Key highKey ) 
+		: lowKey(lowKey), highKey(highKey), value(0) { }
+	TransEl( Key lowKey, Key highKey, FsmTrans *value ) 
+		: lowKey(lowKey), highKey(highKey), value(value) { }
+
+	Key lowKey, highKey;
+	FsmTrans *value;
+};
+
+struct CmpKey
+{
+	static int compare( const Key key1, const Key key2 )
+	{
+		if ( key1 < key2 )
+			return -1;
+		else if ( key1 > key2 )
+			return 1;
+		else
+			return 0;
+	}
+};
+
+/* Vector based set of key items. */
+typedef BstSet<Key, CmpKey> KeySet;
+
+struct MinPartition 
+{
+	MinPartition() : active(false) { }
+
+	StateList list;
+	bool active;
+
+	MinPartition *prev, *next;
+};
+
+/* Epsilon transition stored in a state. Specifies the target */
+typedef Vector<int> EpsilonTrans;
+
+/* List of states that are to be drawn into this. */
+struct EptVectEl
+{
+	EptVectEl( FsmState *targ, bool leaving ) 
+		: targ(targ), leaving(leaving) { }
+
+	FsmState *targ;
+	bool leaving;
+};
+typedef Vector<EptVectEl> EptVect;
+
+/* Set of entry ids that go into this state. */
+typedef BstSet<int> EntryIdSet;
+
+/* Set of longest match items that may be active in a given state. */
+typedef BstSet<TokenDef*> LmItemSet;
+
+/* Conditions. */
+typedef BstSet< Action*, CmpOrd<Action*> > CondSet;
+typedef CmpTable< Action*, CmpOrd<Action*> > CmpCondSet;
+
+struct CondSpace
+	: public AvlTreeEl<CondSpace>
+{
+	CondSpace( const CondSet &condSet )
+		: condSet(condSet) {}
+	
+	const CondSet &getKey() { return condSet; }
+
+	CondSet condSet;
+	Key baseKey;
+	long condSpaceId;
+};
+
+typedef Vector<CondSpace*> CondSpaceVect;
+
+typedef AvlTree<CondSpace, CondSet, CmpCondSet> CondSpaceMap;
+
+struct StateCond
+{
+	StateCond( Key lowKey, Key highKey ) : /* condSpace is null until assigned. */
+		lowKey(lowKey), highKey(highKey), condSpace(0) {}
+
+	Key lowKey;
+	Key highKey;
+	CondSpace *condSpace;
+
+	StateCond *prev, *next;
+};
+
+typedef DList<StateCond> StateCondList;
+typedef Vector<long> LongVect;
+
+struct Expansion
+{
+	Expansion( Key lowKey, Key highKey ) :
+		lowKey(lowKey), highKey(highKey),
+		fromTrans(0), fromCondSpace(0), 
+		toCondSpace(0) {}
+	
+	~Expansion() /* Owns fromTrans: it is deleted here when set. */
+	{
+		if ( fromTrans != 0 )
+			delete fromTrans;
+	}
+
+	Key lowKey;
+	Key highKey;
+
+	FsmTrans *fromTrans; /* NOTE(review): an implicit copy would share this pointer and delete it twice. */
+	CondSpace *fromCondSpace;
+	long fromVals; /* Not set by the constructor. */
+
+	CondSpace *toCondSpace;
+	LongVect toValsList;
+
+	Expansion *prev, *next;
+};
+
+typedef DList<Expansion> ExpansionList;
+
+struct Removal
+{
+	Key lowKey;
+	Key highKey;
+
+	Removal *next;
+};
+
+struct CondData
+{
+	CondData() : nextCondKey(0) {}
+
+	/* Condition info. */
+	Key nextCondKey;
+
+	CondSpaceMap condSpaceMap;
+};
+
+extern CondData *condData;
+
+/* State class that implements actions and priorities. */
+struct FsmState 
+{
+	FsmState();
+	FsmState(const FsmState &other);
+	~FsmState();
+
+	/* Is the state final? True when the SB_ISFINAL bit is set in stateBits. */
+	bool isFinState() { return stateBits & SB_ISFINAL; }
+
+	/* Out transition list. */
+	TransList outList;
+
+	/* In transition list. */
+	TransInList inList;
+
+	/* Entry points into the state. */
+	EntryIdSet entryIds;
+
+	/* Epsilon transitions. */
+	EpsilonTrans epsilonTrans;
+
+	/* Condition info. */
+	StateCondList stateCondList;
+
+	/* Number of in transitions from states other than ourselves. */
+	int foreignInTrans;
+
+	/* Temporary data for various algorithms. */
+	union {
+		/* When duplicating the fsm we need to map each
+		 * state to the new state representing it. */
+		FsmState *stateMap;
+
+		/* When minimizing machines by partitioning, this maps to the group
+		 * the state is in. */
+		MinPartition *partition;
+
+		/* When merging states (state machine operations) this next pointer is
+		 * used for the list of states that need to be filled in. */
+		FsmState *next;
+
+		/* Identification for printing and stable minimization. */
+		int stateNum;
+
+	} alg;
+
+	/* Data used in epsilon operation, maybe fit into alg? */
+	FsmState *isolatedShadow;
+	int owningGraph;
+
+	/* A pointer to a dict element that contains the set of states this state
+	 * represents. This cannot go into alg, because alg.next is used during
+	 * the merging process. */
+	StateDictEl *stateDictEl;
+
+	/* When drawing epsilon transitions, holds the list of states to merge
+	 * with. */
+	EptVect *eptVect;
+
+	/* Bits controlling the behaviour of the state during collapsing to dfa. */
+	int stateBits;
+
+	/* State list elements. */
+	FsmState *next, *prev;
+
+	/*
+	 * Priority and Action data.
+	 */
+
+	/* Out priorities transferred to out transitions. */
+	PriorTable outPriorTable;
+
+	/* The following two action tables are distinguished by the fact that
+	 * toState actions are executed immediately after transition actions of
+	 * incoming transitions and the current character will be the same as the
+	 * one available then. The fromState actions are executed immediately
+	 * before the transition actions of outgoing transitions and the current
+	 * character is the same as the one available then. */
+
+	/* Actions to execute upon entering into a state. */
+	ActionTable toStateActionTable;
+
+	/* Actions to execute when going from the state to the transition. */
+	ActionTable fromStateActionTable;
+
+	/* Actions to add to any future transitions that leave via this state. */
+	ActionTable outActionTable;
+
+	/* Conditions to add to any future transitions that leave via this state. */
+	ActionSet outCondSet;
+
+	/* Error action tables. */
+	ErrActionTable errActionTable;
+
+	/* Actions to execute on eof. */
+	ActionTable eofActionTable;
+
+	/* Set of longest match items that may be active in this state. */
+	LmItemSet lmItemSet;
+
+	FsmState *eofTarget;
+};
+
+template <class ListItem> struct NextTrans
+{
+	Key lowKey, highKey;
+	ListItem *trans;
+	ListItem *next;
+
+	void load() { /* Cache next and the key range of trans; the keys are left untouched when trans is null. */
+		if ( trans == 0 )
+			next = 0;
+		else {
+			next = trans->next;
+			lowKey = trans->lowKey;
+			highKey = trans->highKey;
+		}
+	}
+
+	void set( ListItem *t ) { /* Point at t and load from it. */
+		trans = t;
+		load();
+	}
+
+	void increment() { /* Step to the cached next item and load from it. */
+		trans = next;
+		load();
+	}
+};
+
+
+/* Encodes the different states that are meaningful to the user of the iterator. */
+enum PairIterUserState
+{
+	RangeInS1, RangeInS2,
+	RangeOverlap,
+	BreakS1, BreakS2
+};
+
+template <class ListItem1, class ListItem2 = ListItem1> struct PairIter
+{
+	/* Encodes the different states that an fsm iterator can be in. */
+	enum IterState {
+		Begin,
+		ConsumeS1Range, ConsumeS2Range,
+		OnlyInS1Range,  OnlyInS2Range,
+		S1SticksOut,    S1SticksOutBreak,
+		S2SticksOut,    S2SticksOutBreak,
+		S1DragsBehind,  S1DragsBehindBreak,
+		S2DragsBehind,  S2DragsBehindBreak,
+		ExactOverlap,   End
+	};
+
+	PairIter( ListItem1 *list1, ListItem2 *list2 );
+	
+	/* Query iterator. */
+	bool lte() { return itState != End; }
+	bool end() { return itState == End; }
+	void operator++(int) { findNext(); }
+	void operator++()    { findNext(); }
+
+	/* Iterator state. */
+	ListItem1 *list1;
+	ListItem2 *list2;
+	IterState itState;
+	PairIterUserState userState;
+
+	NextTrans<ListItem1> s1Tel;
+	NextTrans<ListItem2> s2Tel;
+	Key bottomLow, bottomHigh;
+	ListItem1 *bottomTrans1;
+	ListItem2 *bottomTrans2;
+
+private:
+	void findNext();
+};
+
+/* Init the iterator by advancing to the first item. */
+template <class ListItem1, class ListItem2> PairIter<ListItem1, ListItem2>::PairIter( 
+		ListItem1 *list1, ListItem2 *list2 )
+:
+	list1(list1),
+	list2(list2),
+	itState(Begin)
+{
+	findNext();
+}
+
+/* Return and re-entry for the co-routine iterators. This should ALWAYS be
+ * used inside of a block. */
+#define CO_RETURN(label) \
+	itState = label; \
+	return; \
+	entry##label: backIn = true
+
+/* Return and re-entry for the co-routine iterators. This should ALWAYS be
+ * used inside of a block. */
+#define CO_RETURN2(label, uState) \
+	itState = label; \
+	userState = uState; \
+	return; \
+	entry##label: backIn = true
+
+/* Advance to the next transition. When returns, trans points to the next
+ * transition, unless there are no more, in which case end() returns true. */
+template <class ListItem1, class ListItem2> void PairIter<ListItem1, ListItem2>::findNext()
+{
+	/* This variable is used in dummy statements that follow the entry
+	 * goto labels. The compiler needs some statement to follow the label. */
+	bool backIn;
+
+	/* Jump into the iterator routine based on the iterator state. */
+	switch ( itState ) {
+		case Begin:              goto entryBegin;
+		case ConsumeS1Range:     goto entryConsumeS1Range;
+		case ConsumeS2Range:     goto entryConsumeS2Range;
+		case OnlyInS1Range:      goto entryOnlyInS1Range;
+		case OnlyInS2Range:      goto entryOnlyInS2Range;
+		case S1SticksOut:        goto entryS1SticksOut;
+		case S1SticksOutBreak:   goto entryS1SticksOutBreak;
+		case S2SticksOut:        goto entryS2SticksOut;
+		case S2SticksOutBreak:   goto entryS2SticksOutBreak;
+		case S1DragsBehind:      goto entryS1DragsBehind;
+		case S1DragsBehindBreak: goto entryS1DragsBehindBreak;
+		case S2DragsBehind:      goto entryS2DragsBehind;
+		case S2DragsBehindBreak: goto entryS2DragsBehindBreak;
+		case ExactOverlap:       goto entryExactOverlap;
+		case End:                goto entryEnd;
+	}
+
+entryBegin:
+	/* Set up the next structs at the head of the transition lists. */
+	s1Tel.set( list1 );
+	s2Tel.set( list2 );
+
+	/* Concurrently scan both out ranges. */
+	while ( true ) {
+		if ( s1Tel.trans == 0 ) {
+			/* We are at the end of state1's ranges. Process the rest of
+			 * state2's ranges. */
+			while ( s2Tel.trans != 0 ) {
+				/* Range is only in s2. */
+				CO_RETURN2( ConsumeS2Range, RangeInS2 );
+				s2Tel.increment();
+			}
+			break;
+		}
+		else if ( s2Tel.trans == 0 ) {
+			/* We are at the end of state2's ranges. Process the rest of
+			 * state1's ranges. */
+			while ( s1Tel.trans != 0 ) {
+				/* Range is only in s1. */
+				CO_RETURN2( ConsumeS1Range, RangeInS1 );
+				s1Tel.increment();
+			}
+			break;
+		}
+		/* Both state1's and state2's transition elements are good.
+		 * The signature of no overlap is a back key being in front of a
+		 * front key. */
+		else if ( s1Tel.highKey < s2Tel.lowKey ) {
+			/* A range exists in state1 that does not overlap with state2. */
+			CO_RETURN2( OnlyInS1Range, RangeInS1 );
+			s1Tel.increment();
+		}
+		else if ( s2Tel.highKey < s1Tel.lowKey ) {
+			/* A range exists in state2 that does not overlap with state1. */
+			CO_RETURN2( OnlyInS2Range, RangeInS2 );
+			s2Tel.increment();
+		}
+		/* There is overlap, must mix the ranges in some way. */
+		else if ( s1Tel.lowKey < s2Tel.lowKey ) {
+			/* Range from state1 sticks out front. Must break it into
+			 * non-overlapping and overlapping segments. */
+			bottomLow = s2Tel.lowKey;
+			bottomHigh = s1Tel.highKey;
+			s1Tel.highKey = s2Tel.lowKey;
+			s1Tel.highKey.decrement();
+			bottomTrans1 = s1Tel.trans;
+
+			/* Notify the caller that we are breaking s1. This gives them a
+			 * chance to duplicate s1Tel[0,1].value. */
+			CO_RETURN2( S1SticksOutBreak, BreakS1 );
+
+			/* Broken off range is only in s1. */
+			CO_RETURN2( S1SticksOut, RangeInS1 );
+
+			/* Advance over the part sticking out front. */
+			s1Tel.lowKey = bottomLow;
+			s1Tel.highKey = bottomHigh;
+			s1Tel.trans = bottomTrans1;
+		}
+		else if ( s2Tel.lowKey < s1Tel.lowKey ) {
+			/* Range from state2 sticks out front. Must break it into
+			 * non-overlapping and overlapping segments. */
+			bottomLow = s1Tel.lowKey;
+			bottomHigh = s2Tel.highKey;
+			s2Tel.highKey = s1Tel.lowKey;
+			s2Tel.highKey.decrement();
+			bottomTrans2 = s2Tel.trans;
+
+			/* Notify the caller that we are breaking s2. This gives them a
+			 * chance to duplicate s2Tel[0,1].value. */
+			CO_RETURN2( S2SticksOutBreak, BreakS2 );
+
+			/* Broken off range is only in s2. */
+			CO_RETURN2( S2SticksOut, RangeInS2 );
+
+			/* Advance over the part sticking out front. */
+			s2Tel.lowKey = bottomLow;
+			s2Tel.highKey = bottomHigh;
+			s2Tel.trans = bottomTrans2;
+		}
+		/* Low ends are even. Are the high ends even? */
+		else if ( s1Tel.highKey < s2Tel.highKey ) {
+			/* Range from state2 goes longer than the range from state1. We
+			 * must break the range from state2 into an evenly overlapping
+			 * segment. */
+			bottomLow = s1Tel.highKey;
+			bottomLow.increment();
+			bottomHigh = s2Tel.highKey;
+			s2Tel.highKey = s1Tel.highKey;
+			bottomTrans2 = s2Tel.trans;
+
+			/* Notify the caller that we are breaking s2. This gives them a
+			 * chance to duplicate s2Tel[0,1].value. */
+			CO_RETURN2( S2DragsBehindBreak, BreakS2 );
+
+			/* Breaking s2 produces exact overlap. */
+			CO_RETURN2( S2DragsBehind, RangeOverlap );
+
+			/* Advance over the front we just broke off of range 2. */
+			s2Tel.lowKey = bottomLow;
+			s2Tel.highKey = bottomHigh;
+			s2Tel.trans = bottomTrans2;
+
+			/* Advance over the entire s1Tel. We have consumed it. */
+			s1Tel.increment();
+		}
+		else if ( s2Tel.highKey < s1Tel.highKey ) {
+			/* Range from state1 goes longer than the range from state2. We
+			 * must break the range from state1 into an evenly overlapping
+			 * segment. */
+			bottomLow = s2Tel.highKey;
+			bottomLow.increment();
+			bottomHigh = s1Tel.highKey;
+			s1Tel.highKey = s2Tel.highKey;
+			bottomTrans1 = s1Tel.trans;
+
+			/* Notify the caller that we are breaking s1. This gives them a
+			 * chance to duplicate s1Tel[0,1].value. */
+			CO_RETURN2( S1DragsBehindBreak, BreakS1 );
+
+			/* Breaking s1 produces exact overlap. */
+			CO_RETURN2( S1DragsBehind, RangeOverlap );
+
+			/* Advance over the front we just broke off of range 1. */
+			s1Tel.lowKey = bottomLow;
+			s1Tel.highKey = bottomHigh;
+			s1Tel.trans = bottomTrans1;
+
+			/* Advance over the entire s2Tel. We have consumed it. */
+			s2Tel.increment();
+		}
+		else {
+			/* There is an exact overlap. */
+			CO_RETURN2( ExactOverlap, RangeOverlap );
+
+			s1Tel.increment();
+			s2Tel.increment();
+		}
+	}
+
+	/* Done, go into end state. */
+	CO_RETURN( End );
+}
+
+
+/* Compare lists of epsilon transitions. Entries are name ids of targets. */
+typedef CmpTable< int, CmpOrd<int> > CmpEpsilonTrans;
+
+/* Compare class for the Approximate minimization. */
+class ApproxCompare
+{
+public:
+	ApproxCompare() { }
+	int compare( const FsmState *pState1, const FsmState *pState2 );
+};
+
+/* Compare class for the initial partitioning of a partition minimization. */
+class InitPartitionCompare
+{
+public:
+	InitPartitionCompare() { }
+	int compare( const FsmState *pState1, const FsmState *pState2 );
+};
+
+/* Compare class for the regular partitioning of a partition minimization. */
+class PartitionCompare
+{
+public:
+	PartitionCompare() { }
+	int compare( const FsmState *pState1, const FsmState *pState2 );
+};
+
+/* Compare class for a minimization that marks pairs. Provides the shouldMark
+ * routine. */
+class MarkCompare
+{
+public:
+	MarkCompare() { }
+	bool shouldMark( MarkIndex &markIndex, const FsmState *pState1, 
+			const FsmState *pState2 );
+};
+
+/* List of partitions. */
+typedef DList< MinPartition > PartitionList;
+
+/* List of transitions out of a state. */
+typedef Vector<TransEl> TransListVect;
+
+/* Entry point map used for keeping track of entry points in a machine. */
+typedef BstSet< int > EntryIdSet;
+typedef BstMapEl< int, FsmState* > EntryMapEl;
+typedef BstMap< int, FsmState* > EntryMap;
+typedef Vector<EntryMapEl> EntryMapBase;
+
+/* Graph class that implements actions and priorities. */
+struct FsmGraph 
+{
+	/* Constructors/Destructors. */
+	FsmGraph( );
+	FsmGraph( const FsmGraph &graph );
+	~FsmGraph();
+
+	/* The list of states. */
+	StateList stateList;
+	StateList misfitList;
+
+	/* The map of entry points. */
+	EntryMap entryPoints;
+
+	/* The start state. */
+	FsmState *startState;
+
+	/* Error state, possibly created only when the final machine has been
+	 * created and the XML machine is about to be written. No transitions
+	 * point to this state. */
+	FsmState *errState;
+
+	/* The set of final states. */
+	StateSet finStateSet;
+
+	/* Misfit accounting: whether misfits are put on a separate list. */
+	bool misfitAccounting;
+
+	bool lmRequiresErrorState;
+	NameInst *rootName;
+	NameInst **nameIndex;
+
+	/*
+	 * Transition actions and priorities.
+	 */
+
+	/* Set priorities on transitions. */
+	void startFsmPrior( int ordering, PriorDesc *prior );
+	void allTransPrior( int ordering, PriorDesc *prior );
+	void finishFsmPrior( int ordering, PriorDesc *prior );
+	void leaveFsmPrior( int ordering, PriorDesc *prior );
+
+	/* Action setting support. */
+	void transferErrorActions( FsmState *state, int transferPoint );
+	void setErrorAction( FsmState *state, int ordering, Action *action );
+	void setErrorActions( FsmState *state, const ActionTable &other );
+
+	/* Fill all spaces in a transition list with an error transition. */
+	void fillGaps( FsmState *state );
+
+	/* Similar to setErrorAction, instead gives a state to go to on error. */
+	void setErrorTarget( FsmState *state, FsmState *target, int *orderings, 
+			Action **actions, int nActs );
+
+	/* Set actions to execute. */
+	void startFsmAction( int ordering, Action *action );
+	void allTransAction( int ordering, Action *action );
+	void finishFsmAction( int ordering, Action *action );
+	void leaveFsmAction( int ordering, Action *action );
+	void longMatchAction( int ordering, TokenDef *lmPart );
+
+	/* Set conditions. */
+	CondSpace *addCondSpace( const CondSet &condSet );
+
+	void findEmbedExpansions( ExpansionList &expansionList, 
+		FsmState *destState, Action *condAction );
+	void embedCondition( MergeData &md, FsmState *state, Action *condAction );
+	void embedCondition( FsmState *state, Action *condAction );
+
+	void startFsmCondition( Action *condAction );
+	void allTransCondition( Action *condAction );
+	void leaveFsmCondition( Action *condAction );
+
+	/* Set error actions to execute. */
+	void startErrorAction( int ordering, Action *action, int transferPoint );
+	void allErrorAction( int ordering, Action *action, int transferPoint );
+	void finalErrorAction( int ordering, Action *action, int transferPoint );
+	void notStartErrorAction( int ordering, Action *action, int transferPoint );
+	void notFinalErrorAction( int ordering, Action *action, int transferPoint );
+	void middleErrorAction( int ordering, Action *action, int transferPoint );
+
+	/* Set EOF actions. */
+	void startEOFAction( int ordering, Action *action );
+	void allEOFAction( int ordering, Action *action );
+	void finalEOFAction( int ordering, Action *action );
+	void notStartEOFAction( int ordering, Action *action );
+	void notFinalEOFAction( int ordering, Action *action );
+	void middleEOFAction( int ordering, Action *action );
+
+	/* Set To State actions. */
+	void startToStateAction( int ordering, Action *action );
+	void allToStateAction( int ordering, Action *action );
+	void finalToStateAction( int ordering, Action *action );
+	void notStartToStateAction( int ordering, Action *action );
+	void notFinalToStateAction( int ordering, Action *action );
+	void middleToStateAction( int ordering, Action *action );
+
+	/* Set From State actions. */
+	void startFromStateAction( int ordering, Action *action );
+	void allFromStateAction( int ordering, Action *action );
+	void finalFromStateAction( int ordering, Action *action );
+	void notStartFromStateAction( int ordering, Action *action );
+	void notFinalFromStateAction( int ordering, Action *action );
+	void middleFromStateAction( int ordering, Action *action );
+
+	/* Shift the action ordering of the start transitions to start at
+	 * fromOrder and increase in units of 1. Useful before kleene star
+	 * operation.  */
+	int shiftStartActionOrder( int fromOrder );
+
+	/* Clear all priorities from the fsm so they won't affect minimization
+	 * of the final fsm. */
+	void clearAllPriorities();
+
+	/* Zero out all the function keys. */
+	void nullActionKeys();
+
+	/* Walk the list of states and verify state properties. */
+	void verifyStates();
+
+	/* Misfit accounting: set whether misfits are put on a separate list. */
+	void setMisfitAccounting( bool val ) 
+		{ misfitAccounting = val; }
+
+	/* Set and Unset a state as final. */
+	void setFinState( FsmState *state );
+	void unsetFinState( FsmState *state );
+
+	void setStartState( FsmState *state );
+	void unsetStartState( );
+	
+	/* Set and unset a state as an entry point. */
+	void setEntry( int id, FsmState *state );
+	void changeEntry( int id, FsmState *to, FsmState *from );
+	void unsetEntry( int id, FsmState *state );
+	void unsetEntry( int id );
+	void unsetAllEntryPoints();
+
+	/* Epsilon transitions. */
+	void epsilonTrans( int id );
+	void shadowReadWriteStates( MergeData &md );
+
+	/*
+	 * Basic attaching and detaching.
+	 */
+
+	/* Common to attaching/detaching list and default. */
+	void attachToInList( FsmState *from, FsmState *to, FsmTrans *&head, FsmTrans *trans );
+	void detachFromInList( FsmState *from, FsmState *to, FsmTrans *&head, FsmTrans *trans );
+
+	/* Attach with a new transition. */
+	FsmTrans *attachNewTrans( FsmState *from, FsmState *to,
+			Key onChar1, Key onChar2 );
+
+	/* Attach with an existing transition that is already in an out list. */
+	void attachTrans( FsmState *from, FsmState *to, FsmTrans *trans );
+	
+	/* Redirect a transition away from error and towards some state. */
+	void redirectErrorTrans( FsmState *from, FsmState *to, FsmTrans *trans );
+
+	/* Detach a transition from a target state. */
+	void detachTrans( FsmState *from, FsmState *to, FsmTrans *trans );
+
+	/* Detach a state from the graph. */
+	void detachState( FsmState *state );
+
+	/*
+	 * NFA to DFA conversion routines.
+	 */
+
+	/* Duplicate a transition that will dropin to a free spot. */
+	FsmTrans *dupTrans( FsmState *from, FsmTrans *srcTrans );
+
+	/* In crossing, two transitions both go to real states. */
+	FsmTrans *fsmAttachStates( MergeData &md, FsmState *from,
+			FsmTrans *destTrans, FsmTrans *srcTrans );
+
+	/* Two transitions are to be crossed, handle the possibility of either
+	 * going to the error state. */
+	FsmTrans *mergeTrans( MergeData &md, FsmState *from,
+			FsmTrans *destTrans, FsmTrans *srcTrans );
+
+	/* Compare to determine relative priorities of two transition tables. */
+	int comparePrior( const PriorTable &priorTable1, const PriorTable &priorTable2 );
+
+	/* Cross a src transition with one that is already occupying a spot. */
+	FsmTrans *crossTransitions( MergeData &md, FsmState *from,
+			FsmTrans *destTrans, FsmTrans *srcTrans );
+
+	void outTransCopy( MergeData &md, FsmState *dest, FsmTrans *srcList );
+
+	void doRemove( MergeData &md, FsmState *destState, ExpansionList &expList1 );
+	void doExpand( MergeData &md, FsmState *destState, ExpansionList &expList1 );
+	void findCondExpInTrans( ExpansionList &expansionList, FsmState *state, 
+			Key lowKey, Key highKey, CondSpace *fromCondSpace, CondSpace *toCondSpace,
+			long destVals, LongVect &toValsList );
+	void findTransExpansions( ExpansionList &expansionList, 
+			FsmState *destState, FsmState *srcState );
+	void findCondExpansions( ExpansionList &expansionList, 
+			FsmState *destState, FsmState *srcState );
+	void mergeStateConds( FsmState *destState, FsmState *srcState );
+
+	/* Merge a set of states into newState. */
+	void mergeStates( MergeData &md, FsmState *destState, 
+			FsmState **srcStates, int numSrc );
+	void mergeStatesLeaving( MergeData &md, FsmState *destState, FsmState *srcState );
+	void mergeStates( MergeData &md, FsmState *destState, FsmState *srcState );
+
+	/* Make all states that are combinations of other states and that
+	 * have not yet had their out transitions filled in. This will
+	 * empty out stateDict and the stfill list. */
+	void fillInStates( MergeData &md );
+
+	/*
+	 * Transition Comparison.
+	 */
+
+	/* Compare transition data. Either of the pointers may be null. */
+	static inline int compareDataPtr( FsmTrans *trans1, FsmTrans *trans2 );
+
+	/* Compare target state and transition data. Either pointer may be null. */
+	static inline int compareFullPtr( FsmTrans *trans1, FsmTrans *trans2 );
+
+	/* Compare target partitions. Either pointer may be null. */
+	static inline int comparePartPtr( FsmTrans *trans1, FsmTrans *trans2 );
+
+	/* Check marked status of target states. Either pointer may be null. */
+	static inline bool shouldMarkPtr( MarkIndex &markIndex, 
+			FsmTrans *trans1, FsmTrans *trans2 );
+
+	/*
+	 * Callbacks.
+	 */
+
+	/* Compare priority and function table of transitions. */
+	static int compareTransData( FsmTrans *trans1, FsmTrans *trans2 );
+
+	/* Add in the properties of srcTrans into this. */
+	void addInTrans( FsmTrans *destTrans, FsmTrans *srcTrans );
+
+	/* Compare states on data stored in the states. */
+	static int compareStateData( const FsmState *state1, const FsmState *state2 );
+
+	/* Out transition data. */
+	void clearOutData( FsmState *state );
+	bool hasOutData( FsmState *state );
+	void transferOutData( FsmState *destState, FsmState *srcState );
+
+	/*
+	 * Allocation.
+	 */
+
+	/* New up a state and add it to the graph. */
+	FsmState *addState();
+
+	/*
+	 * Building basic machines
+	 */
+
+	void concatFsm( Key c );
+	void concatFsm( Key *str, int len );
+	void concatFsmCI( Key *str, int len );
+	void orFsm( Key *set, int len );
+	void rangeFsm( Key low, Key high );
+	void rangeStarFsm( Key low, Key high );
+	void emptyFsm( );
+	void lambdaFsm( );
+
+	/*
+	 * Fsm operators.
+	 */
+
+	void starOp( );
+	void repeatOp( int times );
+	void optionalRepeatOp( int times );
+	void concatOp( FsmGraph *other );
+	void unionOp( FsmGraph *other );
+	void intersectOp( FsmGraph *other );
+	void subtractOp( FsmGraph *other );
+	void epsilonOp();
+	void joinOp( int startId, int finalId, FsmGraph **others, int numOthers );
+	void globOp( FsmGraph **others, int numOthers );
+	void deterministicEntry();
+
+	/*
+	 * Operator workers
+	 */
+
+	/* Determine if there are any entry points into a start state other than
+	 * the start state. */
+	bool isStartStateIsolated();
+
+	/* Make a new start state that has no entry points. Will not change the
+	 * identity of the fsm. */
+	void isolateStartState();
+
+	/* Workers for resolving epsilon transitions. */
+	bool inEptVect( EptVect *eptVect, FsmState *targ );
+	void epsilonFillEptVectFrom( FsmState *root, FsmState *from, bool parentLeaving );
+	void resolveEpsilonTrans( MergeData &md );
+
+	/* Workers for concatenation and union. */
+	void doConcat( FsmGraph *other, StateSet *fromStates, bool optional );
+	void doOr( FsmGraph *other );
+
+	/*
+	 * Final states
+	 */
+
+	/* Unset any final states that are no longer to be final
+	 * due to final bits. */
+	void unsetIncompleteFinals();
+	void unsetKilledFinals();
+
+	/* Bring in other's entry points. Assumes others states are going to be
+	 * copied into this machine. */
+	void copyInEntryPoints( FsmGraph *other );
+
+	/* Ordering states. */
+	void depthFirstOrdering( FsmState *state );
+	void depthFirstOrdering();
+	void sortStatesByFinal();
+
+	/* Set sequential state numbers starting at base. */
+	void setStateNumbers( int base );
+
+	/* Unset all final states. */
+	void unsetAllFinStates();
+
+	/* Set the bits of final states and clear the bits of non final states. */
+	void setFinBits( int finStateBits );
+
+	/*
+	 * Self-consistency checks.
+	 */
+
+	/* Run a sanity check on the machine. */
+	void verifyIntegrity();
+
+	/* Verify that there are no unreachable states, or dead end states. */
+	void verifyReachability();
+	void verifyNoDeadEndStates();
+
+	/*
+	 * Path pruning
+	 */
+
+	/* Mark all states reachable from state. */
+	void markReachableFromHereReverse( FsmState *state );
+
+	/* Mark all states reachable from state. */
+	void markReachableFromHere( FsmState *state );
+	void markReachableFromHereStopFinal( FsmState *state );
+
+	/* Removes states that cannot be reached by any path in the fsm and are
+	 * thus wasted silicon. */
+	void removeDeadEndStates();
+
+	/* Removes states that cannot be reached by any path in the fsm and are
+	 * thus wasted silicon. */
+	void removeUnreachableStates();
+
+	/* Remove error actions from states on which the error transition will
+	 * never be taken. */
+	bool outListCovers( FsmState *state );
+	bool anyErrorRange( FsmState *state );
+
+	/* Remove states that are on the misfit list. */
+	void removeMisfits();
+
+	/*
+	 * FSM Minimization
+	 */
+
+	/* Minimization by partitioning. */
+	void minimizePartition1();
+	void minimizePartition2();
+
+	/* Minimize the final state Machine. The result is the minimal fsm. Slow
+	 * but stable, correct minimization. Uses n^2 space (lookout) and average
+	 * n^2 time. Worst case n^3 time, but that is a very rare case. */
+	void minimizeStable();
+
+	/* Minimize the final state machine. Does not find the minimal fsm, but a
+	 * pretty good approximation. Does not use any extra space. Average n^2
+	 * time. Worst case n^3 time, but that is a very rare case. */
+	void minimizeApproximate();
+
+	/* This is the worker for the minimize approximate solution. It merges
+	 * states that have identical out transitions. */
+	bool minimizeRound( );
+
+	/* Given an initial partitioning of states, split partitions that have out trans
+	 * to differing partitions. */
+	int partitionRound( FsmState **statePtrs, MinPartition *parts, int numParts );
+
+	/* Split partitions that have a transition to a previously split partition, until
+	 * there are no more partitions to split. */
+	int splitCandidates( FsmState **statePtrs, MinPartition *parts, int numParts );
+
+	/* Fuse together states in the same partition. */
+	void fusePartitions( MinPartition *parts, int numParts );
+
+	/* Mark pairs where out final stateness differs, out trans data differs,
+	 * trans pairs go to a marked pair or trans data differs. Should get
+	 * a lot of pairs. */
+	void initialMarkRound( MarkIndex &markIndex );
+
+	/* One marking round on all state pairs. Considers if trans pairs go
+	 * to a marked state only. Returns whether or not a pair was marked. */
+	bool markRound( MarkIndex &markIndex );
+
+	/* Move the in transitions that go into src over to dest. */
+	void inTransMove(FsmState *dest, FsmState *src);
+	
+	/* Make state src and dest the same state. */
+	void fuseEquivStates(FsmState *dest, FsmState *src);
+
+	/* Find any states that didn't get marked by the marking algorithm and
+	 * merge them into the primary states of their equivalence class. */
+	void fuseUnmarkedPairs( MarkIndex &markIndex );
+
+	/* Merge neighboring transitions that go to the same state and have the
+	 * same transition data. */
+	void compressTransitions();
+
+	/* Returns true if there is a transition (either explicit or by a gap) to
+	 * the error state. */
+	bool checkErrTrans( FsmState *state, FsmTrans *trans );
+	bool checkErrTransFinish( FsmState *state );
+	bool hasErrorTrans();
+};
+
+
+#endif /* _FSMGRAPH_H */
diff --git a/colm/fsmmin.cpp b/colm/fsmmin.cpp
new file mode 100644
index 00000000..901659f5
--- /dev/null
+++ b/colm/fsmmin.cpp
@@ -0,0 +1,732 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "fsmgraph.h"
+#include "mergesort.h"
+
+int FsmGraph::partitionRound( FsmState **statePtrs, MinPartition *parts, int numParts )
+{
+	/* One splitting pass: sort each partition and break it where states differ. */
+	MergeSort<FsmState*, PartitionCompare> mergeSort;
+	PartitionCompare partCompare;
+
+	/* For each partition. numParts grows below, so new partitions are visited too. */
+	for ( int p = 0; p < numParts; p++ ) {
+		/* Fill the pointer array with the states in the partition. */
+		StateList::Iter state = parts[p].list;
+		for ( int s = 0; state.lte(); state++, s++ )
+			statePtrs[s] = state;
+
+		/* Sort the states using the partitioning compare. */
+		int numStates = parts[p].list.length();
+		mergeSort.sort( statePtrs, numStates );
+
+		/* Assign the states into partitions based on the results of the sort. */
+		int destPart = p, firstNewPart = numParts;
+		for ( int s = 1; s < numStates; s++ ) {
+			/* If this state differs from the last then move to the next partition. */
+			if ( partCompare.compare( statePtrs[s-1], statePtrs[s] ) < 0 ) {
+				/* The new partition is the next available slot in parts. */
+				destPart = numParts;
+				numParts += 1;
+			}
+
+			/* If the state is not staying in the first partition, then
+			 * transfer it to its destination partition. */
+			if ( destPart != p ) {
+				FsmState *state = parts[p].list.detach( statePtrs[s] );
+				parts[destPart].list.append( state );
+			}
+		}
+
+		/* Fix the partition pointer for all the states that got moved to a new
+		 * partition. This must be done after the states are transferred so the
+		 * result of the sort is not altered. */
+		for ( int newPart = firstNewPart; newPart < numParts; newPart++ ) {
+			StateList::Iter state = parts[newPart].list;
+			for ( ; state.lte(); state++ )
+				state->alg.partition = &parts[newPart];
+		}
+	}
+	/* Equal to the numParts that was passed in when nothing was split. */
+	return numParts;
+}
+
+/**
+ * \brief Minimize by partitioning version 1.
+ *
+ * Splits partitions round after round until a round splits nothing, then
+ * fuses each partition into one state. Yields the most minimal FSM possible.
+ */
+void FsmGraph::minimizePartition1()
+{
+	/* Sorter and comparator used to build the initial partitioning. */
+	MergeSort<FsmState*, InitPartitionCompare> sorter;
+	InitPartitionCompare initCmp;
+
+	/* An empty graph needs no work. */
+	if ( stateList.length() == 0 )
+		return;
+
+	/*
+	 * Step one: group the states by final state status and transition
+	 * functions. The groups are the initial partitioning that the splitting
+	 * rounds below refine.
+	 */
+
+	/* Collect a pointer to every state into a flat array for sorting. */
+	int total = stateList.length();
+	FsmState **sorted = new FsmState*[total];
+	int fill = 0;
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		sorted[fill++] = st;
+
+	/* Order the array with the initial partition compare. */
+	sorter.sort( sorted, total );
+
+	/* Storage for the partitions: one slot is allocated per state. */
+	MinPartition *parts = new MinPartition[total];
+
+	/* Walk the sorted array. Whenever a state compares different from its
+	 * predecessor the following states go into the next partition. */
+	int lastPart = 0;
+	for ( int i = 0; i < total; i++ ) {
+		if ( i > 0 && initCmp.compare( sorted[i-1], sorted[i] ) < 0 )
+			lastPart += 1;
+
+		/* Record the owning partition on the state and link the state in. */
+		MinPartition *dest = &parts[lastPart];
+		sorted[i]->alg.partition = dest;
+		dest->list.append( sorted[i] );
+	}
+
+	/* The states now sit on partition lists but were never unlinked from the
+	 * main list, so have the main list forget them. */
+	stateList.abandon();
+
+	/*
+	 * Step two: run splitting rounds over all partitions. A round that
+	 * returns the same count it was given split nothing, which ends the
+	 * loop.
+	 */
+	int numParts = lastPart + 1;
+	for ( ;; ) {
+		int afterRound = partitionRound( sorted, parts, numParts );
+		if ( afterRound == numParts )
+			break;
+
+		numParts = afterRound;
+	}
+
+	/*
+	 * Step three: collapse every partition into one state. Fusing puts the
+	 * surviving states back on the main list.
+	 */
+	fusePartitions( parts, numParts );
+
+	/* Release the scratch arrays. */
+	delete[] sorted;
+	delete[] parts;
+}
+
+/* Split partitions that need splitting, decide which partitions might need
+ * to be split as a result, continue until there are no more that might need
+ * to be split. Returns the number of partitions in use afterwards. */
+int FsmGraph::splitCandidates( FsmState **statePtrs, MinPartition *parts, int numParts )
+{
+	/* Need a mergesort and a partition compare. */
+	MergeSort<FsmState*, PartitionCompare> mergeSort;
+	PartitionCompare partCompare;
+
+	/* The lists of unsplittable (partList) and splittable partitions.
+	 * Only partitions in the splittable list are checked for needing splitting. */
+	PartitionList partList, splittable;
+
+	/* Initially, all partitions are born from a split (the initial
+	 * partitioning) and can cause other partitions to be split. So any
+	 * partition with a state with a transition out to another partition is a
+	 * candidate for splitting. This will make every partition except possibly
+	 * partitions of final states split candidates. */
+	for ( int p = 0; p < numParts; p++ ) {
+		/* Assume not active. */
+		parts[p].active = false;
+
+		/* Look for a trans out of any state in the partition. */
+		for ( StateList::Iter state = parts[p].list; state.lte(); state++ ) {
+			/* If the state has at least one out transition (the target is
+			 * not inspected) then the partition becomes splittable. */
+			if ( state->outList.length() > 0 ) {
+				parts[p].active = true;
+				break;
+			}
+		}
+
+		/* If it was found active then it goes on the splittable list. */
+		if ( parts[p].active )
+			splittable.append( &parts[p] );
+		else
+			partList.append( &parts[p] );
+	}
+
+	/* While there are partitions that are splittable, pull one off and try
+	 * to split it. If it splits, determine which partitions may now be split
+	 * as a result of the newly split partition. */
+	while ( splittable.length() > 0 ) {
+		MinPartition *partition = splittable.detachFirst();
+
+		/* Fill the pointer array with the states in the partition. */
+		StateList::Iter state = partition->list;
+		for ( int s = 0; state.lte(); state++, s++ )
+			statePtrs[s] = state;
+
+		/* Sort the states using the partitioning compare. */
+		int numStates = partition->list.length();
+		mergeSort.sort( statePtrs, numStates );
+
+		/* Assign the states into partitions based on the results of the sort. */
+		MinPartition *destPart = partition;
+		int firstNewPart = numParts;
+		for ( int s = 1; s < numStates; s++ ) {
+			/* If this state differs from the last then move to the next partition. */
+			if ( partCompare.compare( statePtrs[s-1], statePtrs[s] ) < 0 ) {
+				/* The new partition is the next available slot in parts. */
+				destPart = &parts[numParts];
+				numParts += 1;
+			}
+
+			/* If the state is not staying in the first partition, then
+			 * transfer it to its destination partition. */
+			if ( destPart != partition ) {
+				FsmState *state = partition->list.detach( statePtrs[s] );
+				destPart->list.append( state );
+			}
+		}
+
+		/* Fix the partition pointer for all the states that got moved to a new
+		 * partition. This must be done after the states are transferred so the
+		 * result of the sort is not altered. */
+		int newPart;
+		for ( newPart = firstNewPart; newPart < numParts; newPart++ ) {
+			StateList::Iter state = parts[newPart].list;
+			for ( ; state.lte(); state++ )
+				state->alg.partition = &parts[newPart];
+		}
+
+		/* Put the partition we just split and any new partitions that came out
+		 * of the split onto the inactive list. */
+		partition->active = false;
+		partList.append( partition );
+		for ( newPart = firstNewPart; newPart < numParts; newPart++ ) {
+			parts[newPart].active = false;
+			partList.append( &parts[newPart] );
+		}
+		/* destPart never moved: nothing was split off, so nothing to propagate. */
+		if ( destPart == partition )
+			continue;
+
+		/* Now determine which partitions are splittable as a result of
+		 * splitting partition by walking the in lists of the states in
+		 * partitions that got split. Partition is the faked first item in the
+		 * loop, visited under the index firstNewPart - 1. */
+		MinPartition *causalPart = partition;
+		newPart = firstNewPart - 1;
+		while ( newPart < numParts ) {
+			/* Loop all states in the causal partition. */
+			StateList::Iter state = causalPart->list;
+			for ( ; state.lte(); state++ ) {
+				/* Walk all transitions into the state and put the partition
+				 * that the from state is in onto the splittable list. */
+				for ( TransInList::Iter trans = state->inList; trans.lte(); trans++ ) {
+					MinPartition *fromPart = trans->fromState->alg.partition;
+					if ( ! fromPart->active ) {
+						fromPart->active = true;
+						partList.detach( fromPart );
+						splittable.append( fromPart );
+					}
+				}
+			}
+
+			newPart += 1;
+			causalPart = &parts[newPart];
+		}
+	}
+	return numParts;
+}
+
+
+/**
+ * \brief Minimize by partitioning version 2 (best alg).
+ *
+ * Only re-examines partitions that may have become splittable, and stops
+ * once no such candidates are left. Runs faster than version 1. Produces
+ * the most minimal fsm possible.
+ */
+void FsmGraph::minimizePartition2()
+{
+	/* Sorter and comparator used to build the initial partitioning. */
+	MergeSort<FsmState*, InitPartitionCompare> sorter;
+	InitPartitionCompare initCmp;
+
+	/* An empty graph needs no work. */
+	if ( stateList.length() == 0 )
+		return;
+
+	/*
+	 * Step one: group the states by final state status and transition
+	 * functions. The groups are the initial partitioning that the candidate
+	 * splitting below refines.
+	 */
+
+	/* Collect a pointer to every state into a flat array for sorting. */
+	int total = stateList.length();
+	FsmState **sorted = new FsmState*[total];
+	int fill = 0;
+	for ( StateList::Iter st = stateList; st.lte(); st++ )
+		sorted[fill++] = st;
+
+	/* Order the array with the initial partition compare. */
+	sorter.sort( sorted, total );
+
+	/* Storage for the partitions: one slot is allocated per state. */
+	MinPartition *parts = new MinPartition[total];
+
+	/* Walk the sorted array. Whenever a state compares different from its
+	 * predecessor the following states go into the next partition. */
+	int lastPart = 0;
+	for ( int i = 0; i < total; i++ ) {
+		if ( i > 0 && initCmp.compare( sorted[i-1], sorted[i] ) < 0 )
+			lastPart += 1;
+
+		/* Record the owning partition on the state and link the state in. */
+		MinPartition *dest = &parts[lastPart];
+		sorted[i]->alg.partition = dest;
+		dest->list.append( sorted[i] );
+	}
+
+	/* The states now sit on partition lists but were never unlinked from the
+	 * main list, so have the main list forget them. */
+	stateList.abandon();
+
+	/* Step two: split candidate partitions until none are left. The call
+	 * returns the partition count after all splitting is done. */
+	int numParts = splitCandidates( sorted, parts, lastPart + 1 );
+
+	/*
+	 * Step three: collapse every partition into one state. Fusing puts the
+	 * surviving states back on the main list.
+	 */
+	fusePartitions( parts, numParts );
+
+	/* Release the scratch arrays. */
+	delete[] sorted;
+	delete[] parts;
+}
+
+/* Seeds the pair marking algorithm. Every unordered pair of distinct states
+ * on the main list is run through the initial partition compare, and the
+ * pair is marked in markIndex when the compare reports any difference
+ * between the two states. */
+void FsmGraph::initialMarkRound( MarkIndex &markIndex )
+{
+	/* According to the original notes this compare separates states on
+	 * final state status, out transitions and any transition data. */
+	InitPartitionCompare cmp;
+
+	/* The outer loop visits every state on the main list. The inner loop
+	 * restarts at the head and stops just short of the outer state, which
+	 * yields each unordered pair of distinct states exactly once. */
+	for ( FsmState *outer = stateList.head; outer != 0; outer = outer->next ) {
+		for ( FsmState *inner = stateList.head; inner != outer; inner = inner->next ) {
+			/* Equal under the compare: nothing to record for this pair. */
+			if ( cmp.compare( outer, inner ) == 0 )
+				continue;
+
+			/* The states differ, so record the pair as distinct under the
+			 * state numbers of its two members. */
+			markIndex.markPair( outer->alg.stateNum, inner->alg.stateNum );
+		}
+	}
+}
+
+/* One refinement round of the pair marking algorithm. Every pair that is not
+ * marked yet is handed to MarkCompare::shouldMark and gets marked when that
+ * call says so. Returns true if at least one pair was newly marked. */
+bool FsmGraph::markRound( MarkIndex &markIndex )
+{
+	/* Decides whether an unmarked pair has to be marked. */
+	MarkCompare markCompare;
+
+	/* Becomes true as soon as this round marks something. */
+	bool anyMarked = false;
+
+	/* Visit each unordered pair of distinct states once: the inner walk
+	 * starts at the list head and stops before reaching the outer state. */
+	for ( FsmState *outer = stateList.head; outer != 0; outer = outer->next ) {
+		for ( FsmState *inner = stateList.head; inner != outer; inner = inner->next ) {
+			/* Pairs that are already marked need no further testing. */
+			if ( markIndex.isPairMarked( outer->alg.stateNum, inner->alg.stateNum ) )
+				continue;
+
+			/* Newly distinguishable pairs are recorded right away. */
+			if ( markCompare.shouldMark( markIndex, outer, inner ) ) {
+				markIndex.markPair( outer->alg.stateNum, inner->alg.stateNum );
+				anyMarked = true;
+			}
+		}
+	}
+
+	return anyMarked;
+}
+
+
+/**
+ * \brief Minimize by pair marking.
+ *
+ * Works out for every pair of states whether the two are distinct. Uses
+ * O(n^2) memory and should only be used on small graphs. Produces the most
+ * minimal FSM possible.
+ */
+void FsmGraph::minimizeStable()
+{
+	/* Assign state numbers; the pair marks are looked up by state number. */
+	setStateNumbers( 0 );
+
+	/* Records which pairs have been found distinct so far. */
+	MarkIndex markIndex( stateList.length() );
+
+	/* Seed with pairs whose final stateness, out trans or trans data differ. */
+	initialMarkRound( markIndex );
+
+	/* Run marking rounds until one completes without marking anything. */
+	bool marked;
+	do {
+		marked = markRound( markIndex );
+	} while ( marked );
+
+	/* Whatever is still unmarked is treated as equivalent; merge those pairs. */
+	fuseUnmarkedPairs( markIndex );
+}
+
+/* One round of approximate minimization: sorts the states and fuses adjacent
+ * duplicates. Returns true if at least one state was fused away. */
+bool FsmGraph::minimizeRound()
+{
+	/* Snapshot the state count. Fusing detaches states from stateList, so
+	 * re-reading the length while walking would end the walk early and leave
+	 * the tail of the sorted array unexamined. */
+	const int numStates = stateList.length();
+	if ( numStates == 0 )
+		return false;
+
+	/* Need a mergesort on approx compare and an approx compare. */
+	MergeSort<FsmState*, ApproxCompare> mergeSort;
+	ApproxCompare approxCompare;
+
+	/* Fill up an array of pointers to the states. */
+	FsmState **statePtrs = new FsmState*[numStates];
+	StateList::Iter state = stateList;
+	for ( int s = 0; state.lte(); state++, s++ )
+		statePtrs[s] = state;
+
+	/* Sort the array so that duplicates end up next to each other. */
+	mergeSort.sort( statePtrs, numStates );
+
+	/* Walk the array. pLast is the surviving state of the current run and
+	 * pState is the candidate being tested against it. */
+	bool modified = false;
+	FsmState **pLast = statePtrs;
+	FsmState **pState = statePtrs + 1;
+	for ( int i = 1; i < numStates; i++, pState++ ) {
+		if ( approxCompare.compare( *pLast, *pState ) == 0 ) {
+			/* Duplicate: fuse into pLast, which stays put for later duplicates. */
+			fuseEquivStates( *pLast, *pState );
+			modified = true;
+		}
+		else {
+			/* Different: the current state starts a new run. */
+			pLast = pState;
+		}
+	}
+	delete[] statePtrs;
+	return modified;
+}
+
+/**
+ * \brief Minimize by an approximation.
+ *
+ * Keeps looking for states that have transitions out to the same set of
+ * states on the same set of keys and merges them, until none can be found.
+ * Does not produce the most minimal FSM possible.
+ */
+void FsmGraph::minimizeApproximate()
+{
+	/* Every round reports whether it compacted any states. Another round is
+	 * run for as long as the previous one made progress, and the loop ends
+	 * with the first round that changes nothing. */
+	bool progress;
+	do {
+		progress = minimizeRound();
+	} while ( progress );
+}
+
+
+/* Deletes every state that cannot be reached from the start state or from one
+ * of the entry points. Reachable states are marked first, then the state list
+ * is swept: unmarked states are removed and marks are cleared again. */
+void FsmGraph::removeUnreachableStates()
+{
+	/* Only valid with misfit accounting switched off and an empty misfit
+	 * list. */
+	assert( !misfitAccounting && misfitList.length() == 0 );
+
+	/* Marking pass, seeded from the start state and each entry point. */
+	markReachableFromHere( startState );
+	for ( EntryMap::Iter en = entryPoints; en.lte(); en++ )
+		markReachableFromHere( en->value );
+
+	/* Sweep pass. The successor is read before the current state can be
+	 * deleted. */
+	FsmState *following = 0;
+	for ( FsmState *cur = stateList.head; cur != 0; cur = following ) {
+		following = cur->next;
+
+		if ( (cur->stateBits & SB_ISMARKED) == 0 ) {
+			/* Never reached: unhook it from the graph and free it. */
+			detachState( cur );
+			stateList.detach( cur );
+			delete cur;
+		}
+		else {
+			/* Reached: keep the state, but clear the mark again. */
+			cur->stateBits &= ~ SB_ISMARKED;
+		}
+	}
+}
+
+/* Reports whether the out transitions of state cover the entire key range
+ * from keyOps->minKey to keyOps->maxKey. Returns false as soon as a part of
+ * the range is found to have no transition. */
+bool FsmGraph::outListCovers( FsmState *state )
+{
+	/* Without any transitions nothing is covered. */
+	if ( state->outList.length() == 0 )
+		return false;
+
+	/* Reject if the first range begins above the lower bound. */
+	TransList::Iter trans = state->outList.first();
+	if ( keyOps->minKey < trans->lowKey )
+		return false;
+
+	/* From the second range on, the key just below the low end of each
+	 * range must not lie beyond the high end of the range before it.
+	 * Otherwise there is a gap between the two. */
+	for ( trans.increment(); trans.lte(); trans++ ) {
+		Key belowLow = trans->lowKey;
+		belowLow.decrement();
+		if ( trans->prev->highKey < belowLow )
+			return false;
+	}
+
+	/* Reject if the last range ends short of the upper bound. */
+	trans = state->outList.last();
+	if ( trans->highKey < keyOps->maxKey )
+		return false;
+
+	return true;
+}
+
+/* Deletes every state from which no final state can be reached. The graph is
+ * traversed in reverse, starting at each final state, and the states seen on
+ * the way are marked. States left unmarked afterwards are removed. */
+void FsmGraph::removeDeadEndStates()
+{
+	/* Only valid with misfit accounting switched off and an empty misfit
+	 * list. */
+	assert( !misfitAccounting && misfitList.length() == 0 );
+
+	/* Marking pass: walk backwards from every final state. */
+	FsmState **finals = finStateSet.data;
+	const int numFinals = finStateSet.length();
+	for ( int i = 0; i < numFinals; i++ )
+		markReachableFromHereReverse( finals[i] );
+
+	/* The start state is always kept, even when the machine accepts
+	 * nothing. It is marked only after the traversal has finished: marking
+	 * it earlier would make the traversal treat it as already visited and
+	 * skip the transitions that lead into it. */
+	startState->stateBits |= SB_ISMARKED;
+
+	/* Sweep pass. The successor is read before the current state can be
+	 * deleted. */
+	FsmState *following = 0;
+	for ( FsmState *cur = stateList.head; cur != 0; cur = following ) {
+		following = cur->next;
+
+		if ( (cur->stateBits & SB_ISMARKED) == 0 ) {
+			/* No path to a final state: unhook it from the graph and free it. */
+			detachState( cur );
+			stateList.detach( cur );
+			delete cur;
+		}
+		else {
+			/* Kept: clear the mark again. */
+			cur->stateBits &= ~ SB_ISMARKED;
+		}
+	}
+}
+
+/* Empties the misfit list, deleting every state on it. Misfit accounting
+ * should be on when this is called: detaching one state will likely put
+ * further misfits on the list, and those are then removed as well. */
+void FsmGraph::removeMisfits()
+{
+	/* The list may grow while we work, so its length is tested on every
+	 * pass instead of walking it once. */
+	while ( misfitList.length() > 0 ) {
+		FsmState *misfit = misfitList.head;
+
+		/* Cut the state out of the graph. */
+		detachState( misfit );
+
+		/* Detaching can only remove in transitions, so a state that was on
+		 * the misfit list before is still on it now. Unlink and free it. */
+		misfitList.detach( misfit );
+		delete misfit;
+	}
+}
+
+/* Merges src into dest, the two having been judged equivalent. The
+ * transitions that lead into src are redirected into dest, after which src
+ * is detached from the graph, taken off the state list and deleted. */
+void FsmGraph::fuseEquivStates( FsmState *dest, FsmState *src )
+{
+	/* Fusing a state into itself would delete the survivor. */
+	assert( src != dest );
+
+	/* Hand the in transitions of src over to dest. */
+	inTransMove( dest, src );
+	/* With its in transitions moved, remove src itself and free it. */
+	detachState( src );
+	stateList.detach( src );
+	delete src;
+}
+
+void FsmGraph::fuseUnmarkedPairs( MarkIndex &markIndex )
+{
+	FsmState *p = stateList.head, *nextP, *q;
+
+	/* Definition: The primary state of an equivalence class is the first state
+	 * encountered that belongs to the equivalence class. All equivalence
+	 * classes have a primary state, including equivalence classes with one
+	 * state in them. */
+
+	/* For each unmarked pair merge p into q and delete p. q is always the
+	 * primary state of its equivalence class. We wouldn't have landed on it
+	 * here if it were not, because it would have been deleted.
+	 *
+	 * Proof that q is the primary state of its equivalence class: Assume q
+	 * is not the primary state of its equivalence class, then it would be
+	 * merged into some state that came before it and thus p would be
+	 * equivalent to that state. But q is the first state that p is equivalent
+	 * to so we have a contradiction. */
+
+	/* Walk all unordered pairs of (p, q) where p != q.
+	 * The second depth of the walk stops before reaching p. This
+	 * gives us all unordered pairs of states (p, q) where p != q. */
+	while ( p != 0 ) {
+		nextP = p->next;
+
+		q = stateList.head;
+		while ( q != p ) {
+			/* An unmarked pair is equivalent: fuse p into q (p is deleted) and stop. */
+			if ( ! markIndex.isPairMarked( p->alg.stateNum, q->alg.stateNum ) ) {
+				fuseEquivStates( q, p );
+				break;
+			}
+			q = q->next;
+		}
+		p = nextP;
+	}
+}
+
+void FsmGraph::fusePartitions( MinPartition *parts, int numParts )
+{
+	/* For each partition, fuse state 2, 3, ... into state 1. */
+	for ( int p = 0; p < numParts; p++ ) {
+		/* Assumes at least one state per partition: first is dereferenced unchecked. */
+		FsmState *first = parts[p].list.head, *toFuse = first->next;
+
+		/* Put the first state back onto the main state list. Don't bother
+		 * removing it from the partition list first. */
+		stateList.append( first );
+
+		/* Fuse the rest of the states into the first. */
+		while ( toFuse != 0 ) {
+			/* Save the next. We will trash it before it is needed. */
+			FsmState *next = toFuse->next;
+
+			/* Put the state that is about to be fused into the first back
+			 * onto the main list before it is fused. The state needs to be on
+			 * the main list for the detach from the graph to work. Don't
+			 * bother removing the state from the partition list first. We
+			 * need not maintain it. */
+			stateList.append( toFuse );
+
+			/* Now fuse to the first. This deletes toFuse. */
+			fuseEquivStates( first, toFuse );
+
+			/* Go to the next that we saved before trashing the next pointer. */
+			toFuse = next;
+		}
+
+		/* We transferred the states from the partition list into the main list
+		 * without removing them from the partition list first. Clean it up. */
+		parts[p].list.abandon();
+	}
+}
+
+
+/* Merge neighboring transitions that go to the same state and have the same
+ * transition data (action table) into one transition spanning both ranges. */
+void FsmGraph::compressTransitions()
+{
+	for ( StateList::Iter st = stateList; st.lte(); st++ ) {
+		if ( st->outList.length() > 1 ) {
+			for ( TransList::Iter trans = st->outList, next = trans.next(); next.lte();  ) {
+				Key nextLow = next->lowKey;
+				nextLow.decrement();
+				if ( trans->highKey == nextLow && trans->toState == next->toState &&
+					CmpActionTable::compare( trans->actionTable, next->actionTable ) == 0 )
+				{
+					trans->highKey = next->highKey;	/* absorb next's key range */
+					st->outList.detach( next );
+					detachTrans( next->fromState, next->toState, next );
+					delete next;
+					next = trans.next();	/* trans stays, so a chain of ranges can merge */
+				}
+				else {
+					trans.increment();
+					next.increment();
+				}
+			}
+		}
+	}
+}
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
new file mode 100644
index 00000000..9edb584b
--- /dev/null
+++ b/colm/fsmrun.cpp
@@ -0,0 +1,890 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <string.h>
+#include <iostream>
+#include <stdlib.h>
+
+#include "config.h"
+#include "fsmrun.h"
+#include "redfsm.h"
+#include "parsedata.h"
+#include "parsetree.h"
+#include "pdarun.h"
+#include "colm.h"
+
+using std::cerr;
+using std::endl;
+
+exit_object endp;
+
+void operator<<( ostream &out, exit_object & )	/* streaming the exit object ends the program */
+{
+	out << endl;	/* finish the line that is being written */
+	exit(1);	/* does not return: the process ends with status 1 */
+}
+
+/* Binds the run to its tables. parser and position start out as zero; no
+ * other member is set here. */
+FsmRun::FsmRun( FsmTables *tables )
+	: tables(tables), parser(0), position(0)
+{
+}
+
+FsmRun::~FsmRun()
+{
+	/* Currently a no-op. The loop that would free the run buffer chain is
+	 * disabled and kept here for reference:
+	 *     for ( RunBuf *rb = runBuf; rb != 0; ) {
+	 *         RunBuf *next = rb->next; delete rb; rb = next;
+	 *     }
+	 * NOTE(review): confirm the buffers are released somewhere else. */
+}
+
+void FsmRun::undoStreamPush( long length )
+{
+	long remainder = pe - p;	/* number of bytes between p and pe */
+	memmove( runBuf->buf, runBuf->buf + length, remainder );	/* NOTE(review): copies pe-p bytes from buf+length to buf; p is not adjusted - confirm intent */
+	pe -= length;	/* the data now ends length bytes earlier */
+}
+
+void FsmRun::streamPush( const char *data, long length )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "readying fake push" << endl;
+	#endif
+	/* Only p strictly inside the buffer is handled. NOTE(review): the "case N" output is not behind COLM_LOG_PARSE. */
+	if ( p == runBuf->buf ) {
+		cerr << "case 1" << endl;
+		assert(false);
+	}
+	else if ( p == (runBuf->buf + runBuf->length) ) {
+		cerr << "case 2" << endl;
+		assert(false);
+	}
+	else {
+		cerr << "case 3" << endl;
+
+		/* Duplicate the run buffer so the part from p onwards can be sent back. */
+		RunBuf *dup = new RunBuf;
+		memcpy( dup, runBuf, sizeof(RunBuf) );
+
+		/* Describe the span held by the copy: it starts at p and ends at pe. */
+		dup->length = pe - runBuf->buf;
+		dup->offset = p - runBuf->buf;
+
+		/* Send it back. */
+		inputStream->pushBack( dup );
+
+		/* Since the second half is gone the current buffer now ends at p. */
+		pe = p;
+		runBuf->length = p - runBuf->buf;
+
+		/* Create a new buffer for the data. This is the easy implementation.
+		 * Something better is needed here. It puts a max on the amount of
+		 * data that can be pushed back to the stream (asserted below). */
+		assert( length < FSM_BUFSIZE );
+		RunBuf *newBuf = new RunBuf;
+		newBuf->next = runBuf;
+		newBuf->offset = 0;
+		newBuf->length = length;
+		memcpy( newBuf->buf, data, length );
+		/* Point p and pe at the pushed data and make the new buffer current. */
+		p = newBuf->buf;
+		pe = newBuf->buf + newBuf->length;
+		runBuf = newBuf;
+	}
+}
+
+/* Should only be sending back whole tokens/ignores, therefore the send back
+ * should never cross a buffer boundary. Either we slide back p, or we move to
+ * a previous buffer and slide back p. data must match the bytes backed over. */
+void FsmRun::sendBackText( const char *data, long length )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "push back of " << length << " characters" << endl;
+	#endif
+
+	if ( length == 0 )
+		return;
+
+	if ( p == runBuf->buf ) {
+		#ifdef COLM_LOG_PARSE
+		cerr << "pushing back runbuf" << endl;
+		#endif
+
+		/* p is at the very start: step to the buffer linked through next. */
+		RunBuf *back = runBuf;
+		runBuf = runBuf->next;
+		
+		/* Return the buffer we just left, with pe-p as its length, to the input. */
+		back->length = pe-p;
+		back->offset = 0;
+		inputStream->pushBack( back );
+
+		/* Set p and pe to the end of the data in the buffer we moved to. */
+		assert( runBuf != 0 );
+		p = pe = runBuf->buf + runBuf->length;
+	}
+
+	/* If there is data in the current buffer then the whole send back
+	 * should be in this buffer. */
+	assert( (p - runBuf->buf) >= length );
+
+	/* Slide p back. */
+	p -= length;
+
+	#ifdef COLM_LOG_PARSE
+	if ( memcmp( data, p, length ) != 0 )
+		cerr << "mismatch of pushed back text" << endl;
+	#endif
+
+	assert( memcmp( data, p, length ) == 0 );
+		
+	position -= length;
+
+	/* We are adjusting p so this must be reset. */
+	tokstart = 0;
+}
+
+void FsmRun::queueBack( Kid *input )
+{
+	Alg *alg = input->tree->alg;
+	/* Items flagged AF_GROUP_MEM are queued; any other item flushes the queue first. */
+	if ( alg->flags & AF_GROUP_MEM ) {
+		#ifdef COLM_LOG_PARSE
+		LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+		cerr << "queuing back: " << lelInfo[input->tree->id].name << endl;
+		#endif
+		/* Append to the tail of the parser's queue. */
+		if ( parser->queue == 0 )
+			parser->queue = parser->queueLast = input;
+		else {
+			parser->queueLast->next = input;
+			parser->queueLast = input;
+		}
+	}
+	else {
+		/* If there are queued items send them back starting at the tail
+		 * (newest). */
+		if ( parser->queue != 0 ) {
+			/* Reverse the list in place; last ends up at the newest item. */
+			Kid *kid = parser->queue, *last = 0;
+			while ( kid != 0 ) {
+				Kid *next = kid->next;
+				kid->next = last;
+				last = kid;
+				kid = next;
+			}
+
+			/* Send them back. next is read first because sendBack frees the kid. */
+			while ( last != 0 ) {
+				Kid *next = last->next;
+				sendBack( last );
+				last = next;
+			}
+
+			parser->queue = 0;
+		}
+
+		/* Now that the queue is flushed, can send back the original item. */
+		sendBack( input );
+	}
+}
+
+void FsmRun::sendBackIgnore( Kid *ignore )
+{
+	/* Ignore tokens are queued in reverse order. Walk the list while it holds ignores. */
+	while ( tree_is_ignore( parser->prg, ignore ) ) {
+		#ifdef COLM_LOG_PARSE
+		LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+		cerr << "sending back: " << lelInfo[ignore->tree->id].name;
+		if ( ignore->tree->alg != 0 && ignore->tree->alg->flags & AF_ARTIFICIAL )
+			cerr << " (artificial)";
+		cerr << endl;
+		#endif
+
+		Head *head = ignore->tree->tokdata;
+		bool artificial = ignore->tree->alg != 0 && 
+				ignore->tree->alg->flags & AF_ARTIFICIAL;
+		/* Text goes back only if there is token data and the item is not artificial. */
+		if ( head != 0 && !artificial )
+			sendBackText( string_data( head ), head->length );
+
+		/* Check for reverse code. */
+		Alg *alg = ignore->tree->alg;
+		if ( alg != 0 && alg->flags & AF_HAS_RCODE ) {
+			Execution execution( parser->prg, parser->reverseCode, 
+					parser, 0, 0, 0 );
+
+			/* Do the reverse execution, then clear the flag on this item. */
+			execution.rexecute( parser->root, 0, parser->allReverseCode );
+			alg->flags &= ~AF_HAS_RCODE;
+		}
+
+		ignore = ignore->next;
+	}
+}
+
+void FsmRun::sendBack( Kid *input )
+{
+	#ifdef COLM_LOG_PARSE
+	LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+	cerr << "sending back: " << lelInfo[input->tree->id].name;
+	if ( input->tree->alg->flags & AF_ARTIFICIAL )
+		cerr << " (artificial)";
+	cerr << endl;
+	#endif
+	/* Undoes the sending of input; the kid is freed at the end of this function. */
+	Alg *alg = input->tree->alg;
+	if ( alg->flags & AF_NAMED ) {
+		/* Send back anything that is in the buffer. */
+		inputStream->pushBack( p, pe-p );
+		p = pe = runBuf->buf;
+
+		/* Send the named lang el back first, then send back any leading
+		 * whitespace. */
+		inputStream->pushBackNamed();
+	}
+
+	if ( !(alg->flags & AF_ARTIFICIAL) ) {
+		/* Push back the token data. */
+		sendBackText( string_data( input->tree->tokdata ), 
+				string_length( input->tree->tokdata ) );
+	}
+
+	/* Check for reverse code. */
+	if ( alg->flags & AF_HAS_RCODE ) {
+		Execution execution( parser->prg, parser->reverseCode, 
+				parser, 0, 0, 0 );
+
+		/* Do the reverse execution, then clear the flag on this item. */
+		execution.rexecute( parser->root, 0, parser->allReverseCode );
+		alg->flags &= ~AF_HAS_RCODE;
+	}
+
+	/* Always push back the ignore text. */
+	sendBackIgnore( tree_ignore( parser->prg, input->tree ) );
+
+	/* If eof was just sent back remember that it needs to be sent again. */
+	if ( input->tree->id == parser->tables->gbl->eofId )
+		eofSent = false;
+
+	/* If the item is the most recent binding, pop it and drop that reference. */
+	Tree *lastBound = parser->bindings.top();
+	if ( lastBound == input->tree ) {
+		parser->bindings.pop();
+		tree_downref( parser->prg, input->tree );
+	}
+
+	/* Downref the tree that was sent back and free the kid. */
+	tree_downref( parser->prg, input->tree );
+	parser->prg->kidPool.free( input );
+}
+
+/* Build an EOF token and send it to the parser. When context-dependent
+ * parsing is enabled and the current region has a pre-eof frame, that
+ * frame's code is executed first and anything it queued is sent ahead of
+ * the EOF token. Afterwards the scanner is reset to the next region. */
+void FsmRun::sendEOF( )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "token: _EOF" << endl;
+	#endif
+
+	/* The EOF token is a fresh tree carrying only a reference count and the
+	 * eof id. */
+	Kid *input = parser->prg->kidPool.allocate();
+	Tree *eofTree = parser->prg->treePool.allocate();
+	eofTree->alg = parser->prg->algPool.allocate();
+	eofTree->refs = 1;
+	eofTree->id = parser->tables->gbl->eofId;
+	input->tree = eofTree;
+
+	long eofFrame = parser->tables->gbl->regionInfo[region].eofFrameId;
+	bool runPreEof = parser->prg->ctxDepParsing && eofFrame >= 0;
+	if ( runPreEof ) {
+		#ifdef COLM_LOG_PARSE
+		cerr << "HAVE PRE_EOF BLOCK" << endl;
+		#endif
+
+		/* Run the pre-eof code for this region. */
+		Code *preEofCode = parser->tables->gbl->frameInfo[eofFrame].code;
+		Execution execution( parser->prg, parser->reverseCode, 
+				parser, preEofCode, 0, 0 );
+		execution.execute( parser->root );
+
+		/* Flag the queued items as a group and flush them. */
+		set_AF_GROUP_MEM();
+		sendQueuedTokens();
+	}
+
+	parser->send( input );
+
+	if ( parser->errCount > 0 ) {
+		parser->parse_error( parser->tables->gbl->eofId, input->tree ) << 
+				"parse error" << endp;
+	}
+
+	/* Get ready to scan from the next region. */
+	region = parser->getNextRegion();
+	cs = tables->entryByRegion[region];
+	tokstart = 0;
+}
+
+/* Drain the parser's queue from the front. Items flagged AF_IGNORE are
+ * handed to the parser's ignore list (and their kid freed); everything else
+ * is sent as a regular language element. */
+void FsmRun::sendQueuedTokens()
+{
+	Kid *item;
+	while ( (item = parser->queue) != 0 ) {
+		/* Unlink the head item. Its next pointer must be cleared because
+		 * the parsing algorithm uses it. */
+		parser->queue = item->next;
+		item->next = 0;
+
+		if ( !(item->tree->alg->flags & AF_IGNORE) ) {
+			#ifdef COLM_LOG_PARSE
+			cerr << "sending queue item: " << 
+					parser->tables->gbl->lelInfo[item->tree->id].name << endl;
+			#endif
+			sendLangEl( item );
+			continue;
+		}
+
+		#ifdef COLM_LOG_PARSE
+		cerr << "ignoring queued item: " << 
+				parser->tables->gbl->lelInfo[item->tree->id].name << endl;
+		#endif
+
+		/* The parser keeps the tree, only the kid wrapper is released. */
+		parser->ignore( item->tree );
+		parser->prg->kidPool.free( item );
+	}
+}
+
+/* Send the text between tokstart and p as a token with the given id. If
+ * context-dependent parsing is on and the token has a translation frame,
+ * the token is translated and the resulting queue is flushed; otherwise a
+ * plain token is made and sent. The leave marks are cleared afterwards. */
+void FsmRun::sendToken( long id )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "token: " << parser->tables->gbl->lelInfo[id].name << endl;
+	#endif
+
+	LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+	bool ctxDepParsing = parser->prg->ctxDepParsing;
+
+	/* Take a string over the matched text. */
+	long matchLen = p - tokstart;
+	Head *tokdata = string_alloc_const( parser->prg, tokstart, matchLen );
+
+	if ( !ctxDepParsing || lelInfo[id].frameId < 0 ) {
+		/* No translation: nothing may be left on the queue. */
+		makeToken( id, tokdata, false, 0 );
+		assert( parser->queue == 0 );
+	}
+	else {
+		translateLangEl( id, tokdata, false, 0 );
+		sendQueuedTokens();
+	}
+
+	memset( mark_leave, 0, sizeof(mark_leave) );
+}
+
+/* Fetch a named language element from the input stream and send it as a
+ * token. If the element has a terminal duplicate, that is used in its place. */
+void FsmRun::sendNamedLangEl()
+{
+	/* Outputs of getLangEl. */
+	long bindId, length;
+	char *data;
+
+	KlangEl *langEl = inputStream->getLangEl( bindId, data, length );
+	if ( langEl->termDup != 0 )
+		langEl = langEl->termDup;
+	
+	#ifdef COLM_LOG_PARSE
+	cerr << "named langEl: " << parser->tables->gbl->lelInfo[langEl->id].name << endl;
+	#endif
+
+	/* Copy the token data, if there is any. */
+	Head *tokdata = data != 0 ? 
+			string_alloc_new( parser->prg, data, length ) : 0;
+
+	makeToken( langEl->id, tokdata, true, bindId );
+}
+
+/* Walk the parser's queue and set AF_GROUP_MEM on every non-ignore item
+ * except the first non-ignore item. */
+void FsmRun::set_AF_GROUP_MEM()
+{
+	bool seenFirst = false;
+	for ( Kid *item = parser->queue; item != 0; item = item->next ) {
+		Alg *alg = item->tree->alg;
+
+		/* Ignore items do not count towards the group. */
+		if ( alg->flags & AF_IGNORE )
+			continue;
+
+		if ( seenFirst )
+			alg->flags |= AF_GROUP_MEM;
+		seenFirst = true;
+	}
+}
+
+/* 
+ * Implemented:
+ *  -shorten the match (possibly to zero length)
+ *  -change the token to a new identifier 
+ *  -change global state (it can, but it isn't reverted during backtracking).
+ *
+ * Not implemented:
+ *  -invoke failure (and hence the backtracker)
+ */
+
+/* Run the translation code attached to language element id. The scan
+ * pointer is first moved back to the start of the token, then the code is
+ * executed with tokdata as its input. tokdata is freed afterwards and the
+ * items the code queued are marked as a group. namedLangEl and bindId are
+ * not used here. */
+void FsmRun::translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindId )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "translating: " << 
+			parser->tables->gbl->lelInfo[id].name << endl;
+	#endif
+
+	/* Look up the code block through the element's frame. */
+	long frameId = parser->tables->gbl->lelInfo[id].frameId;
+	Code *translation = parser->tables->gbl->frameInfo[frameId].code;
+	
+	/* Rewind to the beginning of the match. */
+	p = tokstart;
+
+	Execution execution( parser->prg, parser->reverseCode, 
+			parser, translation, 0, tokdata );
+	execution.execute( parser->root );
+
+	string_free( parser->prg, tokdata );
+
+	set_AF_GROUP_MEM();
+}
+
+/* Construct a token tree for language element id and send it. The tree
+ * owns tokdata, gets an attribute list sized from the element's object
+ * length, and receives one string attribute for every mark whose leave
+ * pointer is set. A positive bindId also records the tree in the parser's
+ * bindings (with its own reference). */
+void FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
+{
+	/* Attribute storage for the token object. */
+	long objectLength = parser->tables->gbl->lelInfo[id].objectLength;
+	Kid *attrs = alloc_attrs( parser->prg, objectLength );
+
+	Kid *input = parser->prg->kidPool.allocate();
+	Tree *tree = parser->prg->treePool.allocate();
+	tree->alg = parser->prg->algPool.allocate();
+	input->tree = tree;
+
+	if ( namedLangEl )
+		tree->alg->flags |= AF_NAMED;
+
+	tree->refs = 1;
+	tree->id = id;
+	tree->tokdata = tokdata;
+
+	/* Only attributes for now; children and ignores get added later. */
+	tree->child = attrs;
+
+	/* Turn each marked span into a string attribute. */
+	const int numMarks = sizeof(mark_leave) / sizeof(mark_leave[0]);
+	for ( int m = 0; m < numMarks; m++ ) {
+		if ( mark_leave[m] == 0 )
+			continue;
+
+		Head *span = string_alloc_new( parser->prg, 
+				mark_enter[m], mark_leave[m] - mark_enter[m] );
+		set_attr( input->tree, m, construct_string( parser->prg, span ) );
+		tree_upref( get_attr( input->tree, m ) );
+	}
+	
+	/* Bound items are also stored in the bindings array. */
+	if ( bindId > 0 ) {
+		parser->bindings.push( input->tree );
+		tree_upref( input->tree );
+	}
+
+	sendLangEl( input );
+}
+
+/* Take the accumulated ignore tokens, hand them back to the scanner, then
+ * release each tree reference and free each kid in the list. */
+void PdaRun::sendBackIgnore()
+{
+	Kid *list = extractIgnore();
+	fsmRun->sendBackIgnore( list );
+
+	for ( Kid *cur = list, *following; cur != 0; cur = following ) {
+		/* Grab the link before the kid is freed. */
+		following = cur->next;
+		tree_downref( prg, cur->tree );
+		prg->kidPool.free( cur );
+	}
+}
+
+/* Detach and return the accumulated ignore list, leaving the accumulator
+ * empty. */
+Kid *PdaRun::extractIgnore()
+{
+	Kid *detached = accumIgnore;
+	accumIgnore = 0;
+	return detached;
+}
+
+/* Send one token to the parser. The scanner position is advanced by the
+ * token length, the accumulated ignore tokens are spliced in front of the
+ * token's children, pending reverse code is attached to the token, and the
+ * token is then parsed. */
+void PdaRun::send( Kid *input )
+{
+	/* Setting input->tree->pos from fsmRun->position is disabled upstream. */
+	fsmRun->position += string_length( input->tree->tokdata );
+
+	/* Pull the ignore tokens out and store them in the token, ahead of the
+	 * existing children. */
+	Kid *ignoreHead = extractIgnore();
+	if ( ignoreHead != 0 ) {
+		Kid *ignoreTail = ignoreHead;
+		while ( ignoreTail->next != 0 )
+			ignoreTail = ignoreTail->next;
+
+		ignoreTail->next = input->tree->child;
+		input->tree->child = ignoreHead;
+	}
+		
+	/* Pull the reverse code out and flag the token if there was any. */
+	if ( makeReverseCode( allReverseCode, reverseCode ) )
+		input->tree->alg->flags |= AF_HAS_RCODE;
+
+	parseToken( input );
+}
+
+/* Send a language element to the parser and prepare the scanner for the
+ * next token: on success move to the next region's entry state (or to the
+ * error state if the parser reports it is finished), on failure report a
+ * parse error. */
+void FsmRun::sendLangEl( Kid *input )
+{
+	/* Remember the id for error reporting. */
+	long id = input->tree->id;
+
+	parser->send( input );
+		
+	if ( parser->errCount <= 0 ) {
+		/* Set the current state from the next region. */
+		region = parser->getNextRegion();
+		cs = tables->entryByRegion[region];
+
+		if ( parser->isParserStopFinished() ) {
+			#ifdef COLM_LOG_PARSE
+			cerr << "stopping the parse" << endl;
+			#endif
+			parser->stopParsing = true;
+			cs = tables->errorState;
+		}
+	}
+	else {
+		/* Error occurred in the top-level parser. */
+		parser->parse_error(id, input->tree) << "parse error" << endp;
+	}
+
+	/* No token is in progress any more. */
+	tokstart = 0;
+
+	#ifdef COLM_LOG_PARSE
+	cerr << "new token region: " << 
+			parser->tables->gbl->regionInfo[region].name << endl;
+	#endif
+}
+
+/* Record an ignore tree: wrap it in a kid, attach any pending reverse code
+ * to it (allocating its alg on demand), and push it on the front of the
+ * accumulated ignore list. */
+void PdaRun::ignore( Tree *tree )
+{
+	Kid *wrapper = prg->kidPool.allocate();
+	wrapper->tree = tree;
+
+	/* Pull the reverse code out and flag the tree if there was any. */
+	if ( makeReverseCode( allReverseCode, reverseCode ) ) {
+		if ( tree->alg == 0 )
+			tree->alg = prg->algPool.allocate();
+		tree->alg->flags |= AF_HAS_RCODE;
+	}
+
+	/* Prepend to the list of ignore tokens. */
+	wrapper->next = accumIgnore;
+	accumIgnore = wrapper;
+}
+
+/* Turn the text between tokstart and p into an ignore tree with the given
+ * id, pass it to the parser, then reset the scanner for the next region. */
+void FsmRun::sendIgnore( long id )
+{
+	int matched = p - tokstart;
+
+	#ifdef COLM_LOG_PARSE
+	cerr << "ignoring: " << parser->tables->gbl->lelInfo[id].name << endl;
+	#endif
+
+	/* String over the ignored text. */
+	Head *text = string_alloc_const( parser->prg, tokstart, matched );
+	
+	/* The tree gets no alg here; the parser allocates one if needed. */
+	Tree *ignTree = parser->prg->treePool.allocate();
+	ignTree->tokdata = text;
+	ignTree->id = id;
+	ignTree->refs = 1;
+
+	parser->ignore( ignTree );
+
+	/* Prepare for more scanning. */
+	position += matched;
+	tokstart = 0;
+	region = parser->getNextRegion();
+	cs = tables->entryByRegion[region];
+
+	memset( mark_leave, 0, sizeof(mark_leave) );
+}
+
+/* Dispatch a matched token: ignore tokens go to sendIgnore, all others to
+ * sendToken. */
+void FsmRun::emitToken( KlangEl *token )
+{
+	if ( !token->ignore ) {
+		sendToken( token->id );
+		return;
+	}
+
+	sendIgnore( token->id );
+}
+
+/* Load up a token of the requested length, starting from tokstart if it is
+ * set. If not set then start it at p. If the buffer does not hold enough
+ * data past tokstart, more is read from the input stream first. Returns a
+ * string over the token text, leaves p just past the token and clears
+ * tokstart. */
+Head *FsmRun::extractToken( long length )
+{
+	/* How much do we have already? Tokstart may or may not be set. */
+	long have = 0;
+	if ( tokstart != 0 )
+		have = p - tokstart;
+	else
+		tokstart = p;
+
+	/* Is the requested length available between tokstart and pe? */
+	if ( tokstart + length > pe ) {
+		/* There is not enough data in the buffer to generate the token.
+		 * Shift data over and fill the buffer. */
+		if ( have > 0 ) {
+			/* There is data that needs to be shifted over. */
+			memmove( runBuf->buf, tokstart, have );
+			tokend -= (tokstart - runBuf->buf);
+			tokstart = runBuf->buf;
+		}
+		/* NOTE(review): when have == 0, tokstart keeps its old value while
+		 * p and pe are reset to the start of the buffer. Also only the
+		 * `have` bytes before p are preserved; bytes between the old p and
+		 * pe are not copied. Confirm both are intended. */
+		p = pe = runBuf->buf + have;
+		peof = 0;
+
+		long space = runBuf->buf + FSM_BUFSIZE - pe;
+			
+		if ( space == 0 )
+			cerr << "OUT OF BUFFER SPACE" << endp;
+			
+		/* Fill the free part of the buffer from the input stream. */
+		long len = inputStream->getData( p, space );
+		pe = p + len;
+	}
+
+	/* Still short after the refill: report it. */
+	if ( tokstart + length > pe )
+		cerr << "NOT ENOUGH DATA TO FETCH TOKEN" << endp;
+
+	Head *tokdata = string_alloc_const( parser->prg, tokstart, length );
+	p = tokstart + length;
+	tokstart = 0;
+
+	return tokdata;
+}
+
+/* Attach an input stream and start with a fresh, empty run buffer. The
+ * scanner position and EOF state are reset. */
+void FsmRun::attachInputStream( InputStream *in )
+{
+	/* Run buffers need to stick around because token strings point into
+	 * them, so a new one is allocated here and becomes the only buffer in
+	 * the chain. */
+	RunBuf *fresh = new RunBuf;
+	fresh->next = 0;
+	runBuf = fresh;
+
+	inputStream = in;
+	position = 0;
+	eofSent = false;
+
+	/* Nothing has been read yet. */
+	peof = 0;
+	p = pe = fresh->buf;
+}
+
+/* Initialize the parser and run the scanner against it. Returns whatever
+ * the scanner's run returns. */
+long PdaRun::run()
+{
+	/* The PDA must be initialized first so the next region is set. */
+	init();
+
+	long result = fsmRun->run( this );
+	return result;
+}
+
+/* Undo a parse: push tree on the parse stack, take over the reverse code
+ * in rev, and invoke the parser with no token. What remains on the stack
+ * afterwards (expected to be a single entry) is freed. Always returns 0. */
+long PdaRun::undoParse( Tree *tree, CodeVect *rev )
+{
+	/* The PDA must be initialized first so the next region is set. */
+	init();
+
+	/* Put the tree on top of the stack. */
+	Kid *pushed = prg->kidPool.allocate();
+	pushed->tree = tree;
+	pushed->next = stackTop;
+	stackTop = pushed;
+
+	numRetry += 1;
+	allReverseCode.transfer( *rev );
+
+	parseToken( 0 );
+
+	assert( stackTop->next == 0 );
+
+	/* Release the remaining stack entry: alg, then tree, then kid. */
+	Kid *last = stackTop;
+	prg->algPool.free( last->tree->alg );
+	prg->treePool.free( last->tree );
+	prg->kidPool.free( last );
+	return 0;
+}
+
+/* Main scanner loop. Scans input on behalf of destParser until EOF has been
+ * sent (and not sent back) or the parser asks to stop. Each iteration
+ * handles EOF, refills the buffer or sends a named lang el when the buffer
+ * is empty, executes the state machine, deals with scanner errors (default
+ * token, next region, parser error handling) and finally switches to a new
+ * run buffer when the current one is full. The previous parser and state
+ * are restored when leaving through the `done` label. Always returns 0. */
+long FsmRun::run( PdaRun *destParser )
+{
+	long space, prevState = cs;
+
+	/* Remember the parser that was attached so it can be restored. */
+	PdaRun *prevParser = parser;
+	parser = destParser;
+
+	act = 0;
+	tokstart = 0;
+	tokend = 0;
+	region = parser->getNextRegion();
+	cs = tables->entryByRegion[region];
+	memset( mark_leave, 0, sizeof(mark_leave) );
+
+	/* Start with the EOF test. The pattern and replacement input sources can
+	 * be EOF from the start. */
+
+	while ( true ) {
+		/* Check for eof. */
+ 		if ( p == pe && inputStream->isEOF() ) {
+			if ( tokstart != 0 ) {
+				/* If a token has been started, but not finished 
+				 * this is an error. */
+				cs = tables->errorState;
+			}
+			else {
+				/* sendEOF may result in the EOF being sent back, which
+				 * clears eofSent; in that case keep scanning. */
+				eofSent = true;
+				sendEOF();
+				if ( !eofSent )
+					continue;
+				break;
+			}
+		}
+
+		if ( p == pe ) {
+			/* We don't have any data. What is next in the input stream? */
+			if ( inputStream->isLangEl() )
+				sendNamedLangEl( );
+			else {
+				space = runBuf->buf + FSM_BUFSIZE - pe;
+			
+				if ( space == 0 )
+					cerr << "OUT OF BUFFER SPACE" << endp;
+			
+				/* Read into the free part of the run buffer. peof is set
+				 * only when the stream says a flush is needed. */
+				int len = inputStream->getData( p, space );
+				pe = p + len;
+				if ( inputStream->needFlush() )
+					peof = pe;
+			}
+		}
+
+		execute();
+
+		/* Fall through here either when the input buffer has been exhausted
+		 * or the scanner is in an error state. Otherwise we must continue. */
+
+		if ( cs == tables->errorState && parser->stopParsing ) {
+			#ifdef COLM_LOG_PARSE
+			cerr << "scanner has been stopped" << endl;
+			#endif
+			goto done;
+		}
+
+		/* First thing check for error. */
+		if ( cs == tables->errorState ) {
+			/* If a token was started, but not finished (tokstart != 0) then
+			 * restore p to the beginning of that token. */
+			if ( tokstart != 0 )
+				p = tokstart;
+
+			/* Check for a default token in the region. If one is there
+			 * then send it and continue with the processing loop. The
+			 * default token is sent with zero length. */
+			if ( parser->tables->gbl->regionInfo[region].defaultToken >= 0 ) {
+				tokstart = tokend = p;
+				sendToken( parser->tables->gbl->regionInfo[region].defaultToken );
+				continue;
+			}
+
+			/* Is there another region to try? */
+			if ( parser->getNextRegion( 1 ) != 0 ) {
+				#ifdef COLM_LOG_PARSE
+				cerr << "scanner failed, trying next region" << endl;
+				#endif
+
+				/* May have accumulated ignore tokens from a previous region.
+				 * need to rescan them since we won't be sending tokens from
+				 * this region. */
+				parser->sendBackIgnore();
+
+				parser->nextRegionInd += 1;
+				region = parser->getNextRegion();
+				cs = tables->entryByRegion[region];
+				#ifdef COLM_LOG_PARSE
+				cerr << "new token region: " << 
+						parser->tables->gbl->regionInfo[region].name << endl;
+				#endif
+				continue;
+			}
+
+			if ( parser->numRetry > 0 ) {
+				/* Invoke the parser's error handling. */
+				#ifdef COLM_LOG_PARSE
+				cerr << "invoking parse error from the scanner" << endl;
+				#endif
+
+				parser->sendBackIgnore();
+				parser->parseToken( 0 );
+
+				if ( parser->errCount > 0 ) {
+					/* Error occurred in the top-level parser. */
+					cerr << "PARSE ERROR" << endp;
+				}
+				else {
+					region = parser->getNextRegion();
+					cs = tables->entryByRegion[region];
+					#ifdef COLM_LOG_PARSE
+					cerr << "new token region: " << 
+							parser->tables->gbl->regionInfo[region].name << endl;
+					#endif
+					continue;
+				}
+			}
+
+			/* Machine failed before finding a token. */
+			cerr << "SCANNER ERROR" << endp;
+		}
+
+		space = runBuf->buf + FSM_BUFSIZE - pe;
+		if ( space == 0 ) {
+			/* Create a new run buf and put it at the head of the chain. The
+			 * old buffer is kept, linked through next. */
+			RunBuf *buf = new RunBuf;
+			buf->next = runBuf;
+			runBuf = buf;
+
+			/* If partway through a token then preserve the prefix. */
+			long have = 0;
+
+			if ( tokstart == 0 ) {
+				/* No prefix, the previous buffer was filled. */
+				runBuf->next->length = FSM_BUFSIZE;
+			}
+			else {
+				/* There is data that needs to be shifted over. */
+				have = pe - tokstart;
+				memcpy( runBuf->buf, tokstart, have );
+
+				/* Compute the length of the previous buffer. */
+				runBuf->next->length = FSM_BUFSIZE - have;
+
+				/* Compute tokstart and tokend. */
+				tokend = runBuf->buf + (tokend - tokstart);
+				tokstart = runBuf->buf;
+			}
+			p = pe = runBuf->buf + have;
+			peof = 0;
+		}
+	}
+
+done:
+	/* Restore the parser and state that were in place on entry. */
+	parser = prevParser;
+	cs = prevState;
+	return 0;
+}
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
new file mode 100644
index 00000000..43f8cc8c
--- /dev/null
+++ b/colm/fsmrun.h
@@ -0,0 +1,132 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _FSMRUN_H
+#define _FSMRUN_H
+
+#include "astring.h"
+#include "pdarun.h"
+#include "input.h"
+
+#define FSM_BUFSIZE 8192
+//#define FSM_BUFSIZE 8
+
+struct GenAction;
+struct KlangEl;
+struct PdaRun;
+struct ParseData;
+struct Kid;
+struct Pattern;
+struct PatternItem;
+struct Replacement;
+struct ReplItem;
+
+/* Tables describing the scanner state machine, together with their sizes.
+ * FsmRun reads entryByRegion (indexed by region id to obtain the state to
+ * start scanning from) and errorState (the state value treated as scanner
+ * failure). NOTE(review): the remaining arrays look like a table-driven
+ * machine encoding (keys, lengths, offsets, targets, actions) -- confirm
+ * against the code that generates and executes them. */
+struct FsmTables
+{
+	/* Table arrays. */
+	long *actions;
+	long *keyOffsets;
+	char *transKeys;
+	long *singleLengths;
+	long *rangeLengths;
+	long *indexOffsets;
+	long *transTargsWI;
+	long *transActionsWI;
+	long *toStateActions;
+	long *fromStateActions;
+	long *eofActions;
+	long *eofTargs;
+	long *entryByRegion;
+
+	/* Element counts. */
+	long numStates;
+	long numActions;
+	long numTransKeys;
+	long numSingleLengths;
+	long numRangeLengths;
+	long numIndexOffsets;
+	long numTransTargsWI;
+	long numTransActionsWI;
+	long numRegions;
+
+	/* Distinguished states. */
+	long startState;
+	long firstFinal;
+	long errorState;
+
+	/* Actions that can be executed by the machine, and how many. */
+	GenAction **actionSwitch;
+	long numActionSwitch;
+};
+
+/* One fixed-size chunk of scanner input. Buffers are chained through next;
+ * FsmRun::run puts each new buffer at the head of the chain and records in
+ * length how much of the previous buffer was used. InputStreamFile::getData
+ * reads queued buffers starting at offset. */
+struct RunBuf
+{
+	char buf[FSM_BUFSIZE];
+	long length;
+	long offset;
+	RunBuf *next;
+};
+
+/* Scanner runtime. Reads data from an InputStream into run buffers, runs
+ * the state machine described by FsmTables over it, and sends the resulting
+ * tokens and ignore tokens to a PdaRun parser. Also supports sending tokens
+ * back to the input when the parser backtracks. */
+struct FsmRun
+{
+	FsmRun( FsmTables *tables );
+	~FsmRun();
+
+	void set_AF_GROUP_MEM();
+
+	/* Sending tokens to the parser. */
+	void sendLangEl( Kid *input );
+	void makeToken( int id, Head *tokdata, bool namedLangEl, int bindId );
+	void translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindId );
+	void sendNamedLangEl();
+	void sendEOF();
+	void sendIgnore( long id );
+	void sendQueuedTokens();
+	void sendToken( long id );
+
+	/* Returning tokens and text to the input. */
+	void sendBackIgnore( Kid *ignore );
+	void sendBack( Kid *input );
+	void queueBack( Kid *input );
+	void sendBackText( const char *data, long length );
+	void emitToken( KlangEl *token );
+	void execAction( GenAction *action );
+
+	/* Running the scanner and managing its input. */
+	long run( PdaRun *parser );
+	void attachInputStream( InputStream *in );
+	void streamPush( const char *data, long length );
+	void undoStreamPush( long length );
+
+	Head *extractToken( long len );
+
+	void execute();
+
+	FsmTables *tables;
+	PdaRun *parser;
+	InputStream *inputStream;
+
+	/* FsmRun State. */
+	/* Current region, current machine state, and act. */
+	int region, cs, act;
+	/* Start and end of the token in progress; tokstart is 0 when no token
+	 * has been started. */
+	char *tokstart, *tokend;
+	/* Scan pointer, end of buffered data, and eof pointer. */
+	char *p, *pe, *peof;
+	/* True once EOF has been sent and not sent back. */
+	bool eofSent;
+	/* Head of the run buffer chain; p and pe point into it. */
+	RunBuf *runBuf;
+	bool gotoResume;
+	/* Running count of token and ignore text lengths sent so far. */
+	long position;
+	/* Per-mark enter/leave pointers; makeToken turns each mark with a
+	 * non-zero leave pointer into a string attribute. */
+	char *mark_enter[32];
+	char *mark_leave[32];
+};
+
+#endif
diff --git a/colm/fsmstate.cpp b/colm/fsmstate.cpp
new file mode 100644
index 00000000..d9df91ad
--- /dev/null
+++ b/colm/fsmstate.cpp
@@ -0,0 +1,467 @@
+/*
+ *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <string.h>
+#include <assert.h>
+#include "fsmgraph.h"
+
+#include <iostream>
+using namespace std;
+
+/* Construct a mark index for the given number of states. The index is a
+ * flat states-by-states array of flags, all initially unmarked. */
+MarkIndex::MarkIndex( int states )
+:
+	numStates(states)
+{
+	/* Only half of the states^2 pairs are ever used, but allocating the
+	 * full square keeps the indexing simple. */
+	const int numPairs = states * states;
+
+	/* Allocate the flags and clear them by hand. */
+	array = new bool[numPairs];
+	memset( array, 0, numPairs * sizeof(bool) );
+}
+
+/* Release the flag array allocated by the constructor. */
+MarkIndex::~MarkIndex()
+{
+	delete [] array;
+}
+
+/* Mark a pair of states, given by number. The order of the two arguments
+ * does not matter: the larger number selects the row and the smaller one
+ * the column. */
+void MarkIndex::markPair(int state1, int state2)
+{
+	int row = state1, col = state2;
+	if ( row < col ) {
+		row = state2;
+		col = state1;
+	}
+
+	array[ row * numStates + col ] = true;
+}
+
+/* Report whether a pair of states has been marked. The order of the two
+ * arguments does not matter. */
+bool MarkIndex::isPairMarked(int state1, int state2)
+{
+	int row = state1, col = state2;
+	if ( row < col ) {
+		row = state2;
+		col = state1;
+	}
+
+	return array[ row * numStates + col ];
+}
+
+/* Create a new fsm state. The state has no out transitions or in
+ * transitions, no entry points, no priority or action data, and no eof
+ * target. */
+FsmState::FsmState()
+:
+	/* No out or in transitions. */
+	outList(),
+	inList(),
+
+	/* No entry points, or epsilon trans. */
+	entryIds(),
+	epsilonTrans(),
+
+	/* Conditions. */
+	stateCondList(),
+
+	/* No transitions in from other states. */
+	foreignInTrans(0),
+
+	/* Only used during merging. Normally null. */
+	stateDictEl(0),
+	eptVect(0),
+
+	/* No state identification bits. */
+	stateBits(0),
+
+	/* No Priority data. */
+	outPriorTable(),
+
+	/* No Action data. */
+	toStateActionTable(),
+	fromStateActionTable(),
+	outActionTable(),
+	outCondSet(),
+	errActionTable(),
+	eofActionTable(),
+
+	/* No eof target. */
+	eofTarget(0)
+{
+}
+
+/* Copy a state. Entry ids, epsilon transitions, conditions, state bits,
+ * priority data and action data are copied from the other state. The out
+ * transitions are duplicated but still point at the other machine's target
+ * states; fixing those up, and building the in lists, is left to the
+ * FsmGraph copy constructor. */
+FsmState::FsmState(const FsmState &other)
+:
+	/* Transition lists start empty and are filled as transitions are
+	 * duplicated and attached. */
+	outList(),
+	inList(),
+
+	/* Sets of integers, these can be copied as they are. */
+	entryIds(other.entryIds),
+	epsilonTrans(other.epsilonTrans),
+
+	/* Condition elements. */
+	stateCondList( other.stateCondList ),
+
+	/* Nothing points in from other states yet. */
+	foreignInTrans(0),
+
+	/* Merge-time data is never copied. */
+	stateDictEl(0),
+	eptVect(0),
+
+	/* State identification bits. */
+	stateBits(other.stateBits),
+
+	/* Priority data. */
+	outPriorTable(other.outPriorTable),
+
+	/* Action data. */
+	toStateActionTable(other.toStateActionTable),
+	fromStateActionTable(other.fromStateActionTable),
+	outActionTable(other.outActionTable),
+	outCondSet(other.outCondSet),
+	errActionTable(other.errActionTable),
+	eofActionTable(other.eofActionTable),
+
+	/* The eof target is not carried over. */
+	eofTarget(0)
+{
+	/* Duplicate each out transition. The copy keeps the original target for
+	 * now; it is corrected once all the states have been created. */
+	for ( TransList::Iter src = other.outList; src.lte(); src++ ) {
+		FsmTrans *dup = new FsmTrans(*src);
+		dup->toState = src->toState;
+		outList.append( dup );
+	}
+}
+
+/* Delete the state dict element, if any. Everything else is cleaned up by
+ * the FsmGraph destructor. */
+FsmState::~FsmState()
+{
+	/* Deleting a null pointer is a no-op, so no check is needed. */
+	delete stateDictEl;
+}
+
+/* Approximate state comparison. Two states that compare equal here can be
+ * merged immediately. Compared in order: final-state status, epsilon
+ * transition sets, state data, then the out transitions pairwise including
+ * their targets. */
+int ApproxCompare::compare( const FsmState *state1 , const FsmState *state2 )
+{
+	/* A final state orders before a non-final one. */
+	bool final1 = ( state1->stateBits & SB_ISFINAL ) != 0;
+	bool final2 = ( state2->stateBits & SB_ISFINAL ) != 0;
+	if ( final1 != final2 )
+		return final1 ? -1 : 1;
+	
+	/* Epsilon transition sets. */
+	int result = CmpEpsilonTrans::compare( state1->epsilonTrans, 
+			state2->epsilonTrans );
+	if ( result != 0 )
+		return result;
+	
+	/* Data stored on the states themselves. */
+	result = FsmGraph::compareStateData( state1, state2 );
+	if ( result != 0 )
+		return result;
+
+	/* Walk both transition lists in step. */
+	PairIter<FsmTrans> outPair( state1->outList.head, state2->outList.head );
+	for ( ; !outPair.end(); outPair++ ) {
+		result = 0;
+		switch ( outPair.userState ) {
+		case RangeInS1:
+			result = FsmGraph::compareFullPtr( outPair.s1Tel.trans, 0 );
+			break;
+		case RangeInS2:
+			result = FsmGraph::compareFullPtr( 0, outPair.s2Tel.trans );
+			break;
+		case RangeOverlap:
+			result = FsmGraph::compareFullPtr( 
+					outPair.s1Tel.trans, outPair.s2Tel.trans );
+			break;
+		case BreakS1:
+		case BreakS2:
+			break;
+		}
+
+		if ( result != 0 )
+			return result;
+	}
+
+	/* No difference found, deem them equal. */
+	return 0;
+}
+
+/* Comparison used by the sort that builds the initial partition. Compared
+ * in order: final-state status, epsilon transition sets, state data, the
+ * state conditions pairwise, then the data (not the targets) of the out
+ * transitions pairwise. */
+int InitPartitionCompare::compare( const FsmState *state1 , const FsmState *state2 )
+{
+	/* A final state orders before a non-final one. */
+	bool final1 = ( state1->stateBits & SB_ISFINAL ) != 0;
+	bool final2 = ( state2->stateBits & SB_ISFINAL ) != 0;
+	if ( final1 != final2 )
+		return final1 ? -1 : 1;
+
+	/* Epsilon transition sets. */
+	int result = CmpEpsilonTrans::compare( state1->epsilonTrans, 
+			state2->epsilonTrans );
+	if ( result != 0 )
+		return result;
+
+	/* Data stored on the states themselves. */
+	result = FsmGraph::compareStateData( state1, state2 );
+	if ( result != 0 )
+		return result;
+
+	/* Walk both condition lists in step. A range present in only one state
+	 * decides the order; overlapping ranges order by cond space pointer. */
+	PairIter<StateCond> condPair( state1->stateCondList.head, state2->stateCondList.head );
+	for ( ; !condPair.end(); condPair++ ) {
+		if ( condPair.userState == RangeInS1 )
+			return 1;
+		if ( condPair.userState == RangeInS2 )
+			return -1;
+
+		if ( condPair.userState == RangeOverlap ) {
+			CondSpace *space1 = condPair.s1Tel.trans->condSpace;
+			CondSpace *space2 = condPair.s2Tel.trans->condSpace;
+			if ( space1 < space2 )
+				return -1;
+			if ( space1 > space2 )
+				return 1;
+		}
+	}
+
+	/* Walk both transition lists in step, comparing transition data. */
+	PairIter<FsmTrans> outPair( state1->outList.head, state2->outList.head );
+	for ( ; !outPair.end(); outPair++ ) {
+		result = 0;
+		switch ( outPair.userState ) {
+		case RangeInS1:
+			result = FsmGraph::compareDataPtr( outPair.s1Tel.trans, 0 );
+			break;
+		case RangeInS2:
+			result = FsmGraph::compareDataPtr( 0, outPair.s2Tel.trans );
+			break;
+		case RangeOverlap:
+			result = FsmGraph::compareDataPtr( 
+					outPair.s1Tel.trans, outPair.s2Tel.trans );
+			break;
+		case BreakS1:
+		case BreakS2:
+			break;
+		}
+
+		if ( result != 0 )
+			return result;
+	}
+
+	return 0;
+}
+
+/* Comparison used by the sort that refines partitions. Two states compare
+ * equal when every pair of their out transitions compares equal under
+ * FsmGraph::comparePartPtr. */
+int PartitionCompare::compare( const FsmState *state1, const FsmState *state2 )
+{
+	/* Walk both transition lists in step. */
+	PairIter<FsmTrans> outPair( state1->outList.head, state2->outList.head );
+	for ( ; !outPair.end(); outPair++ ) {
+		int result = 0;
+		switch ( outPair.userState ) {
+		case RangeInS1:
+			result = FsmGraph::comparePartPtr( outPair.s1Tel.trans, 0 );
+			break;
+		case RangeInS2:
+			result = FsmGraph::comparePartPtr( 0, outPair.s2Tel.trans );
+			break;
+		case RangeOverlap:
+			result = FsmGraph::comparePartPtr( 
+					outPair.s1Tel.trans, outPair.s2Tel.trans );
+			break;
+		case BreakS1:
+		case BreakS2:
+			break;
+		}
+
+		if ( result != 0 )
+			return result;
+	}
+
+	return 0;
+}
+
+/* Decide whether a pair of states should be marked. The pair is marked as
+ * soon as FsmGraph::shouldMarkPtr says so for any pair of their out
+ * transitions. */
+bool MarkCompare::shouldMark( MarkIndex &markIndex, const FsmState *state1, 
+			const FsmState *state2 )
+{
+	/* Walk both transition lists in step. */
+	PairIter<FsmTrans> outPair( state1->outList.head, state2->outList.head );
+	for ( ; !outPair.end(); outPair++ ) {
+		bool mark = false;
+		switch ( outPair.userState ) {
+		case RangeInS1:
+			mark = FsmGraph::shouldMarkPtr( markIndex, outPair.s1Tel.trans, 0 );
+			break;
+		case RangeInS2:
+			mark = FsmGraph::shouldMarkPtr( markIndex, 0, outPair.s2Tel.trans );
+			break;
+		case RangeOverlap:
+			mark = FsmGraph::shouldMarkPtr( markIndex,
+					outPair.s1Tel.trans, outPair.s2Tel.trans );
+			break;
+		case BreakS1:
+		case BreakS2:
+			break;
+		}
+
+		if ( mark )
+			return true;
+	}
+
+	return false;
+}
+
+/*
+ * Transition Comparison.
+ */
+
+/* Compare the partitions of two transitions' target states. If trans1 is
+ * null the pair compares equal. If trans1 is set then trans2 must be set
+ * too; the initial partitioning is expected to guarantee this. A missing
+ * target orders before a present one, and two present targets are ordered
+ * by their partition pointers. Returns -1, 0 or 1. */
+int FsmGraph::comparePartPtr( FsmTrans *trans1, FsmTrans *trans2 )
+{
+	if ( trans1 != 0 ) {
+		/* trans2 is dereferenced below. Make the precondition explicit so
+		 * that a violation stops in debug builds instead of dereferencing a
+		 * null pointer, as shouldMarkPtr does for its own precondition. */
+		assert( trans2 != 0 );
+
+		if ( trans1->toState == 0 && trans2->toState != 0 )
+			return -1;
+		else if ( trans1->toState != 0 && trans2->toState == 0 )
+			return 1;
+		else if ( trans1->toState != 0 ) {
+			/* Both of targets are set. */
+			return CmpOrd< MinPartition* >::compare( 
+				trans1->toState->alg.partition, trans2->toState->alg.partition );
+		}
+	}
+	return 0;
+}
+
+
+/* Compare two transition pointers by transition data only; target and
+ * source states are not considered. Either pointer may be null: a null
+ * pointer orders before a non-null one and two nulls are equal. */
+int FsmGraph::compareDataPtr( FsmTrans *trans1, FsmTrans *trans2 )
+{
+	if ( trans1 == 0 )
+		return trans2 != 0 ? -1 : 0;
+
+	if ( trans2 == 0 )
+		return 1;
+
+	/* Both are set, the transition data decides. */
+	return compareTransData( trans1, trans2 );
+}
+
+/* Compare two transition pointers by target state and then by transition
+ * data; the source state is not considered. Either pointer may be null.
+ * When exactly one is set, the set one orders first. Transition data is
+ * only compared when the targets are equal and non-null. */
+int FsmGraph::compareFullPtr( FsmTrans *trans1, FsmTrans *trans2 )
+{
+	bool has1 = trans1 != 0;
+	bool has2 = trans2 != 0;
+
+	/* Exactly one of the transitions is set. */
+	if ( has1 != has2 )
+		return has1 ? -1 : 1;
+
+	/* Neither is set. */
+	if ( !has1 )
+		return 0;
+
+	/* Both are set: order by target state pointer first. */
+	if ( trans1->toState < trans2->toState )
+		return -1;
+	if ( trans1->toState > trans2->toState )
+		return 1;
+
+	/* Same target. With no target at all there is nothing more to test. */
+	if ( trans1->toState == 0 )
+		return 0;
+
+	return compareTransData( trans1, trans2 );
+}
+
+
+/* Decide whether a pair of transitions causes the owning state pair to be
+ * marked: true when both transitions are set and the pair of their target
+ * states is already marked in markIndex. */
+bool FsmGraph::shouldMarkPtr( MarkIndex &markIndex, FsmTrans *trans1, 
+				FsmTrans *trans2 )
+{
+	bool has1 = trans1 != 0;
+	bool has2 = trans2 != 0;
+
+	if ( has1 != has2 ) {
+		/* Exactly one of the transitions is set. The initial mark round
+		 * should rule out this case. */
+		assert( false );
+		return false;
+	}
+
+	/* Neither of the transitions is set. */
+	if ( !has1 )
+		return false;
+
+	/* Both are set: the pair is marked if the target pair is marked. */
+	return markIndex.isPairMarked( trans1->toState->alg.stateNum, 
+			trans2->toState->alg.stateNum );
+}
+
+
diff --git a/colm/input.cpp b/colm/input.cpp
new file mode 100644
index 00000000..d9a3c7e0
--- /dev/null
+++ b/colm/input.cpp
@@ -0,0 +1,144 @@
+/*
+ *  Copyright 2007, 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "input.h"
+#include "colm.h"
+#include "fsmrun.h"
+#include <stdio.h>
+#include <iostream>
+
+using std::cerr;
+using std::endl;
+
+/*
+ * String
+ */
+
+int InputStreamString::getData( char *dest, int length )
+{
+	/* Hand out at most what is left between the read offset and the end
+	 * of the string. */
+	const int remaining = data.length() - offset;
+	const int take = remaining < length ? remaining : length;
+
+	memcpy( dest, data.data + offset, take );
+	offset += take;
+
+	/* Reaching the end of the string is what raises the EOF flag, so the
+	 * read that returns the final bytes also sets it. */
+	eof = eof || offset == data.length();
+	return take;
+}
+
+void InputStreamString::pushBack( char *data, long len )
+{
+	assert( len <= offset );	/* cannot rewind past the start of the string */
+	offset -= len;	/* rewind only; the data argument is not read. NOTE(review): eof is not cleared here - confirm intended */
+}
+
+/*
+ * File
+ */
+
+/* End of input: no pushed-back buffers are pending and stdio has flagged
+ * end-of-file on the stream. */
+int InputStreamFile::isEOF()
+	{ return queue != 0 ? 0 : feof( file ) != 0; }
+
+/* Reports the same condition as isEOF(): nothing is queued from push-back
+ * and stdio has flagged end-of-file on the stream. */
+int InputStreamFile::needFlush()
+	{ return queue != 0 ? 0 : feof( file ) != 0; }
+
+int InputStreamFile::getData( char *dest, int length )
+{
+	/* With nothing pushed back, read straight from the file. */
+	if ( queue == 0 )
+		return fread( dest, 1, length, file );
+	/* Pushed-back data is served first, and only from the head buffer. */
+	RunBuf *head = queue;
+	long avail = head->length - head->offset;
+	bool drains = length >= avail;
+	long count = drains ? avail : length;
+	memcpy( dest, &head->buf[head->offset], count );
+	if ( drains ) {
+		/* The head buffer is used up: unlink it and free it. */
+		queue = head->next;
+		delete head;
+	}
+	else {
+		/* Part of the head buffer remains for the next call. */
+		head->offset += length;
+	}
+	return count;
+}
+
+void InputStreamFile::pushBack( RunBuf *runBuf )
+{
+	runBuf->next = queue;	/* link in front of whatever is already queued */
+	queue = runBuf;	/* getData() reads from the head, so this buffer is served first */
+}
+
+/*
+ * FD
+ */
+
+/* End of input: no pushed-back buffers are pending and getData() has
+ * already raised the eof flag. */
+int InputStreamFD::isEOF()
+	{ return queue != 0 ? 0 : eof; }
+
+/* Reports the same condition as isEOF(): nothing is queued from push-back
+ * and getData() has already raised the eof flag. */
+int InputStreamFD::needFlush()
+	{ return queue != 0 ? 0 : eof; }
+
+void InputStreamFD::pushBack( RunBuf *runBuf )
+{
+	runBuf->next = queue;	/* link in front of whatever is already queued */
+	queue = runBuf;	/* getData() reads from the head, so this buffer is served first */
+}
+
+int InputStreamFD::getData( char *dest, int length )
+{
+	/* Pushed-back buffers are served before the descriptor is touched. */
+	if ( queue != 0 ) {
+		long avail = queue->length - queue->offset;
+		if ( length >= avail ) {
+			/* Head buffer used up: copy the rest, unlink it, free it. */
+			memcpy( dest, &queue->buf[queue->offset], avail );
+			RunBuf *del = queue;
+			queue = queue->next;
+			delete del;
+			return avail;
+		}
+		/* Partial read: the rest of the head buffer stays queued. */
+		memcpy( dest, &queue->buf[queue->offset], length );
+		queue->offset += length;
+		return length;
+	}
+
+	/* read() returns -1 on failure. That must never reach the caller as a
+	 * byte count, so a failed read ends the input just as a zero read does. */
+	long got = read( fd, dest, length );
+	eof = eof || got <= 0;
+	return got < 0 ? 0 : got;
+}
diff --git a/colm/input.h b/colm/input.h
new file mode 100644
index 00000000..e8e6655b
--- /dev/null
+++ b/colm/input.h
@@ -0,0 +1,145 @@
+/*
+ *  Copyright 2007, 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _INPUT_H
+#define _INPUT_H
+
+#include "astring.h"
+
+struct KlangEl;
+struct Pattern;
+struct PatternItem;
+struct Replacement;
+struct ReplItem;
+struct RunBuf;
+
+struct InputStream
+{
+	virtual ~InputStream() {}
+
+	/* Basic functions. Pure virtual: every stream has to supply them. */
+	virtual int getData( char *dest, int length ) = 0;
+	virtual int isEOF() = 0;
+	virtual int needFlush() = 0;
+
+	virtual void pushBack( char *data, long len ) 
+		{ assert(false); }	/* default: this form of push-back is unsupported */
+	virtual void pushBack( RunBuf *runBuf )
+		{ assert(false); }	/* default: this form of push-back is unsupported */
+
+	/* Named language elements for patterns and replacements. */
+	virtual int isLangEl() { return false; }	/* default: never a language element */
+	virtual KlangEl *getLangEl( long &bindId, char *&data, long &length )
+		{ assert( false ); return 0; }	/* default: unsupported */
+	virtual void pushBackNamed()
+		{ assert( false ); }	/* default: unsupported */
+};
+
+struct InputStreamString : public InputStream
+{
+	InputStreamString( const String &data )
+		: data(data), offset(0), eof(false) {}
+
+	int getData( char *dest, int length );
+	int isEOF() { return eof; }
+	int needFlush() { return eof; }	/* same flag as isEOF() */
+	void pushBack( char *data, long len );
+
+	String data;	/* the text this stream reads from */
+	int offset;	/* read position within data; starts at zero */
+	bool eof;	/* raised by getData() once offset reaches the end of data */
+};
+
+struct InputStreamFile : public InputStream
+{
+	InputStreamFile( FILE *file )
+		: file(file), queue(0) {}
+
+	int getData( char *dest, int length );
+	int isEOF();
+	int needFlush();
+
+	void pushBack( RunBuf *runBuf );	/* only the RunBuf form is overridden */
+
+	FILE *file;	/* read with fread() once the queue is empty */
+	RunBuf *queue;	/* pushed-back buffers, most recently pushed first */
+};
+
+struct InputStreamFD : public InputStream
+{
+	InputStreamFD( long fd )
+		: fd(fd), eof(false), queue(0) {}
+
+	int isEOF();
+	int needFlush();
+	int getData( char *dest, int length );
+
+	void pushBack( RunBuf *runBuf );	/* only the RunBuf form is overridden */
+
+	long fd;	/* descriptor handed to read() once the queue is empty */
+	bool eof;	/* raised by getData() when read() returns zero */
+	RunBuf *queue;	/* pushed-back buffers, most recently pushed first */
+};
+
+struct InputStreamPattern : public InputStream
+{
+	InputStreamPattern( Pattern *pattern );	/* defined outside this header */
+
+	int isLangEl();	/* overrides the InputStream default, which returns false */
+	int getData( char *dest, int length );
+	KlangEl *getLangEl( long &bindId, char *&data, long &length );	/* overrides the asserting default */
+	int isEOF();
+	int needFlush();
+	void pushBack( char *data, long len );	/* only the text form is overridden */
+	void pushBackNamed();	/* overrides the asserting default */
+
+	void backup();
+	int shouldFlush();
+
+	Pattern *pattern;
+	PatternItem *patItem;	/* presumably the current item within pattern - confirm in the implementation */
+	int offset;
+	bool flush;
+};
+
+struct InputStreamRepl : public InputStream
+{
+	InputStreamRepl( Replacement *replacement );	/* defined outside this header */
+
+	int isLangEl();	/* overrides the InputStream default, which returns false */
+	int getData( char *dest, int length );
+	KlangEl *getLangEl( long &bindId, char *&data, long &length );	/* overrides the asserting default */
+	int isEOF();
+	int needFlush();
+	void pushBack( char *data, long len );	/* only the text form is overridden */
+	void pushBackNamed();	/* overrides the asserting default */
+
+	void backup();
+	int shouldFlush();
+
+	Replacement *replacement;
+	ReplItem *replItem;	/* presumably the current item within replacement - confirm in the implementation */
+	int offset;
+	bool flush;
+};
+
+#endif /* _INPUT_H */
+
diff --git a/colm/list.cpp b/colm/list.cpp
new file mode 100644
index 00000000..5d0fc7f1
--- /dev/null
+++ b/colm/list.cpp
@@ -0,0 +1,105 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "pdarun.h"
+
+/* Inserts new_el directly after prev_el. Passing a null prev_el inserts at
+ * the head of the list. The head, the tail and the length are all kept up
+ * to date. */
+void List::addAfter(ListEl *prev_el, ListEl *new_el)
+{
+	/* Work out the neighbours of the new element before touching any
+	 * links. A null prev_el means insertion at the head, in which case
+	 * the old head becomes the successor. */
+	ListEl *succ = ( prev_el != 0 ) ? prev_el->next : head;
+
+	/* Hook the new element up to both neighbours. */
+	new_el->prev = prev_el;
+	new_el->next = succ;
+
+	/* Forward link into new_el: from the predecessor if there is one,
+	 * from the list head otherwise. */
+	if ( prev_el != 0 )
+		prev_el->next = new_el;
+	else
+		head = new_el;
+
+	/* Reverse link into new_el: from the successor if there is one,
+	 * from the list tail otherwise. */
+	if ( succ != 0 )
+		succ->prev = new_el;
+	else
+		tail = new_el;
+
+	/* One more element in the list. */
+	listLen += 1;
+}
+
+/* Inserts new_el directly before next_el. Passing a null next_el appends
+ * at the tail of the list. */
+void List::addBefore(ListEl *next_el, ListEl *new_el)
+{
+	/* Work out the neighbours of the new element before touching any
+	 * links. A null next_el means insertion at the tail, in which case
+	 * the old tail becomes the predecessor. */
+	ListEl *pred = ( next_el != 0 ) ? next_el->prev : tail;
+
+	/* Hook the new element up to both neighbours. */
+	new_el->next = next_el;
+	new_el->prev = pred;
+
+	/* Reverse link into new_el: from the successor if there is one,
+	 * from the list tail otherwise. */
+	if ( next_el != 0 )
+		next_el->prev = new_el;
+	else
+		tail = new_el;
+
+	/* Forward link into new_el: from the predecessor if there is one,
+	 * from the list head otherwise. */
+	if ( pred != 0 )
+		pred->next = new_el;
+	else
+		head = new_el;
+
+	/* One more element in the list. */
+	listLen += 1;
+}
+
+ListEl *List::detach(ListEl *el)
+{
+	/* Only the neighbours, head and tail are relinked. The prev and next
+	 * pointers of el itself are left as they were. */
+	ListEl *pred = el->prev;
+	ListEl *succ = el->next;
+
+	if ( pred != 0 )
+		pred->next = succ;
+	else
+		head = succ;
+	if ( succ != 0 )
+		succ->prev = pred;
+	else
+		tail = pred;
+	listLen -= 1;
+	return el;
+}
+
diff --git a/colm/lmparse.kh b/colm/lmparse.kh
new file mode 100644
index 00000000..598edf84
--- /dev/null
+++ b/colm/lmparse.kh
@@ -0,0 +1,106 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef RLPARSE_H
+#define RLPARSE_H
+
+#include <iostream>
+#include "avltree.h"
+#include "parsedata.h"
+
+struct Parser
+{
+	%%{
+	parser Parser;
+
+	# Use a class for tokens.
+	token uses class Token;
+
+	# Atoms.
+	token TK_Word, TK_Literal, TK_SingleLit, TK_DoubleLit, TK_Number, TK_UInt,
+		TK_Hex, KW_Nil, KW_True, KW_False;
+
+	# General tokens.
+	token TK_DotDot, TK_ColonGt, TK_ColonGtGt, TK_LtColon,
+		TK_DoubleArrow, TK_StarStar, TK_NameSep, TK_DashDash, TK_DoubleEql,
+		TK_NotEql, TK_DoubleColon, TK_LessEql, TK_GrtrEql, TK_RightArrow,
+		TK_LitPat, TK_AmpAmp, TK_BarBar, TK_SqOpen, TK_SqOpenNeg, TK_SqClose,
+		TK_Dash, TK_ReChar;
+
+	# Defining things.
+	token KW_Rl, KW_Def, KW_Lex, KW_Ignore, KW_Token, KW_Commit, KW_Namespace,
+		KW_Literal, KW_ReduceFirst, KW_Map, KW_List, KW_Vector, KW_Global,
+		KW_Iter, KW_Reject, KW_Ptr, KW_Ref, KW_Deref;
+
+	# Language.
+	token KW_If, KW_While, KW_Else, KW_Elsif, KW_For, KW_Return, KW_Yield, KW_In,
+		KW_Break, KW_PrintXML, KW_Print, KW_Require;
+
+	# Patterns.
+	token KW_Match, KW_Construct, KW_Parse, KW_ParseStop, KW_New, KW_MakeToken,
+		KW_MakeTree, KW_TypeId;
+
+	token KW_Include, KW_Preeof;
+
+	}%%
+
+	%% write instance_data;
+
+	void init();
+	int parseLangEl( int type, const Token *token );
+
+	/* Allocates the ParseData for this parser. Only sectionName and pd are set
+	 * here; the list pointers below are left for the grammar actions. */
+	Parser( const char *fileName, const char *sectionName, const InputLoc &sectionLoc )
+		: sectionName(sectionName)
+	{
+		pd = new ParseData( fileName, sectionName, sectionLoc, std::cout );
+	}
+	int token( InputLoc &loc, int tokId, char *tokstart, int toklen );
+	void addRegularDef( const InputLoc &loc, Namespace *nspace, 
+		const String &name, JoinOrLm *joinOrLm, bool isInstance );
+	void addProduction( InputLoc &loc, const String &name, 
+		ProdElList *prodElList, bool commit, CodeBlock *redBlock );
+
+	/* Report an error encountered by the parser. */
+	ostream &parse_error( int tokId, Token &token );
+
+	ParseData *pd;	/* allocated in the constructor */
+
+	/* The name of the root section, this does not change during an include. */
+	const char *sectionName;
+
+	NameRef nameRef;
+	NameRefList nameRefList;
+
+	KlangElVect langElVect;
+
+	PatternItemList *patternItemList;	/* not set by the constructor */
+	ReplItemList *replItemList;	/* not set by the constructor */
+	RegionVect regionStack;
+	NamespaceVect namespaceStack;
+
+	String curDefineId;
+	ProdElList *curProdElList;	/* not set by the constructor */
+};
+
+%% write token_defs;
+
+#endif
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
new file mode 100644
index 00000000..ef04b711
--- /dev/null
+++ b/colm/lmparse.kl
@@ -0,0 +1,2013 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <errno.h>
+
+#include "config.h"
+#include "lmparse.h"
+#include "colm.h"
+
+using std::cout;
+using std::cerr;
+using std::endl;
+
+ParserDict parserDict;
+
+%%{
+
+parser Parser;
+
+include "lmparse.kh";
+
+start: root_item_list
+	final {
+		#ifdef COLM_LOG_COMPILE
+		cerr << "parsing complete" << endl;
+		#endif
+
+		pd->rootCodeBlock = new CodeBlock( $1->stmtList );
+	};
+
+nonterm root_item_list uses lang_stmt_list;
+
+root_item_list: root_item_list root_item
+	final {
+		$$->stmtList = $1->stmtList;
+
+		/* Maybe a statement. */
+		if ( $2->stmt != 0 )
+			$$->stmtList->append( $2->stmt );
+	};
+
+root_item_list: 
+	final {
+		$$->stmtList = new StmtList;
+	};
+
+nonterm root_item uses statement;
+
+root_item: literal_def commit final { $$->stmt = 0; };
+root_item: rl_def commit final { $$->stmt = 0; };
+root_item: token_def commit final { $$->stmt = 0; };
+root_item: cfl_def commit final { $$->stmt = 0; };
+root_item: region_def commit final { $$->stmt = 0; };
+root_item: namespace_def commit final { $$->stmt = 0; };
+root_item: function_def commit final { $$->stmt = 0; };
+root_item: generic_def commit final { $$->stmt = 0; };
+root_item: iter_def commit final { $$->stmt = 0; };
+root_item: global_def commit final { $$->stmt = $1->stmt; };
+root_item: statement commit final { $$->stmt = $1->stmt; };
+root_item: pre_eof commit final { $$->stmt = 0; };
+
+nonterm block_open
+{
+	ObjectDef *localFrame;
+};
+
+block_open: '{' 
+	final {
+		/* Init the object representing the local frame. */
+		$$->localFrame = new ObjectDef( ObjectDef::FrameType, 
+				"local", new ObjFieldMap(), new ObjMethodMap(), pd->nextObjectId++ );
+		pd->curLocalFrame = $$->localFrame;
+	};
+
+block_close: '}' 
+	final {
+		/* Pop the cur local frame, back to the root. */
+		pd->curLocalFrame = pd->rootLocalFrame;
+	};
+
+
+iter_def: 
+	KW_Iter TK_Word '(' opt_param_list ')' block_open lang_stmt_list block_close
+	final {
+		CodeBlock *codeBlock = new CodeBlock( $7->stmtList );
+		codeBlock->localFrame = $6->localFrame;
+		Function *newFunction = new Function( 0, $2->data, 
+				$4->paramList, codeBlock, pd->nextFuncId++, true );
+		pd->functionList.append( newFunction );
+	};
+
+function_def: 
+	type_ref TK_Word '(' opt_param_list ')' block_open lang_stmt_list block_close
+	final {
+		CodeBlock *codeBlock = new CodeBlock( $7->stmtList );
+		codeBlock->localFrame = $6->localFrame;
+		Function *newFunction = new Function( $1->typeRef, $2->data, 
+				$4->paramList, codeBlock, pd->nextFuncId++, false );
+		pd->functionList.append( newFunction );
+	};
+
+nonterm opt_param_list uses param_list;
+
+opt_param_list: param_list
+	final {
+		$$->paramList = $1->paramList;
+	};
+		
+opt_param_list: 
+	final {
+		$$->paramList = new ParameterList;
+	};
+
+nonterm param_list
+{
+	ParameterList *paramList;
+};
+
+param_list: param_list ',' param_var_def
+	final {
+		$$->paramList = $1->paramList;
+		$$->paramList->append( $3->objField );
+	};
+
+param_list: param_var_def
+	final {
+		/* Create the map and insert the first item. */
+		$$->paramList = new ParameterList;
+		$$->paramList->append( $1->objField );
+	};
+
+nonterm param_var_def uses var_def;
+
+param_var_def: var_def
+	final {
+		$$->objField = $1->objField;
+	};
+param_var_def: reference_type_ref TK_Word
+	final {
+		/* Return an object field object. The user of this nonterminal must
+		 * load it into the appropriate map and do error checking. */
+		$$->objField = new ObjField( $2->loc, $1->typeRef, $2->data );
+	};
+
+nonterm reference_type_ref uses type_ref;
+
+reference_type_ref: KW_Ref region_qual TK_Word
+	final {
+		$$->typeRef = new TypeRef( $1->loc, $2->nspaceQual, $3->data );
+		$$->typeRef->isRef = true;
+	};
+
+generic_def: KW_Map TK_Word '[' type_ref type_ref ']'
+	final {
+		Namespace *nspace = namespaceStack.top();
+		KlangEl *langEl = getKlangEl( pd, nspace, $2->data, KlangEl::NonTerm );
+
+		/* Check that the element wasn't previously defined as something else.
+		 * Report the map's own name: curDefineId is only set by cfl_id. */
+		if ( langEl->type != KlangEl::Unknown && langEl->type != KlangEl::NonTerm ) {
+			error($1->loc) << "'" << $2->data << 
+				"' already defined as something else" << endp;
+		}
+
+		GenericType *generic = new GenericType( $2->data, GEN_MAP,
+				pd->nextGenericId++, langEl, $5->typeRef );
+		generic->keyTypeArg = $4->typeRef;
+
+		/* Add one empty production. */
+		ProdElList *emptyList = new ProdElList;
+		addProduction( $1->loc, $2->data, emptyList, false, 0 );
+
+		nspace->genericList.append( generic );
+		langEl->generic = generic;
+	};
+
+generic_def: KW_List TK_Word '[' type_ref ']'
+	final {
+		Namespace *nspace = namespaceStack.top();
+		KlangEl *langEl = getKlangEl( pd, nspace, $2->data, KlangEl::NonTerm );
+
+		/* Check that the element wasn't previously defined as something else.
+		 * Report the list's own name: curDefineId is only set by cfl_id. */
+		if ( langEl->type != KlangEl::Unknown && langEl->type != KlangEl::NonTerm ) {
+			error($1->loc) << "'" << $2->data << 
+				"' already defined as something else" << endp;
+		}
+
+		GenericType *generic = new GenericType( $2->data, GEN_LIST, 
+				pd->nextGenericId++, langEl, $4->typeRef );
+
+		/* Add one empty production. */
+		ProdElList *emptyList = new ProdElList;
+		addProduction( $1->loc, $2->data, emptyList, false, 0 );
+
+		nspace->genericList.append( generic );
+		langEl->generic = generic;
+	};
+
+generic_def: KW_Vector TK_Word '[' type_ref ']'
+	final {
+		GenericType *generic = new GenericType( $2->data, GEN_VECTOR,
+				pd->nextGenericId++, 0, $4->typeRef );
+
+		Namespace *nspace = namespaceStack.top();
+		nspace->genericList.append( generic );
+	};
+
+nonterm global_def uses statement;
+
+global_def: KW_Global var_def opt_def_init
+	final {
+		$$->stmt = 0;
+		ObjectDef *globalObj = pd->globalObjectDef;
+
+		if ( globalObj->objFieldMap->find( $2->objField->name ) != 0 )
+			error($2->objField->loc) << "object field renamed" << endp;
+
+		globalObj->objFieldMap->insert( $2->objField->name, $2->objField );
+
+		if ( $3->expr != 0 ) {
+			LangVarRef *varRef = new LangVarRef( $2->objField->loc, 
+					new QualItemVect, $2->objField->name );
+
+			$$->stmt = new LangStmt( $2->objField->loc, 
+					$3->assignType, varRef, $3->expr );
+		}
+	};
+
+cfl_def: KW_Def cfl_id obj_var_list properties_list cfl_prod_list
+	final {
+		/* Get the language element. */
+		KlangEl *langEl = getKlangEl( pd, namespaceStack.top(), 
+				curDefineId, KlangEl::NonTerm );
+
+		/* Check that the element wasn't previously defined as something else. */
+		if ( langEl->type != KlangEl::Unknown && langEl->type != KlangEl::NonTerm ) {
+			error($1->loc) << "'" << curDefineId << 
+				"' already defined as something else" << endp;
+		}
+
+		/* Make a new object definition. */
+		ObjectDef *objectDef = new ObjectDef( ObjectDef::UserType, curDefineId, 
+				pd->objFieldMap, new ObjMethodMap(), pd->nextObjectId++ ); 
+
+		langEl->objectDef = objectDef;
+	};
+
+cfl_id: TK_Word
+	final {
+		curDefineId = $1->data;
+	};
+
+cfl_prod_list: cfl_prod_list '|' define_prod;
+cfl_prod_list: define_prod;
+
+properties_list: properties_list property;
+properties_list: ;
+
+property: 
+	KW_ReduceFirst
+	final {
+		/* Get the language element. */
+		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
+				curDefineId, KlangEl::NonTerm );
+		prodName->reduceFirst = true;
+	};
+
+define_prod: '[' prod_el_list ']' opt_commit opt_reduce_code
+	final {
+		addProduction( $1->loc, curDefineId, curProdElList, $4->commit, $5->codeBlock ); 
+	};
+
+obj_var_list: obj_var_list var_def
+	final {
+		/* A duplicate field name is reported at the offending field. */
+		if ( pd->objFieldMap->find( $2->objField->name ) != 0 )
+			error($2->objField->loc) << "object field renamed" << endp;
+		pd->objFieldMap->insert( $2->objField->name, $2->objField );
+	};
+
+obj_var_list:
+	final {
+		pd->objFieldMap = new ObjFieldMap;
+	};
+
+
+nonterm type_ref
+{
+	TypeRef *typeRef;
+};
+
+type_ref: basic_type_ref
+	final {
+		$$->typeRef = $1->typeRef;
+	};
+
+nonterm basic_type_ref uses type_ref;
+
+basic_type_ref: region_qual TK_Word opt_repeat
+	final {
+		$$->typeRef = new TypeRef( $2->loc, $1->nspaceQual, $2->data );
+		$$->typeRef->isRepeat = $3->repeat;
+		$$->typeRef->isOpt = $3->opt;
+	};
+
+basic_type_ref: KW_Ptr region_qual TK_Word opt_repeat
+	final {
+		$$->typeRef = new TypeRef( $1->loc, $2->nspaceQual, $3->data );
+		$$->typeRef->isRepeat = $4->repeat;
+		$$->typeRef->isOpt = $4->opt;
+		$$->typeRef->isPtr = true;
+	};
+
+nonterm var_def
+{
+	InputLoc loc;
+	ObjField *objField;
+};
+
+var_def: type_ref TK_Word
+	final {
+		/* Return an object field object. The user of this nonterminal must
+		 * load it into the appropriate map and do error checking. */
+		$$->objField = new ObjField( $2->loc, $1->typeRef, $2->data );
+	};
+
+region_def: 
+	region_head '{' root_item_list '}'
+	final {
+		/* Pop the top of the stack. */
+		regionStack.pop();
+	};
+
+region_head: 
+	KW_Lex TK_Word 
+	final {
+		/* Make the new token region. */
+		TokenRegion *tokenRegion = new TokenRegion( InputLoc(), $2->data,
+				pd->regionList.length(), regionStack.top() );
+		regionStack.top()->childRegions.append( tokenRegion );
+		pd->regionList.append( tokenRegion );
+		JoinOrLm *joinOrLm = new JoinOrLm( tokenRegion );
+		String scannerName( $2->data.length() + 2, "<%s>", $2->data.data );
+		addRegularDef( InputLoc(), namespaceStack.top(), scannerName, joinOrLm, true );
+		regionStack.push( tokenRegion );
+	};
+
+namespace_def: 
+	namespace_head '{' root_item_list '}'
+	final{
+		/* Pop the top of the stack. */
+		namespaceStack.pop();
+	};
+
+namespace_head: 
+	KW_Namespace TK_Word 
+	final {
+		/* Make the new namespace. */
+		Namespace *nspace = new Namespace( InputLoc(), $2->data,
+				pd->namespaceList.length(), namespaceStack.top() );
+		namespaceStack.top()->childNamespaces.append( nspace );
+		pd->namespaceList.append( nspace );
+		namespaceStack.push( nspace );
+	};
+
+pattern_list: pattern_list pattern;
+pattern_list: init_pattern_list pattern;
+
+init_pattern_list:
+	final {
+		patternItemList = new PatternItemList;
+	};
+
+pattern: '"' litpat_el_list '"';
+pattern: '[' pattern_el_list ']';
+
+litpat_el_list: litpat_el_list litpat_el;
+litpat_el_list: ;
+
+litpat_el: TK_LitPat
+	final {
+		PatternItem *patternItem = new PatternItem( $1->data,
+			PatternItem::InputText );
+		patternItemList->append( patternItem );
+	};
+
+litpat_el: '[' pattern_el_list ']';
+
+pattern_el_list: pattern_el_list pattern_el;
+pattern_el_list: ;
+
+pattern_el: opt_label pattern_el_type_or_lit
+	final {
+		/* Store the variable reference in the pattern item. */
+		$2->patternItem->varRef = $1->varRef;
+
+		if ( $1->varRef != 0 ) {	/* a label was given */
+			if ( pd->curLocalFrame->objFieldMap->find( $1->varRef->name ) != 0 ) {
+				error( $1->varRef->loc ) << "variable " << $1->varRef->name << 
+						" redeclared" << endp;
+			}
+
+			TypeRef *typeRef = new TypeRef( InputLoc(), $2->patternItem->factor );
+			ObjField *objField = new ObjField( InputLoc(), typeRef, $1->varRef->name );
+
+			/* Insert it into the field map of the current local frame. */
+			pd->curLocalFrame->objFieldMap->insert( $1->varRef->name, objField );
+		}
+	};
+
+pattern_el: '"' litpat_el_list '"';
+pattern_el: '?' TK_Word
+	final {
+		/* FIXME: Implement */
+		assert(false);
+	};
+
+nonterm pattern_el_type_or_lit
+{
+	PatternItem *patternItem;
+};
+
+pattern_el_type_or_lit: region_qual TK_Word opt_repeat
+	final {
+		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
+				$2->data, 0, $3->opt, $3->repeat );
+		$$->patternItem = new PatternItem( factor, PatternItem::FactorType );
+		patternItemList->append( $$->patternItem );
+	};
+
+pattern_el_type_or_lit: region_qual TK_Literal opt_repeat
+	final {
+		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
+		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
+				literal, 0, $3->opt, $3->repeat );
+		$$->patternItem = new PatternItem( factor, PatternItem::FactorType );
+		patternItemList->append( $$->patternItem );
+	};
+
+nonterm opt_label
+{
+	/* Variable reference. */
+	LangVarRef *varRef;
+};
+
+opt_label: TK_Word ':'
+	final {
+		$$->varRef = new LangVarRef( $1->loc, new QualItemVect, $1->data );
+	};
+opt_label: 
+	final {
+		$$->varRef = 0;
+	};
+
+repl_list: repl_list replacement;
+repl_list: init_repl_list replacement;
+
+init_repl_list: 
+	final {
+		replItemList = new ReplItemList;
+	};
+
+replacement: '"' litrepl_el_list '"';
+replacement: '[' repl_el_list ']';
+
+litrepl_el_list: litrepl_el_list litrepl_el;
+litrepl_el_list: ;
+
+litrepl_el: TK_LitPat
+	final {
+		ReplItem *replItem = new ReplItem( ReplItem::InputText, $1->data );
+		replItemList->append( replItem );
+	};
+
+litrepl_el: '[' repl_el_list ']';
+
+repl_el_list: repl_el_list repl_el;
+repl_el_list: ;
+
+repl_el: var_ref
+	final {
+		ReplItem *replItem = new ReplItem( ReplItem::VarRefType, $1->varRef );
+		replItemList->append( replItem );
+	};
+
+repl_el: region_qual TK_Literal
+	final {
+		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
+		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
+				literal, 0, false, false );
+		ReplItem *replItem = new ReplItem( ReplItem::FactorType, factor );
+		replItemList->append( replItem );
+	};
+
+repl_el: '"' litrepl_el_list '"';
+
+prod_el_list: 
+	prod_el_list prod_el 
+	final {
+		curProdElList->append( $2->factor );
+	};
+
+prod_el_list: 
+	final { curProdElList = new ProdElList; };
+
+nonterm prod_el
+{
+	PdaFactor *factor;
+};
+
+prod_el: 
+	opt_commit region_qual TK_Word opt_repeat
+	final {
+		$$->factor = new PdaFactor( $3->loc, $1->commit, 
+				$2->nspaceQual, $3->data, 0, $4->opt, $4->repeat );
+	};
+
+prod_el: 
+	opt_commit region_qual TK_Literal opt_repeat
+	final {
+		/* Create a new factor node going to a concat literal. */
+		PdaLiteral *literal = new PdaLiteral( $3->loc, *$3 );
+		$$->factor = new PdaFactor( $3->loc, $1->commit, $2->nspaceQual, 
+				literal, 0, $4->opt, $4->repeat );
+	};
+
+nonterm opt_repeat
+{
+	bool opt;
+	bool repeat;
+};
+
+opt_repeat: '?' final { $$->opt = true; $$->repeat = false; };
+opt_repeat: '*' final { $$->opt = false; $$->repeat = true; };
+opt_repeat:     final { $$->opt = false; $$->repeat = false; };
+
+nonterm region_qual
+{
+	NamespaceQual *nspaceQual;
+};
+
+region_qual: region_qual TK_Word TK_DoubleColon
+	final {
+		$$->nspaceQual = $1->nspaceQual;
+		$$->nspaceQual->qualNames.append( $2->data );
+	};
+
+region_qual: 
+	final {
+		$$->nspaceQual = new NamespaceQual( namespaceStack.top(), regionStack.top() );
+	};
+
+literal_def: KW_Literal literal_list;
+
+literal_list: literal_list ',' literal_item;
+literal_list: literal_item;
+
+literal_item: TK_Literal
+	final {
+		/* Create a name for the literal. */
+		String name( 32, "_literal_%.4x", pd->nextTokenId );
+
+		bool insideRegion = regionStack.top() != pd->rootRegion;
+		if ( !insideRegion ) {
+			/* Make a new token region just for the token. */
+			TokenRegion *tokenRegion = new TokenRegion( InputLoc(), $1->data,
+					pd->regionList.length(), regionStack.top() );
+			regionStack.top()->childRegions.append( tokenRegion );
+			pd->regionList.append( tokenRegion );
+			JoinOrLm *joinOrLm = new JoinOrLm( tokenRegion );
+			String scannerName( name.length() + 2, "<%s>", name.data );
+			addRegularDef( InputLoc(), namespaceStack.top(), scannerName, joinOrLm, true );
+			regionStack.push( tokenRegion );
+		}
+
+		bool unusedCI;
+		String interp;
+		prepareLitString( interp, unusedCI, $1->data, $1->loc );
+
+		/* Look for the production's associated region. */
+		Namespace *nspace = namespaceStack.top();
+		TokenRegion *region = regionStack.top();
+
+		LiteralDictEl *ldel = nspace->literalDict.find( interp );
+		if ( ldel != 0 )
+			error( $1->loc ) << "literal already defined in this namespace" << endp;
+		else {
+			/* Create a token for the literal. */
+			KlangEl *newLangEl = getKlangEl( pd, nspace, name, KlangEl::Term );
+			assert( newLangEl != 0 );
+			assert( newLangEl->type == KlangEl::Term );
+			newLangEl->lit = $1->data;
+			newLangEl->isLiteral = true;
+
+			Join *join = new Join( new Expression( new Term( new FactorWithAug(
+				new FactorWithRep( $1->loc, new FactorWithNeg( $1->loc, new Factor(
+				new Literal( $1->loc, $1->data, 
+					Literal::LitString ) ) ) ) ) ) ) );
+			
+			TokenDef *tokenDef = new TokenDef( join, newLangEl, $1->loc, 
+					pd->nextTokenId, nspace, region );
+			newLangEl->tokenDef = tokenDef;
+
+			region->tokenDefList.append( tokenDef );
+			ldel = nspace->literalDict.insert( interp, newLangEl );
+			pd->nextTokenId += 1;
+		}
+
+		if ( !insideRegion ) {
+			/* Leave the region just for this token. */
+			regionStack.pop();
+		}
+	};
+
+token_def: 
+	token_or_ignore token_def_name obj_var_list
+	'/' opt_rl_join '/' opt_translate
+	final {
+		bool ignore = $1->ignore;
+		String name = $2->name;
+		Join *join = $5->join;
+		CodeBlock *transBlock = $7->transBlock;
+
+		/* Check the region if this is for an ignore. */
+		if ( ignore && !pd->insideRegion )
+			error($1->loc) << "ignore tokens can only appear inside scanners" << endp;
+
+		/* Check the name if this is a token. */
+		if ( !ignore && name == 0 )
+			error($1->loc) << "tokens must have a name" << endp;
+
+		/* Give a default name to ignores. */ 
+		if ( name == 0 )
+			name.setAs( 32, "_ignore_%.4x", pd->nextTokenId );
+
+		/* Create the token. */
+		KlangEl *tokEl = getKlangEl( pd, namespaceStack.top(), name, KlangEl::Term );
+		if ( tokEl->type != KlangEl::Unknown && tokEl->type != KlangEl::Term )
+			error($1->loc) << "'" << name << "' already defined as something else" << endp;
+
+		tokEl->type = KlangEl::Term;
+		tokEl->ignore = ignore;
+		tokEl->transBlock = transBlock;
+
+		Namespace *nspace = namespaceStack.top();
+		TokenRegion *region = regionStack.top();
+
+		TokenDef *tokenDef = new TokenDef( join, tokEl, $1->loc, 
+				pd->nextTokenId++, nspace, region );
+		region->tokenDefList.append( tokenDef );
+		tokEl->tokenDef = tokenDef;
+
+		/* Create the object def for the token. */
+		ObjectDef *objectDef = new ObjectDef( ObjectDef::UserType, name, 
+				pd->objFieldMap, new ObjMethodMap(), pd->nextObjectId++ ); 
+
+		tokEl->objectDef = objectDef;
+
+		/* This is created and pushed in the name. */
+		if ( !pd->insideRegion ) {
+			/* Leave the region that we made just for this token. */
+			regionStack.pop();
+		}
+
+		if ( join != 0 ) {
+			/* Create a regular language definition so the token can be used to
+			 * make other tokens */
+			JoinOrLm *joinOrLm = new JoinOrLm( join );
+			addRegularDef( $1->loc, namespaceStack.top(), name, joinOrLm, false );
+		}
+	};
+
+nonterm token_or_ignore
+{
+	InputLoc loc;
+	bool ignore;
+};
+
+token_or_ignore: KW_Token
+	final { $$->loc = $1->loc; $$->ignore = false; };
+	
+token_or_ignore: KW_Ignore
+	final { $$->loc = $1->loc; $$->ignore = true; };
+
+nonterm class token_def_name
+{
+	String name;
+};
+
+token_def_name:
+	opt_name
+	final {
+		String name = $1->name;
+
+		$$->name = name;
+		pd->insideRegion = regionStack.top() != pd->rootRegion;
+		pd->tokenDefName = name;
+
+		if ( !pd->insideRegion ) {
+			/* At the root region: make a region just for this token, register it as instance "<name>" and push it. */
+			TokenRegion *tokenRegion = new TokenRegion( InputLoc(), name,
+					pd->regionList.length(), regionStack.top() );
+			regionStack.top()->childRegions.append( tokenRegion );
+			pd->regionList.append( tokenRegion );
+			JoinOrLm *joinOrLm = new JoinOrLm( tokenRegion );
+			String scannerName( name.length() + 2, "<%s>", name.data );
+			addRegularDef( InputLoc(), namespaceStack.top(), scannerName, joinOrLm, true );
+			regionStack.push( tokenRegion );
+		}
+
+		/* Reset the label id counter. */
+		pd->nextLabelId = 0;
+	};
+
+nonterm class opt_name
+{
+	String name;
+};
+
+opt_name: TK_Word final { $$->name = $1->data; };
+opt_name: ;
+
+nonterm opt_translate
+{
+	CodeBlock *transBlock;
+};
+
+opt_translate: 
+	block_open lang_stmt_list block_close
+	final { 
+		$$->transBlock = new CodeBlock( $2->stmtList );
+		$$->transBlock->localFrame = $1->localFrame;
+	};
+
+opt_translate: 
+	final {
+		$$->transBlock = 0;
+	};
+
+pre_eof: 
+	KW_Preeof block_open lang_stmt_list block_close
+	final {
+		bool insideRegion = regionStack.top() != pd->rootRegion;
+		if ( !insideRegion )
+			error($1->loc) << "preeof must be used inside an existing region" << endl;
+
+		CodeBlock *codeBlock = new CodeBlock( $3->stmtList );
+		codeBlock->localFrame = $2->localFrame;
+
+		TokenRegion *region = regionStack.top();
+		region->preEofBlock = codeBlock;
+	};
+
+rl_def:
+	KW_Rl machine_name '/' rl_join '/'
+	final {
+		/* Generic creation of machine for instantiation and assignment. */
+		JoinOrLm *joinOrLm = new JoinOrLm( $4->join );
+		addRegularDef( $2->loc, namespaceStack.top(), $2->data, joinOrLm, false );
+	};
+
+type class token_data
+{
+	InputLoc loc;
+	String data;
+};
+
+nonterm machine_name uses token_data;
+
+machine_name: 
+	TK_Word
+	final {
+		/* Make/get the priority key. The name may have already been referenced
+		 * and therefore exist. */
+		PriorDictEl *priorDictEl;
+		if ( pd->priorDict.insert( $1->data, pd->nextPriorKey, &priorDictEl ) )
+			pd->nextPriorKey += 1;
+		pd->curDefPriorKey = priorDictEl->value;
+
+		/* Make/get the local error key. */
+		LocalErrDictEl *localErrDictEl;
+		if ( pd->localErrDict.insert( $1->data, pd->nextLocalErrKey, &localErrDictEl ) )
+			pd->nextLocalErrKey += 1;
+		pd->curDefLocalErrKey = localErrDictEl->value;
+
+		$$->loc = $1->loc;
+		$$->data = $1->data;
+	};
+
+#
+# Reduce statements
+#
+
+nonterm opt_reduce_code
+{
+	CodeBlock *codeBlock;
+};
+
+opt_reduce_code: 
+	final { $$->codeBlock = 0; };
+
+opt_reduce_code: 
+	start_reduce lang_stmt_list block_close
+	final { 
+		$$->codeBlock = new CodeBlock( $2->stmtList );
+		$$->codeBlock->localFrame = $1->localFrame;
+	};
+
+nonterm start_reduce uses block_open;
+
+start_reduce: 
+	block_open
+	final {
+		$$->localFrame = $1->localFrame;
+
+		/* Get the language element. */
+		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
+			curDefineId, KlangEl::NonTerm );
+
+		/* References to the reduce item. */
+		pd->addProdRedObjectVar( pd->curLocalFrame, prodName );
+		pd->addProdRHSVars( pd->curLocalFrame, curProdElList );
+	};
+
+nonterm lang_stmt_list
+{
+	StmtList *stmtList;
+};
+
+lang_stmt_list: rec_stmt_list opt_require_stmt
+	final {
+		$$->stmtList = $1->stmtList;
+		if ( $2->stmt != 0 )
+			$$->stmtList->append( $2->stmt );
+	};
+
+nonterm rec_stmt_list uses lang_stmt_list;
+
+rec_stmt_list: rec_stmt_list statement
+	final {
+		$$->stmtList = $1->stmtList;
+
+		/* Maybe a statement was generated. */
+		if ( $2->stmt != 0 )
+			$$->stmtList->append( $2->stmt );
+	};
+
+rec_stmt_list:
+	final {
+		$$->stmtList = new StmtList;
+	};
+
+nonterm opt_def_init
+{
+	LangExpr *expr;
+	LangStmt::Type assignType;
+};
+
+opt_def_init: '=' code_expr
+	final {
+		$$->expr = $2->expr;
+		$$->assignType = LangStmt::AssignType;
+	};
+opt_def_init: 
+	final {
+		$$->expr = 0;
+	};
+
+nonterm statement
+{
+	LangStmt *stmt;
+};
+
+statement: var_def opt_def_init 
+	final {
+		/* By default no statement here. Maybe will add an initialization. */
+		$$->stmt = 0;
+
+		/* Check for redeclaration. */
+		if ( pd->curLocalFrame->objFieldMap->find( $1->objField->name ) != 0 ) {
+			error( $1->objField->loc ) << "variable " << $1->objField->name <<
+					" redeclared" << endp;
+		}
+
+		/* Insert it into the field map. */
+		pd->curLocalFrame->objFieldMap->insert( $1->objField->name, $1->objField );
+
+		if ( $2->expr != 0 ) {
+			LangVarRef *varRef = new LangVarRef( $1->objField->loc, 
+					new QualItemVect, $1->objField->name );
+
+			$$->stmt = new LangStmt( $1->objField->loc, 
+					$2->assignType, varRef, $2->expr );
+		}
+	};
+statement: var_ref '=' code_expr
+	final {
+		$$->stmt = new LangStmt( $2->loc, LangStmt::AssignType, $1->varRef, $3->expr );
+	};
+statement: KW_Print '(' code_expr_list ')'
+	final {
+		$$->stmt = new LangStmt( $1->loc, LangStmt::PrintType, $3->exprVect );
+	};
+statement: KW_PrintXML '(' code_expr_list ')'
+	final {
+		$$->stmt = new LangStmt( $1->loc, LangStmt::PrintXMLType, $3->exprVect );
+	};
+statement: code_expr
+	final {
+		$$->stmt = new LangStmt( InputLoc(), LangStmt::ExprType, $1->expr );
+	};
+statement: KW_If code_expr block_or_single elsif_list
+	final {
+		$$->stmt = new LangStmt( LangStmt::IfType, $2->expr, $3->stmtList, $4->stmtList );
+	};
+statement: KW_Reject
+	final {
+		$$->stmt = new LangStmt( $1->loc, LangStmt::RejectType );
+	};
+statement: KW_While code_expr block_or_single
+	final {
+		$$->stmt = new LangStmt( LangStmt::WhileType, $2->expr, $3->stmtList );
+	};
+statement: KW_For TK_Word ':' type_ref KW_In iter_call block_or_single
+	final {
+		$$->stmt = new LangStmt( $1->loc, LangStmt::ForIterType, 
+			$2->data, $4->typeRef, $6->langTerm, $7->stmtList );
+	};
+statement: KW_Return code_expr
+	final {
+		$$->stmt = new LangStmt( $1->loc, LangStmt::ReturnType, $2->expr );
+	};
+statement: KW_Break
+	final {
+		$$->stmt = new LangStmt( LangStmt::BreakType );
+	};
+statement: KW_Yield var_ref
+	final {
+		$$->stmt = new LangStmt( LangStmt::YieldType, $2->varRef );
+	};
+
+nonterm opt_require_stmt uses statement;
+
+opt_require_stmt: 
+	require_pattern lang_stmt_list
+	final {
+		$$->stmt = new LangStmt( LangStmt::IfType, $1->expr, $2->stmtList, 0 );
+	};
+opt_require_stmt:
+	final {
+		$$->stmt = 0;
+	};
+
+nonterm require_pattern uses code_expr;
+
+require_pattern: 
+	KW_Require var_ref pattern_list 
+	final {
+		Namespace *nspace = namespaceStack.top();
+		TokenRegion *region = regionStack.top();
+		Pattern *pattern = new Pattern( $1->loc, nspace, region, 
+				patternItemList, pd->nextPatReplId++ );
+		pd->patternList.append( pattern );
+
+		$$->expr = new LangExpr(
+				new LangTerm( LangTerm::MatchType, $2->varRef, pattern ) );
+	};
+
+nonterm block_or_single uses lang_stmt_list;
+
+block_or_single: '{' lang_stmt_list '}'
+	final {
+		$$->stmtList = $2->stmtList;
+	};
+block_or_single: statement
+	final { /* A declaration without an initializer yields a null stmt; skip it. */
+		$$->stmtList = new StmtList;
+		if ( $1->stmt != 0 ) $$->stmtList->append( $1->stmt );
+	};
+
+nonterm iter_call
+{
+	LangTerm *langTerm;
+};
+
+iter_call: var_ref '(' opt_code_expr_list ')'
+	final {
+		$$->langTerm = new LangTerm( $1->varRef, $3->exprVect );
+	};
+iter_call: TK_Word
+	final {
+		$$->langTerm = new LangTerm( LangTerm::VarRefType,
+			new LangVarRef( $1->loc, new QualItemVect, $1->data ) );
+	};
+
+nonterm elsif_list
+{
+	StmtList *stmtList;
+};
+
+elsif_list: 
+	elsif_clause elsif_list
+	final {
+		/* Chain whatever follows (more elsif clauses, an else, or null) as this clause's elsePart. */
+		$1->stmt->elsePart = $2->stmtList;
+
+		/* Make a statement list with just this elsif clause in it. It will go into
+		 * the else part of the preceding if or elsif. */
+		$$->stmtList = new StmtList;
+		$$->stmtList->append( $1->stmt );
+	};
+elsif_list:
+	optional_else
+	final {
+		$$->stmtList = $1->stmtList;
+	};
+
+nonterm elsif_clause
+{
+	LangStmt *stmt;
+};
+
+elsif_clause: 
+	KW_Elsif code_expr block_or_single
+	final {
+		$$->stmt = new LangStmt( LangStmt::IfType, $2->expr, $3->stmtList, 0 );
+	};
+
+nonterm optional_else
+{
+	StmtList *stmtList;
+};
+
+optional_else: 
+	KW_Else block_or_single
+	final {
+		$$->stmtList = $2->stmtList;
+	};
+
+optional_else: 
+	final {
+		$$->stmtList = 0;
+	};
+
+nonterm code_expr_list
+{
+	ExprVect *exprVect;
+};
+
+code_expr_list: code_expr_list ',' code_expr
+	final {
+		$$->exprVect = $1->exprVect;
+		$$->exprVect->append( $3->expr );
+	};
+code_expr_list: code_expr
+	final {
+		$$->exprVect = new ExprVect;
+		$$->exprVect->append( $1->expr );
+	};
+
+nonterm opt_code_expr_list uses code_expr_list;
+
+opt_code_expr_list: code_expr_list
+	final {
+		$$->exprVect = $1->exprVect;
+	};
+
+opt_code_expr_list: 
+	final {
+		$$->exprVect = 0;
+	};
+
+#
+# Type list
+#
+
+nonterm type_list
+{
+	TypeRefVect *typeRefVect;
+};
+
+type_list: type_list ',' type_ref
+	final {
+		$$->typeRefVect = $1->typeRefVect;
+		$$->typeRefVect->append( $3->typeRef );
+	};
+type_list: type_ref
+	final {
+		$$->typeRefVect = new TypeRefVect;
+		$$->typeRefVect->append( $1->typeRef );
+	};
+
+nonterm opt_type_list uses type_list;
+
+opt_type_list: type_list
+	final {
+		$$->typeRefVect = $1->typeRefVect;
+	};
+
+opt_type_list: 
+	final {
+		$$->typeRefVect = 0;
+	};
+
+
+#
+# Variable reference
+#
+
+nonterm var_ref
+{
+	LangVarRef *varRef;
+};
+
+var_ref: qual TK_Word
+	final {
+		$$->varRef = new LangVarRef( $2->loc, $1->qual, $2->data );
+	};
+
+nonterm qual
+{
+	QualItemVect *qual;
+};
+
+qual: qual TK_Word '.'
+	final {
+		$$->qual = $1->qual;
+		$$->qual->append( QualItem( $2->loc, $2->data, QualItem::Dot ) );
+	};
+qual: qual TK_Word TK_RightArrow
+	final {
+		$$->qual = $1->qual;
+		$$->qual->append( QualItem( $2->loc, $2->data, QualItem::Arrow ) );
+	};
+qual: 
+	final {
+		$$->qual = new QualItemVect;
+	};
+
+#
+# Code expression
+#
+
+nonterm code_expr
+{
+	LangExpr *expr;
+};
+
+code_expr: code_expr TK_AmpAmp code_relational
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, OP_LogicalAnd, $3->expr );
+	};
+
+code_expr: code_expr TK_BarBar code_relational
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, OP_LogicalOr, $3->expr );
+	};
+
+code_expr: code_relational
+	final {
+		$$->expr = $1->expr;
+	};
+
+nonterm code_relational uses code_expr;
+
+code_relational: code_relational TK_DoubleEql code_additive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, OP_DoubleEql, $3->expr );
+	};
+
+code_relational: code_relational TK_NotEql code_additive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, OP_NotEql, $3->expr );
+	};
+
+code_relational: code_relational '<' code_additive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, '<', $3->expr );
+	};
+
+code_relational: code_relational '>' code_additive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, '>', $3->expr );
+	};
+
+code_relational: code_relational TK_LessEql code_additive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, OP_LessEql, $3->expr );
+	};
+
+code_relational: code_relational TK_GrtrEql code_additive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, OP_GrtrEql, $3->expr );
+	};
+
+
+code_relational: code_additive
+	final {
+		$$->expr = $1->expr;
+	};
+
+nonterm code_additive uses code_expr;
+
+code_additive: code_additive '+' code_multiplicitive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, '+', $3->expr );
+	};
+
+code_additive: code_additive '-' code_multiplicitive
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, '-', $3->expr );
+	};
+
+code_additive: code_multiplicitive
+	final {
+		$$->expr = $1->expr;
+	};
+
+nonterm code_multiplicitive uses code_expr;
+
+code_multiplicitive: code_multiplicitive '*' code_unary
+	final {
+		$$->expr = new LangExpr( $2->loc, $1->expr, '*', $3->expr );
+	};
+
+code_multiplicitive: code_unary
+	final {
+		$$->expr = $1->expr;
+	};
+
+nonterm code_unary uses code_expr;
+code_unary: '!' code_factor
+	final {
+		$$->expr = new LangExpr( $1->loc, '!', $2->expr );
+	};
+code_unary: code_factor
+	final {
+		$$->expr = $1->expr;
+	};
+
+
+
+nonterm code_factor uses code_expr;
+
+code_factor: TK_Number
+	final {
+		$$->expr = new LangExpr( new LangTerm( LangTerm::NumberType, $1->data ) );
+	};
+code_factor: TK_Literal
+	final {
+		$$->expr = new LangExpr( new LangTerm( LangTerm::StringType, $1->data ) );
+	};
+code_factor: var_ref '(' opt_code_expr_list ')'
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->varRef, $3->exprVect ) );
+	};
+code_factor: var_ref
+	final {
+		$$->expr = new LangExpr( new LangTerm( LangTerm::VarRefType, $1->varRef ) );
+	};
+code_factor: KW_Match var_ref pattern_list
+	final {
+		Namespace *nspace = namespaceStack.top();
+		TokenRegion *region = regionStack.top();
+		Pattern *pattern = new Pattern( $1->loc, nspace, region, 
+				patternItemList, pd->nextPatReplId++ );
+		pd->patternList.append( pattern );
+
+		$$->expr = new LangExpr( new LangTerm( LangTerm::MatchType, $2->varRef, pattern ) );
+	};
+code_factor: KW_New code_factor
+	final {
+		$$->expr = new LangExpr( new LangTerm( LangTerm::NewType, $2->expr ) );
+	};
+code_factor: 
+	KW_Construct type_ref opt_field_init repl_list
+	final {
+		Namespace *nspace = namespaceStack.top();
+		TokenRegion *region = regionStack.top();
+		Replacement *replacement = new Replacement( nspace, region, replItemList, 
+				pd->nextPatReplId++ );
+		pd->replList.append( replacement );
+		$$->expr = new LangExpr( new LangTerm( $1->loc, LangTerm::ConstructType,
+				$2->typeRef, $3->fieldInitVect, replacement ) );
+	};
+code_factor: KW_Parse type_ref '(' opt_code_expr_list ')'
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc, 
+				LangTerm::ParseType, $2->typeRef ) );
+		$$->expr->term->args = $4->exprVect;
+	};
+code_factor: KW_ParseStop type_ref '(' opt_code_expr_list ')'
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc, 
+				LangTerm::ParseStopType, $2->typeRef ) );
+		$$->expr->term->args = $4->exprVect;
+	};
+code_factor: KW_TypeId type_ref
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc,
+				LangTerm::TypeIdType, $2->typeRef ) );
+	};
+code_factor: type_ref KW_In var_ref
+	final {
+		$$->expr = new LangExpr( new LangTerm( $2->loc,
+				LangTerm::SearchType, $1->typeRef, $3->varRef ) );
+	};
+code_factor: KW_Nil
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc, 
+				LangTerm::NilType ) );
+	};
+code_factor: KW_True
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc, 
+				LangTerm::TrueType ) );
+	};
+code_factor: KW_False
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc, 
+				LangTerm::FalseType ) );
+	};
+code_factor: '(' code_expr ')'
+	final {
+		$$->expr = $2->expr;
+	};
+code_factor: KW_MakeTree '(' opt_code_expr_list ')'
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc, 
+				LangTerm::MakeTreeType, $3->exprVect ) );
+	};
+code_factor: KW_MakeToken '(' opt_code_expr_list ')'
+	final {
+		$$->expr = new LangExpr( new LangTerm( $1->loc, 
+				LangTerm::MakeTokenType, $3->exprVect ) );
+	};
+code_factor: KW_Deref code_expr
+	final {
+		$$->expr = new LangExpr( $1->loc, OP_Deref, $2->expr );
+	};
+
+nonterm opt_field_init uses field_init_list;
+
+opt_field_init: '(' opt_field_init_list ')'
+	final {
+		$$->fieldInitVect = $2->fieldInitVect;
+	};
+opt_field_init: 
+	final {
+		$$->fieldInitVect = 0;
+	};
+
+nonterm opt_field_init_list uses field_init_list;
+
+opt_field_init_list: field_init_list 
+	final {
+		$$->fieldInitVect = $1->fieldInitVect;
+	};
+opt_field_init_list: 
+	final { 
+		$$->fieldInitVect = 0;
+	};
+
+nonterm field_init_list
+{
+	FieldInitVect *fieldInitVect;
+};
+
+field_init_list: field_init_list ',' field_init
+	final {
+		$$->fieldInitVect = $1->fieldInitVect;
+		$$->fieldInitVect->append( $3->fieldInit );
+	};
+field_init_list: field_init
+	final {
+		$$->fieldInitVect = new FieldInitVect;
+		$$->fieldInitVect->append( $1->fieldInit );
+	};
+
+nonterm field_init
+{
+	FieldInit *fieldInit;
+};
+
+field_init: TK_Word ':' code_expr
+	final {
+		$$->fieldInit = new FieldInit( $1->loc, $1->data, $3->expr );
+	};
+
+#
+# Regular Expressions
+#
+
+nonterm opt_rl_join uses rl_join;
+
+opt_rl_join: rl_join
+	final {
+		$$->join = $1->join;
+	};
+
+opt_rl_join:
+	final {
+		$$->join = 0;
+	};
+
+nonterm rl_join
+{
+	Join *join;
+};
+
+rl_join: 
+	rl_join ',' rl_expr
+	final {
+		/* Append the expression to the list and return it. */
+		$1->join->exprList.append( $3->expression );
+		$$->join = $1->join;
+	};
+rl_join: 
+	rl_expr 
+	final {
+		$$->join = new Join( $1->expression );
+	};
+
+nonterm rl_expr
+{
+	Expression *expression;
+};
+
+rl_expr: 
+	rl_expr '|' rl_term_short final {
+		$$->expression = new Expression( $1->expression, 
+				$3->term, Expression::OrType );
+	};
+rl_expr: 
+	rl_expr '&' rl_term_short final {
+		$$->expression = new Expression( $1->expression, 
+				$3->term, Expression::IntersectType );
+	};
+# This priority specification overrides the innermost parsing strategy, which
+# results in an ordered-choice interpretation of the grammar.
+rl_expr: 
+	rl_expr '-' rl_term_short final {
+		$$->expression = new Expression( $1->expression, 
+				$3->term, Expression::SubtractType );
+	};
+rl_expr: 
+	rl_expr TK_DashDash rl_term_short final {
+		$$->expression = new Expression( $1->expression, 
+				$3->term, Expression::StrongSubtractType );
+	};
+rl_expr: 
+	rl_term_short final {
+		$$->expression = new Expression( $1->term );
+	};
+
+nonterm rl_term_short
+{
+	Term *term;
+};
+
+shortest rl_term_short;
+
+rl_term_short: rl_term 
+	final { $$->term = $1->term; };
+
+nonterm rl_term
+{
+	Term *term;
+};
+
+rl_term:
+	rl_term factor_with_label final {
+		$$->term = new Term( $1->term, $2->factorWithAug );
+	};
+rl_term:
+	rl_term '.' factor_with_label final {
+		$$->term = new Term( $1->term, $3->factorWithAug );
+	};
+rl_term:
+	rl_term TK_ColonGt factor_with_label final {
+		$$->term = new Term( $1->term, $3->factorWithAug, Term::RightStartType );
+	};
+rl_term:
+	rl_term TK_ColonGtGt factor_with_label final {
+		$$->term = new Term( $1->term, $3->factorWithAug, Term::RightFinishType );
+	};
+rl_term:
+	rl_term TK_LtColon factor_with_label final {
+		$$->term = new Term( $1->term, 
+				$3->factorWithAug, Term::LeftType );
+	};
+rl_term:
+	factor_with_label final {
+		$$->term = new Term( $1->factorWithAug );
+	};
+
+nonterm factor_with_label
+{
+	FactorWithAug *factorWithAug;
+};
+
+factor_with_label: 
+	factor_with_ep final {
+		$$->factorWithAug = $1->factorWithAug;
+	};
+
+factor_with_label: 
+	TK_Word ':' factor_with_label final {
+		$$->factorWithAug = $3->factorWithAug;
+
+		if ( pd->objFieldMap->find( $1->data ) != 0 )
+			error($1->loc) << "label name \"" << $1->data << "\" already in use" << endp;
+
+		/* Create the object field. */
+		NamespaceQual *qual = new NamespaceQual( namespaceStack.top(), regionStack.top() );
+		TypeRef *typeRef = new TypeRef( $1->loc, qual, "str" );
+		ObjField *objField = new ObjField( $1->loc, typeRef, $1->data );
+
+		/* Insert it into the map. */
+		pd->objFieldMap->insert( $1->data, objField );
+
+		/* Create the enter and leaving actions that will mark the substring. */
+		Action *enter = new Action( MarkEnter, objField );
+		Action *leave = new Action( MarkLeave, objField );
+		pd->actionList.append( enter );
+		pd->actionList.append( leave );
+		
+		/* Add entering and leaving actions. */
+		$$->factorWithAug->actions.append( ParserAction( $1->loc, at_start, 0, enter ) );
+		$$->factorWithAug->actions.append( ParserAction( $1->loc, at_leave, 0, leave ) );
+	};
+
+nonterm factor_with_ep
+{
+	FactorWithAug *factorWithAug;
+};
+
+factor_with_ep: 
+	factor_with_aug final {
+		$$->factorWithAug = $1->factorWithAug;
+	};
+
+nonterm factor_with_aug
+{
+	FactorWithAug *factorWithAug;
+};
+
+factor_with_aug:
+	factor_with_rep final {
+		$$->factorWithAug = new FactorWithAug( $1->factorWithRep );
+	};
+
+
+# The fourth level of precedence. These are the trailing unary operators that
+# allow for repetition.
+
+nonterm factor_with_rep
+{
+	FactorWithRep *factorWithRep;
+};
+
+factor_with_rep:
+	factor_with_rep '*' final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep, 
+				0, 0, FactorWithRep::StarType );
+	};
+factor_with_rep:
+	factor_with_rep TK_StarStar final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep, 
+				0, 0, FactorWithRep::StarStarType );
+	};
+factor_with_rep:
+	factor_with_rep '?' final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep, 
+				0, 0, FactorWithRep::OptionalType );
+	};
+factor_with_rep:
+	factor_with_rep '+' final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep, 
+				0, 0, FactorWithRep::PlusType );
+	};
+factor_with_rep:
+	factor_with_rep '{' factor_rep_num '}' final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep, 
+				$3->rep, 0, FactorWithRep::ExactType );
+	};
+factor_with_rep:
+	factor_with_rep '{' ',' factor_rep_num '}' final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep, 
+				0, $4->rep, FactorWithRep::MaxType );
+	};
+factor_with_rep:
+	factor_with_rep '{' factor_rep_num ',' '}' final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep,
+				$3->rep, 0, FactorWithRep::MinType );
+	};
+factor_with_rep:
+	factor_with_rep '{' factor_rep_num ',' factor_rep_num '}' final {
+		$$->factorWithRep = new FactorWithRep( $2->loc, $1->factorWithRep, 
+				$3->rep, $5->rep, FactorWithRep::RangeType );
+	};
+factor_with_rep:
+	factor_with_neg final {
+		$$->factorWithRep = new FactorWithRep( 
+				$1->factorWithNeg->loc, $1->factorWithNeg );
+	};
+
+nonterm factor_rep_num
+{
+	int rep;
+};
+
+factor_rep_num:
+	TK_UInt final {
+		// Convert the repetition count to an int. Check for overflow.
+		errno = 0;
+		long rep = strtol( $1->data, 0, 10 );
+		if ( errno == ERANGE || rep > INT_MAX ) {
+			// Repetition too large. Recover by returning repetition 1.
+			error($1->loc) << "repetition number " << $1->data << " overflows" << endl;
+			$$->rep = 1;
+		}
+		else {
+			// TK_UInt cannot be negative, so only the upper bound needs checking.
+			$$->rep = (int)rep;
+		}
+	};
+
+
+#
+# The fifth level up in precedence. Negation.
+#
+
+nonterm factor_with_neg
+{
+	FactorWithNeg *factorWithNeg;
+};
+
+factor_with_neg:
+	'!' factor_with_neg final {
+		$$->factorWithNeg = new FactorWithNeg( $1->loc,
+				$2->factorWithNeg, FactorWithNeg::NegateType );
+	};
+factor_with_neg:
+	'^' factor_with_neg final {
+		$$->factorWithNeg = new FactorWithNeg( $1->loc,
+				$2->factorWithNeg, FactorWithNeg::CharNegateType );
+	};
+factor_with_neg:
+	rl_factor final { /* rl_factor leaves factor null after a reported error; do not dereference it. */
+		$$->factorWithNeg = new FactorWithNeg( $1->factor != 0 ? $1->factor->loc : InputLoc(), $1->factor );
+	};
+
+nonterm rl_factor
+{
+	Factor *factor;
+};
+
+rl_factor: 
+	TK_Literal final {
+		/* Create a new factor node going to a concat literal. */
+		$$->factor = new Factor( new Literal( $1->loc, $1->data, Literal::LitString ) );
+	};
+rl_factor: 
+	alphabet_num final {
+		/* Create a new factor node going to a literal number. */
+		$$->factor = new Factor( new Literal( $1->loc, 
+				$1->data, Literal::Number ) );
+	};
+rl_factor:
+	TK_Word final {
+		/* Find the named graph in the namespace on top of the namespace stack. */
+		Namespace *nspace = namespaceStack.top();
+		GraphDictEl *gdNode = nspace->graphDict.find( $1->data );
+		if ( gdNode == 0 ) {
+			/* Unknown name. Recover by returning null as the factor node. */
+			error($1->loc) << "graph lookup of \"" << $1->data << "\" failed" << endl;
+			$$->factor = 0;
+		}
+		else if ( gdNode->isInstance ) {
+			/* Instances cannot be referenced. Recover by returning null as the factor node. */
+			error($1->loc) << "references to graph instantiations not allowed "
+					"in expressions" << endl;
+			$$->factor = 0;
+		}
+		else {
+			/* Create a factor node that is a lookup of an expression. */
+			$$->factor = new Factor( $1->loc, gdNode->value );
+		}
+	};
+rl_factor:
+	TK_SqOpen regular_expr_or_data TK_SqClose final {
+		/* Create a new factor node going to an OR expression. */
+		$$->factor = new Factor( new ReItem( $1->loc, $2->reOrBlock, ReItem::OrBlock ) );
+	};
+rl_factor:
+	TK_SqOpenNeg regular_expr_or_data TK_SqClose final {
+		/* Create a new factor node going to a negated OR expression. */
+		$$->factor = new Factor( new ReItem( $1->loc, $2->reOrBlock, ReItem::NegOrBlock ) );
+	};
+rl_factor:
+	range_lit TK_DotDot range_lit final {
+		/* Create a new factor node going to a range. */
+		$$->factor = new Factor( new Range( $1->literal, $3->literal ) );
+	};
+rl_factor:
+	'(' rl_join ')' final {
+		/* Create a new factor going to a parenthesized join. */
+		$$->factor = new Factor( $2->join );
+	};
+
+nonterm range_lit
+{
+	Literal *literal;
+};
+
+# Literals which can be the end points of ranges.
+range_lit:
+	TK_Literal final {
+		/* Range literals must have only one char. We restrict this in the parse tree. */
+		$$->literal = new Literal( $1->loc, $1->data, Literal::LitString );
+	};
+range_lit:
+	alphabet_num final {
+		/* Create a new literal number. */
+		$$->literal = new Literal( $1->loc, $1->data, Literal::Number );
+	};
+
+nonterm alphabet_num uses token_data;
+
+# Any form of a number that can be used as a basic machine.
+alphabet_num:
+	TK_UInt final { 
+		$$->loc = $1->loc;
+		$$->data = $1->data;
+	};
+alphabet_num:
+	'-' TK_UInt final {
+		$$->loc = $1->loc;
+		$$->data = '-';	/* Keep the sign so the literal is read as negative. */
+		$$->data += $2->data;
+	};
+alphabet_num: 
+	TK_Hex final { 
+		$$->loc = $1->loc;
+		$$->data = $1->data;
+	};
+
+#
+# Regular Expressions.
+#
+
+
+# The data inside of a [] expression in a regular expression. Accepts any
+# number of characters or ranges.
+nonterm regular_expr_or_data
+{
+	ReOrBlock *reOrBlock;
+};
+
+regular_expr_or_data:
+	regular_expr_or_data regular_expr_or_char final {
+		/* An optimization to lessen the tree size. If an or char is directly
+		 * under the left side on the right and the right side is another or
+		 * char then paste them together and return the left side. Otherwise
+		 * just put the two under a new or data node. */
+		if ( $2->reOrItem->type == ReOrItem::Data &&
+				$1->reOrBlock->type == ReOrBlock::RecurseItem &&
+				$1->reOrBlock->item->type == ReOrItem::Data )
+		{
+			/* Append the right side to right side of the left and toss the
+			 * right side. */
+			$1->reOrBlock->item->data += $2->reOrItem->data;
+			delete $2->reOrItem;
+			$$->reOrBlock = $1->reOrBlock;
+		}
+		else {
+			/* Can't optimize, put the left and right under a new node. */
+			$$->reOrBlock = new ReOrBlock( $1->reOrBlock, $2->reOrItem );
+		}
+	};
+regular_expr_or_data:
+	final {
+		$$->reOrBlock = new ReOrBlock();
+	};
+
+# A single character inside of an or expression. Can either be a character or a
+# set of characters.
+nonterm regular_expr_or_char
+{
+	ReOrItem *reOrItem;
+};
+
+regular_expr_or_char:
+	TK_ReChar final {
+		$$->reOrItem = new ReOrItem( $1->loc, $1->data );
+	};
+regular_expr_or_char:
+	TK_ReChar TK_Dash TK_ReChar final {
+		$$->reOrItem = new ReOrItem( $2->loc, $1->data[0], $3->data[0] );
+	};
+
+#  A local state reference. Cannot have :: prefix.
+local_state_ref:
+	no_name_sep state_ref_names;
+
+# Clear the name ref structure.
+no_name_sep:
+	final {
+		nameRef.empty();
+	};
+
+# A qualified state reference.
+state_ref: opt_name_sep state_ref_names;
+
+# Optional leading name separator.
+opt_name_sep:
+	TK_NameSep 
+	final {
+		/* Insert an initial null pointer val to indicate the existence of the
+		 * initial name separator. */
+		nameRef.setAs( 0 );
+	};
+opt_name_sep:
+	final {
+		nameRef.empty();
+	};
+
+# List of names separated by ::
+state_ref_names:
+	state_ref_names TK_NameSep TK_Word
+	final {
+		nameRef.append( $3->data );
+	};
+state_ref_names:
+	TK_Word 
+	final {
+		nameRef.append( $1->data );
+	};
+
+nonterm opt_commit
+{
+	bool commit;
+};
+
+opt_commit: final { $$->commit = false; };
+opt_commit: KW_Commit final { $$->commit = true; };
+
+#
+# Grammar Finished
+#
+
+	write types;
+	write data;
+}%%
+
+void Parser::init()
+{
+
+	/* Set up the root namespace. */
+	const char *rootNamespaceName = "___ROOT_NAMESPACE";
+	Namespace *rootNamespace = new Namespace( InputLoc(), 
+			rootNamespaceName, pd->namespaceList.length(), 0 );
+	pd->namespaceList.append( rootNamespace );
+	namespaceStack.push( rootNamespace );
+	pd->rootNamespace = rootNamespace;
+
+	/* Set up the root token region. */
+	const char *rootRegionName = "___ROOT_REGION";
+	TokenRegion *rootRegion = new TokenRegion( InputLoc(), rootRegionName, 
+			pd->regionList.length(), 0 );
+	pd->regionList.append( rootRegion );
+	JoinOrLm *joinOrLm = new JoinOrLm( rootRegion );
+	addRegularDef( InputLoc(), namespaceStack.top(), rootRegionName, joinOrLm, true );
+	regionStack.push( rootRegion );
+	pd->rootRegion = rootRegion;
+
+	/* Set up the global object. */
+	String global = "global";
+	ObjFieldMap *objFieldMap = new ObjFieldMap;
+	pd->globalObjectDef = new ObjectDef( ObjectDef::UserType, global, 
+			objFieldMap, new ObjMethodMap(), pd->nextObjectId++ ); 
+	
+	/* The eofTokenRegion defaults to the root region. */
+	pd->eofTokenRegion = rootRegion;
+
+	/* Initialize the dictionary of graphs. This is our symbol table. The
+	 * initialization needs to be done on construction which happens at the
+	 * beginning of a machine spec so any assignment operators can reference
+	 * the builtins. */
+	pd->initGraphDict();
+
+	pd->rootLocalFrame = new ObjectDef( ObjectDef::FrameType, 
+				"local", new ObjFieldMap(), new ObjMethodMap(), 
+				pd->nextObjectId++ );
+	pd->curLocalFrame = pd->rootLocalFrame;
+
+	%% write init;
+}
+
+int Parser::parseLangEl( int type, const Token *token )
+{
+	%% write exec;
+	return errCount == 0 ? 0 : -1;
+}
+
+void Parser::addRegularDef( const InputLoc &loc, Namespace *nspace,
+		const String &name, JoinOrLm *joinOrLm, bool isInstance )
+{
+	/* A null result from the insert means the name is already defined. */
+	GraphDictEl *graphEl = nspace->graphDict.insert( name );
+	if ( graphEl == 0 ) {
+		// Recover by ignoring the duplicate.
+		error(loc) << "fsm \"" << name << "\" previously defined" << endl;
+		return;
+	}
+
+	/* New entry: record the definition, the instance flag and the location. */
+	graphEl->value = new VarDef( name, joinOrLm );
+	graphEl->isInstance = isInstance;
+	graphEl->loc = loc;
+	/* If it is an instance, put it on the instance list as well. */
+	if ( isInstance )
+		pd->instanceList.append( graphEl );
+}
+
+void Parser::addProduction( InputLoc &loc, const String &name, 
+		ProdElList *prodElList, bool commit, CodeBlock *redBlock )
+{
+	/* Add a production for 'name': first get its language element. */
+	KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
+			name, KlangEl::NonTerm );
+
+	/* Check that the element wasn't previously defined as something else. */
+	if ( prodName->type != KlangEl::Unknown 
+			&& prodName->type != KlangEl::NonTerm )
+	{
+		error(loc) << "'" << name << "' already defined as something else" << endp;
+	}
+	else {
+		Namespace *nspace = namespaceStack.top();
+
+		prodName->type = KlangEl::NonTerm;
+		Definition *newDef = new Definition( loc, prodName, 
+				prodElList, commit, redBlock,
+				pd->prodList.length(), Definition::Production );
+
+		prodName->defList.append( newDef );
+		pd->prodList.append( newDef );
+
+		/* If the production has the same name as the namespace it is in, then
+		 * also insert it into the symbol map of the parent namespace. */
+		if ( nspace->parentNamespace != 0 && strcmp( name, nspace->name ) == 0 ) {
+			/* NOTE(review): the root namespace appears to be created with a null
+			 * parent in init(), hence the null check in the condition above. */
+			nspace->parentNamespace->symbolMap.insert( name, prodName );
+		}
+	}
+}
+
+ostream &Parser::parse_error( int tokId, Token &token )
+{
+	/* Maintain the error count. */
+	gblErrorCount += 1;
+
+	cerr << token.loc.fileName << ":" << token.loc.line << ":" << token.loc.col << ": ";
+	cerr << "at token ";
+	if ( tokId < 128 )
+		cerr << "\"" << Parser_lelNames[tokId] << "\"";
+	else 
+		cerr << Parser_lelNames[tokId];
+	if ( token.data != 0 )
+		cerr << " with data \"" << token.data << "\"";
+	cerr << ": ";
+	
+	return cerr;
+}
+
+int Parser::token( InputLoc &loc, int tokId, char *tokstart, int toklen )
+{
+	/* Package the scanned text (if any) with its location and feed the parser. */
+	Token tok;
+	tok.loc = loc;
+	if ( toklen > 0 )
+		tok.data.setAs( tokstart, toklen );
+	const int result = parseLangEl( tokId, &tok );
+	if ( result >= 0 )
+		return result;
+
+	/* A negative result is fatal: report the parse error and quit. */
+	parse_error(tokId, tok) << "parse error" << endl;
+	exit(1);
+}
diff --git a/colm/lmscan.h b/colm/lmscan.h
new file mode 100644
index 00000000..06ad6deb
--- /dev/null
+++ b/colm/lmscan.h
@@ -0,0 +1,131 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _RLSCAN_H
+#define _RLSCAN_H
+
+#include <iostream>
+#include <fstream>
+#include <string.h>
+
+#include "colm.h"
+#include "lmparse.h"
+#include "parsedata.h"
+#include "avltree.h"
+#include "vector.h"
+#include "buffer.h"
+
+using std::ifstream;
+using std::istream;
+using std::ostream;
+using std::cout;
+using std::cerr;
+using std::endl;
+
+extern char *Parser_lelNames[];
+
+/* This is used for tracking the current stack of include file/machine pairs. It
+ * is used to detect a recursive include structure. */
+struct IncludeStackItem
+{
+	/* Both pointers are stored exactly as passed in; nothing is copied. */
+	char *fileName;
+	char *sectionName;
+
+	IncludeStackItem( char *fileName, char *sectionName )
+	{
+		this->fileName = fileName;
+		this->sectionName = sectionName;
+	}
+};
+
+typedef Vector<IncludeStackItem> IncludeStack;
+
+/* Lexical scanner for a single input stream.
+ *
+ * Constructing a Scanner also creates and initialises the Parser that will
+ * receive its tokens. do_scan() reads the whole of `input`, turning it into
+ * tokens that are passed to `parser`. The parser is allocated with new and is
+ * not released by this struct (there is no destructor). */
+struct Scanner
+{
+	/* Every scalar member is given a defined starting value here, in
+	 * declaration order, so that nothing is read indeterminate even if a
+	 * method is called before do_scan() has run the generated init code. */
+	Scanner( const char *fileName, istream &input, ostream &output,
+			Parser *inclToParser, char *inclSectionTarg,
+			int includeDepth )
+	: 
+		fileName(fileName), input(input), output(output),
+		inclToParser(inclToParser),
+		inclSectionTarg(inclSectionTarg),
+		includeDepth(includeDepth),
+		cs(0),
+		line(1),
+		word(0), lit(0),
+		word_len(0), lit_len(0),
+		ts(0), te(0),
+		column(1), lastnl(0), 
+		parserExistsError(false),
+		whitespaceOn(true)
+	{
+		parser = new Parser( fileName, "machine", InputLoc() );
+		parser->init();
+	}
+
+	/* True when the file/section pair is already on includeStack. */
+	bool recursiveInclude( char *inclFileName, char *inclSectionName );
+
+	#if 0
+	char *prepareFileName( char *fileName, int len )
+	{
+		bool caseInsensitive;
+		Token tokenFnStr, tokenRes;
+		tokenFnStr.data = fileName;
+		tokenFnStr.length = len;
+		tokenFnStr.prepareLitString( tokenRes, caseInsensitive );
+		return tokenRes.data;
+	}
+	#endif
+
+	void sectionParseInit();
+
+	/* Token emitters. The three-argument form does the work; the other two
+	 * forward to it with a one-character or an empty text range. */
+	void token( int type, char *start, char *end );
+	void token( int type, char c );
+	void token( int type );
+
+	/* Advance `column` past the text of the current match. */
+	void updateCol();
+	void endSection();
+
+	/* Scan the whole of `input`, sending tokens to `parser`. */
+	void do_scan();
+
+	/* Count an error and return cerr primed with "file:line:column: ". */
+	ostream &scan_error();
+
+	const char *fileName;
+	istream &input;
+	ostream &output;
+	Parser *inclToParser;
+	char *inclSectionTarg;
+	int includeDepth;
+
+	/* State of the section_parse machine (do_scan() keeps the state of the
+	 * character-level scanner in a local of the same name). */
+	int cs;
+
+	/* Current line number; starts at 1 and is bumped on every newline. */
+	int line;
+	char *word, *lit;
+	int word_len, lit_len;
+	InputLoc sectionLoc;
+
+	/* Start and end of the current match, maintained by the generated
+	 * scanner code in do_scan(). */
+	char *ts, *te;
+
+	/* Current column; starts at 1 and is reset to 0 on every newline. */
+	int column;
+
+	/* Position of the most recent newline seen since the last updateCol(),
+	 * or 0 if there was none. */
+	char *lastnl;
+
+	/* Set by machine statements, these persist from section to section
+	 * allowing for unnamed sections. */
+	Parser *parser;
+	IncludeStack includeStack;
+
+	/* This is set if ragel has already emitted an error stating that
+	 * no section name has been seen and thus no parser exists. */
+	bool parserExistsError;
+
+	/* This is for inline code. By default it is on. It goes off for
+	 * statements and values in inline blocks which are parsed. */
+	bool whitespaceOn;
+
+	/* Accumulates the text of a double-quoted literal pattern while it is
+	 * being scanned. */
+	Buffer litBuf;
+};
+
+#endif /* _RLSCAN_H */
diff --git a/colm/lmscan.rl b/colm/lmscan.rl
new file mode 100644
index 00000000..6bbc5d00
--- /dev/null
+++ b/colm/lmscan.rl
@@ -0,0 +1,545 @@
+/*
+ *  Copyright 2006-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <fstream>
+#include <string.h>
+
+#include "colm.h"
+#include "lmscan.h"
+#include "lmparse.h"
+#include "parsedata.h"
+#include "avltree.h"
+#include "vector.h"
+
+//#define PRINT_TOKENS
+
+using std::ifstream;
+using std::istream;
+using std::ostream;
+using std::cout;
+using std::cerr;
+using std::endl;
+
+%%{
+	machine section_parse;
+	alphtype int;
+	write data;
+}%%
+
+/* Reset the section_parse machine. The body is generated by Ragel's
+ * "write init" for that machine; do_scan() calls this once before it starts
+ * reading input. */
+void Scanner::sectionParseInit()
+{
+	%% write init;
+}
+
+ostream &Scanner::scan_error()
+{
+	/* Maintain the error count. */
+	gblErrorCount += 1;
+	cerr << fileName << ":" << line << ":" << column << ": ";
+	return cerr;
+}
+
+/* Report whether the given file/section pair is already on the include
+ * stack. Both names are compared with strcmp, so they must be non-null. */
+bool Scanner::recursiveInclude( char *inclFileName, char *inclSectionName )
+{
+	for ( IncludeStack::Iter item = includeStack; item.lte(); item++ ) {
+		const bool sameFile = strcmp( item->fileName, inclFileName ) == 0;
+		if ( sameFile && strcmp( item->sectionName, inclSectionName ) == 0 )
+			return true;
+	}
+	return false;
+}
+
+/* Advance the column counter past the current match.
+ *
+ * The distance is measured to te from the last newline inside the match when
+ * there was one (lastnl), otherwise from the start of the match (ts). The
+ * newline marker is cleared afterwards. */
+void Scanner::updateCol()
+{
+	char *start = ( lastnl != 0 ) ? lastnl : ts;
+	column += te - start;
+	lastnl = 0;
+}
+
+/* Emit a token whose text is the single character c. */
+void Scanner::token( int type, char c )
+{
+	char *first = &c;
+	token( type, first, first + 1 );
+}
+
+/* Emit a token that carries no text. */
+void Scanner::token( int type )
+{
+	char *none = 0;
+	token( type, none, none );
+}
+
+/* Token-level machine. Its alphabet is token ids (alphtype int), not
+ * characters: Scanner::token() runs it over exactly one id per call. */
+%%{
+	machine section_parse;
+	import "lmparse.h";
+
+	# Bookkeeping for the word/literal seen in the current statement.
+	action clear_words { word = lit = 0; word_len = lit_len = 0; }
+	action store_lit { lit = tokdata; lit_len = toklen; }
+
+	# Error reporters. Only incl_err is referenced by the rules below.
+	action mach_err { scan_error() << "bad machine statement" << endl; }
+	action incl_err { scan_error() << "bad include statement" << endl; }
+	action write_err { scan_error() << "bad write statement" << endl; }
+
+	# Runs when an include statement has been recognised. The whole body is
+	# compiled out with #if 0, so at present the action does nothing.
+	action handle_include
+	{
+		#if 0
+		char *inclSectionName = word;
+		char *inclFileName = 0;
+
+		/* Implement defaults for the input file and section name. */
+		if ( inclSectionName == 0 )
+			inclSectionName = parser->sectionName;
+
+		if ( lit != 0 ) 
+			inclFileName = prepareFileName( lit, lit_len );
+		else
+			inclFileName = fileName;
+
+		/* Check for a recursive include structure. Add the current file/section
+		 * name then check if what we are including is already in the stack. */
+		includeStack.append( IncludeStackItem( fileName, parser->sectionName ) );
+
+		if ( recursiveInclude( inclFileName, inclSectionName ) )
+			scan_error() << "include: this is a recursive include operation" << endl;
+		else {
+			/* Open the input file for reading. */
+			ifstream *inFile = new ifstream( inclFileName );
+			if ( ! inFile->is_open() ) {
+				scan_error() << "include: could not open " << 
+						inclFileName << " for reading" << endl;
+			}
+
+			Scanner scanner( inclFileName, *inFile, output, parser,
+					inclSectionName, includeDepth+1 );
+			scanner.do_scan( );
+			delete inFile;
+		}
+
+		/* Remove the last element (len-1) */
+		includeStack.remove( -1 );
+		#endif
+	}
+
+	# The target of an include is a single literal token.
+	include_target = 
+		TK_Literal >clear_words @store_lit;
+
+	# KW_Include <literal> ';'. Any error or eof inside the statement is
+	# reported through incl_err.
+	include_stmt =
+		( KW_Include include_target ';' ) @handle_include
+		<>err incl_err <>eof incl_err;
+
+	# Forward one token to the parser, stamped with the scanner's current
+	# file name, line and column.
+	action handle_token
+	{
+		InputLoc loc;
+
+		#ifdef PRINT_TOKENS
+		cerr << "scanner:" << line << ":" << column << 
+				": sending token to the parser " << Parser_lelNames[*p];
+		cerr << " " << toklen;
+		if ( tokdata != 0 )
+			cerr << " " << tokdata;
+		cerr << endl;
+		#endif
+
+		loc.fileName = fileName;
+		loc.line = line;
+		loc.col = column;
+
+		parser->token( loc, type, tokdata, toklen );
+	}
+
+	# Catch everything else.
+	everything_else = ^( KW_Include ) @handle_token;
+
+	main := ( 
+		include_stmt |
+		everything_else
+	)*;
+}%%
+
+/* Emit one token of the given type with optional text [start, end).
+ *
+ * When start is non-null the text is copied into a fresh NUL-terminated
+ * buffer. The section_parse machine is then run over the single token id,
+ * which is what triggers the actions that hand the token to the parser.
+ * Finally the column counter is advanced via updateCol().
+ *
+ * NOTE(review): tokdata is allocated with new[] and never released in this
+ * function. The store_lit action keeps the pointer in `lit`, and whether the
+ * parser copies the text is not visible here -- confirm ownership before
+ * adding a delete[]. */
+void Scanner::token( int type, char *start, char *end )
+{
+	char *tokdata = 0;
+	int toklen = 0;
+	/* The machine's "input" is the one-element range holding the token id. */
+	int *p = &type;
+	int *pe = &type + 1;
+	int *eof = 0;
+
+	if ( start != 0 ) {
+		toklen = end-start;
+		tokdata = new char[toklen+1];
+		memcpy( tokdata, start, toklen );
+		tokdata[toklen] = 0;
+	}
+
+	%%{
+		machine section_parse;
+		write exec;
+	}%%
+
+	updateCol();
+}
+
+/* Placeholder: currently does nothing. The notes inside record the intended
+ * behaviour, which has not been implemented. */
+void Scanner::endSection( )
+{
+	/* Execute the eof actions for the section parser. */
+	/* Probably use: token( -1 ); */
+}
+
+%%{
+	machine rlscan;
+
+	# This is sent by the driver code.
+	# (do_scan() appends a single 0 character once the input is exhausted.)
+	EOF = 0;
+	
+	# Track position on every newline: remember where it was, restart the
+	# column count and move to the next line.
+	action inc_nl { 
+		lastnl = p; 
+		column = 0;
+		line++;
+	}
+	NL = '\n' @inc_nl;
+
+	# Identifiers, numbers, comments, and other common things.
+	ident = ( alpha | '_' ) ( alpha |digit |'_' )*;
+	number = digit+;
+	hex_number = '0x' [0-9a-fA-F]+;
+
+	# These literal forms are common to C-like host code and ragel.
+	# Both may span lines and allow backslash escapes.
+	s_literal = "'" ([^'\\] | NL | '\\' (any | NL))* "'";
+	d_literal = '"' ([^"\\] | NL | '\\' (any | NL))* '"';
+
+	whitespace = [ \t] | NL;
+	# A '#' comment runs to, and includes, the end of the line.
+	pound_comment = '#' [^\n]* NL;
+
+	# Scanner for the inside of a bracketed character class. It is entered by
+	# fcall from regular_type after '[' or '[^' and returns with fret on ']'.
+	or_literal := |*
+		# Escape sequences in OR expressions.
+		'\\0' => { token( TK_ReChar, '\0' ); };
+		'\\a' => { token( TK_ReChar, '\a' ); };
+		'\\b' => { token( TK_ReChar, '\b' ); };
+		'\\t' => { token( TK_ReChar, '\t' ); };
+		'\\n' => { token( TK_ReChar, '\n' ); };
+		'\\v' => { token( TK_ReChar, '\v' ); };
+		'\\f' => { token( TK_ReChar, '\f' ); };
+		'\\r' => { token( TK_ReChar, '\r' ); };
+		# A backslash followed by a newline produces no token.
+		'\\\n' => { updateCol(); };
+		# Any other escaped character stands for itself (backslash dropped).
+		'\\' any => { token( TK_ReChar, ts+1, te ); };
+
+		# Range dash in an OR expression.
+		'-' => { token( TK_Dash, 0, 0 ); };
+
+		# Terminate an OR expression.
+		']'	=> { token( TK_SqClose ); fret; };
+
+		# End of input inside the class: report it. No fret is issued here.
+		EOF => {
+			scan_error() << "unterminated OR literal" << endl;
+		};
+
+		# Characters in an OR expression.
+		[^\]] => { token( TK_ReChar, ts, te ); };
+
+	*|;
+
+	# Scanner for the text between a pair of '/' characters. The main scanner
+	# enters it with fcall on the opening '/', and the closing '/' returns
+	# with fret.
+	regular_type := |*
+		# Identifiers.
+		ident => { token( TK_Word, ts, te ); } ;
+
+		# Numbers
+		number => { token( TK_UInt, ts, te ); };
+		hex_number => { token( TK_Hex, ts, te ); };
+
+		# Literals, with optionals.
+		# (A trailing 'i' is kept as part of the literal token's text.)
+		( s_literal | d_literal ) [i]? 
+			=> { token( TK_Literal, ts, te ); };
+
+		# Character classes are scanned by or_literal.
+		'[' => { token( TK_SqOpen ); fcall or_literal; };
+		'[^' => { token( TK_SqOpenNeg ); fcall or_literal; };
+
+		# Closing slash: emit it and return to the calling scanner.
+		'/' => { token( '/'); fret; };
+
+		# Ignore.
+		pound_comment => { updateCol(); };
+
+		'..' => { token( TK_DotDot ); };
+		'**' => { token( TK_StarStar ); };
+		'--' => { token( TK_DashDash ); };
+
+		':>'  => { token( TK_ColonGt ); };
+		':>>' => { token( TK_ColonGtGt ); };
+		'<:'  => { token( TK_LtColon ); };
+
+		# Whitespace other than newline.
+		[ \t\r]+ => { updateCol(); };
+
+		# If we are in a single line machine then newline may end the spec.
+		NL => { updateCol(); };
+
+		# Consume eof.
+		EOF;
+
+		# Anything else is sent as a token whose id is the character itself.
+		any => { token( *ts ); } ;
+	*|;
+
+	# Scanner for the body of a double-quoted pattern. The main scanner enters
+	# it with fcall after the opening quote. Plain text is collected in litBuf
+	# and sent as a TK_LitPat token whenever the text is interrupted.
+	literal_pattern := |*
+		# Recognised escapes append the character they denote.
+		'\\' 'a' { litBuf.append( '\a' ); };
+		'\\' 'b' { litBuf.append( '\b' ); };
+		'\\' 't' { litBuf.append( '\t' ); };
+		'\\' 'n' { litBuf.append( '\n' ); };
+		'\\' 'v' { litBuf.append( '\v' ); };
+		'\\' 'f' { litBuf.append( '\f' ); };
+		'\\' 'r' { litBuf.append( '\r' ); };
+
+		# Any other escaped character is appended as itself.
+		'\\' any {
+			litBuf.append( ts[1] );
+		};
+		# Closing quote: flush pending text, emit the quote and return.
+		'"' => {
+			if ( litBuf.length > 0 ) {
+				token( TK_LitPat, litBuf.data, litBuf.data+litBuf.length );
+				litBuf.clear();
+			}
+			token( '"' );
+			fret;
+		};
+		# A newline also ends the pattern. It is added to the text only when
+		# some text is already pending, and a closing quote token is emitted
+		# as if one had been written.
+		NL => {
+			if ( litBuf.length > 0 ) {
+				litBuf.append( '\n' );
+				token( TK_LitPat, litBuf.data, litBuf.data+litBuf.length );
+				litBuf.clear();
+			}
+			token( '"' );
+			fret;
+		};
+		# '[' flushes pending text and hands over to the main scanner until
+		# it returns.
+		'[' => { 
+			if ( litBuf.length > 0 ) {
+				token( TK_LitPat, litBuf.data, litBuf.data+litBuf.length );
+				litBuf.clear();
+			}
+			token( '[' );
+			fcall main;
+		};
+		# Everything else is literal text.
+		any => { 
+			litBuf.append( *ts );
+		};
+	*|;
+
+	# Parser definitions. 
+	#
+	# Top-level scanner. Keywords are listed before the general identifier
+	# rule so that, for matches of equal length, the keyword is chosen. Each
+	# keyword is listed once: a repeated pattern can never be selected over
+	# its first occurrence.
+	main := |*
+		'lex' => { token( KW_Lex ); };
+		'commit' => { token( KW_Commit ); };
+		'token' => { token( KW_Token ); };
+		'literal' => { token( KW_Literal ); };
+		'rl' => { token( KW_Rl ); };
+		'def' => { token( KW_Def ); };
+		'ignore' => { token( KW_Ignore ); };
+		'construct' => { token( KW_Construct ); };
+		'new' => { token( KW_New ); };
+		'print' => { token( KW_Print ); };
+		'if' => { token( KW_If ); };
+		'reject' => { token( KW_Reject ); };
+		'while' => { token( KW_While ); };
+		'else' => { token( KW_Else ); };
+		'elsif' => { token( KW_Elsif ); };
+		'match' => { token( KW_Match ); };
+		'for' => { token( KW_For ); };
+		'iter' => { token( KW_Iter ); };
+		'print_xml' => { token( KW_PrintXML ); };
+		'namespace' => { token( KW_Namespace ); };
+		'map' => { token( KW_Map ); };
+		'list' => { token( KW_List ); };
+		'vector' => { token( KW_Vector ); };
+		'return' => { token( KW_Return ); };
+		'break' => { token( KW_Break ); };
+		'yield' => { token( KW_Yield ); };
+		'typeid' => { token( KW_TypeId ); };
+		'make_token' => { token( KW_MakeToken ); };
+		'make_tree' => { token( KW_MakeTree ); };
+		'reducefirst' => { token( KW_ReduceFirst ); };
+		'in' => { token( KW_In ); };
+		'nil' => { token( KW_Nil ); };
+		'true' => { token( KW_True ); };
+		'false' => { token( KW_False ); };
+		'parse' => { token( KW_Parse ); };
+		'parse_stop' => { token( KW_ParseStop ); };
+		'global' => { token( KW_Global ); };
+		'ptr' => { token( KW_Ptr ); };
+		'ref' => { token( KW_Ref ); };
+		'deref' => { token( KW_Deref ); };
+		'require' => { token( KW_Require ); };
+		'preeof' => { token( KW_Preeof ); };
+
+		# Identifiers.
+		ident => { token( TK_Word, ts, te ); } ;
+
+		number => { token( TK_Number, ts, te ); };
+
+		# A slash opens a section scanned by regular_type, which returns
+		# here on the closing slash.
+		'/' => { 
+			token( '/' ); 
+			fcall regular_type;
+		};
+
+		# '~' introduces a pattern running to the end of the line. It is
+		# sent as if it had been written in double quotes; the text includes
+		# the terminating newline.
+		"~" [^\n]* NL => { 
+			token( '"' );
+			token( TK_LitPat, ts+1, te );
+			token( '"' );
+		};
+
+		s_literal => {
+			token( TK_Literal, ts, te );
+		};
+
+		# A double quote opens a pattern scanned by literal_pattern.
+		'"' => { 
+			token( '"' );
+			litBuf.clear(); 
+			fcall literal_pattern;
+		};
+		# Brackets nest: '[' re-enters this scanner one level deeper.
+		'[' => { 
+			token( '[' ); 
+			fcall main;
+		};
+
+		# ']' returns to the caller, but only when there is one; at the top
+		# level it is just a token.
+		']' => {
+			token( ']' );
+			if ( top > 0 )
+				fret;
+		};
+
+		# Ignore.
+		pound_comment => { updateCol(); };
+
+		'=>' => { token( TK_DoubleArrow ); };
+		'==' => { token( TK_DoubleEql ); };
+		'!=' => { token( TK_NotEql ); };
+		'::' => { token( TK_DoubleColon ); };
+		'<=' => { token( TK_LessEql ); };
+		'>=' => { token( TK_GrtrEql ); };
+		'->' => { token( TK_RightArrow ); };
+		'&&' => { token( TK_AmpAmp ); };
+		'||' => { token( TK_BarBar ); };
+		
+		# Single-character operators are sent with the character as the id.
+		# ('/' is already claimed by the rule further up.)
+		('+' | '-' | '*' | '/' | '(' | ')' | '@' | '$' ) => { token( *ts ); };
+
+
+		# Whitespace other than newline.
+		[ \t\r]+ => { updateCol(); };
+
+		# If we are in a single line machine then newline may end the spec.
+		NL => { updateCol(); };
+
+		# Consume eof.
+		EOF;
+
+		# Anything else is sent as a token whose id is the character itself.
+		any => { token( *ts ); } ;
+	*|;
+}%%
+
+%% write data;
+
+/* Scan the whole input stream and feed the resulting tokens to the parser.
+ *
+ * Input is read into a heap buffer that starts at 8 bytes and doubles whenever
+ * a single match fills it. After each pass of the generated scanner, any
+ * partially matched text (from ts onward) is moved to the front of the buffer
+ * so the next read can continue it. When the stream is exhausted a single 0
+ * character is fed to the scanner, and finally a Parser_tk_eof token is sent
+ * to the parser.
+ *
+ * Exits the process with status 1 if the scanner enters its error state.
+ *
+ * NOTE(review): the fcall stack is a fixed int[32] and nothing in this
+ * function checks `top` against that bound -- confirm how deeply nested input
+ * is handled. */
+void Scanner::do_scan()
+{
+	int bufsize = 8;
+	char *buf = new char[bufsize];
+	const char last_char = 0;
+	/* This cs is local and hides the member of the same name, which belongs
+	 * to the section_parse machine. ts and te are the members. */
+	int cs, act, have = 0;
+	int top, stack[32];
+	bool execute = true;
+
+	sectionParseInit();
+	%% write init;
+
+	while ( execute ) {
+		/* New data goes after the `have` bytes carried over from last time. */
+		char *p = buf + have;
+		int space = bufsize - have;
+
+		if ( space == 0 ) {
+			/* We filled up the buffer trying to scan a token. Grow it. */
+			bufsize = bufsize * 2;
+			char *newbuf = new char[bufsize];
+
+			/* Recompute p and space. */
+			p = newbuf + have;
+			space = bufsize - have;
+
+			/* Patch up pointers possibly in use. */
+			if ( ts != 0 )
+				ts = newbuf + ( ts - buf );
+			te = newbuf + ( te - buf );
+
+			/* Copy the new buffer in. */
+			memcpy( newbuf, buf, have );
+			delete[] buf;
+			buf = newbuf;
+		}
+
+		input.read( p, space );
+		int len = input.gcount();
+
+		/* If we see eof then append the EOF char. */
+	 	if ( len == 0 ) {
+			p[0] = last_char, len = 1;
+			/* This is the final pass through the loop. */
+			execute = false;
+		}
+
+		char *pe = p + len;
+		char *eof = 0;
+		%% write exec;
+
+		/* Check if we failed. */
+		if ( cs == rlscan_error ) {
+			/* Machine failed before finding a token. I'm not yet sure if this
+			 * is reachable. */
+			scan_error() << "scanner error" << endl;
+			exit(1);
+		}
+
+		/* Decide if we need to preserve anything. */
+		char *preserve = ts;
+
+		/* Now set up the prefix. */
+		if ( preserve == 0 )
+			have = 0;
+		else {
+			/* There is data that needs to be shifted over. */
+			have = pe - preserve;
+			/* Source and destination may overlap, hence memmove. */
+			memmove( buf, preserve, have );
+			unsigned int shiftback = preserve - buf;
+			if ( ts != 0 )
+				ts -= shiftback;
+			te -= shiftback;
+
+			preserve = buf;
+		}
+	}
+	delete[] buf;
+
+	/* Tell the parser the input is finished. */
+	InputLoc loc;
+	loc.fileName = "<EOF>";
+	loc.line = line;
+	loc.col = 1;
+	parser->token( loc, Parser_tk_eof, 0, 0 );
+}
+
+/* Construct a Scanner over the given streams.
+ *
+ * NOTE(review): the scanner is created and then destroyed without do_scan()
+ * ever being called, so no input is read. main() builds its own Scanner and
+ * does not use this function -- confirm whether it is still needed. */
+void scan( char *fileName, istream &input, ostream &output )
+{
+	Scanner scanner( fileName, input, output, 0, 0, 0 );
+}
diff --git a/colm/main.cpp b/colm/main.cpp
new file mode 100644
index 00000000..2e78efd7
--- /dev/null
+++ b/colm/main.cpp
@@ -0,0 +1,357 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <stdlib.h>
+#include <string.h>
+#include <stdio.h>
+#include <iostream>
+#include <fstream>
+#include <unistd.h>
+#include <sstream>
+
+#include "colm.h"
+#include "lmscan.h"
+#include "pcheck.h"
+#include "vector.h"
+#include "version.h"
+#include "common.h"
+#include "parsedata.h"
+#include "vector.h"
+#include "version.h"
+#include "fsmcodegen.h"
+#include "dotgen.h"
+
+using std::istream;
+using std::ifstream;
+using std::ostream;
+using std::ios;
+using std::cin;
+using std::cout;
+using std::cerr;
+using std::endl;
+
+/* Graphviz dot file generation. */
+bool graphvizDone = false;
+
+bool printPrintables = false;
+
+using std::ostream;
+using std::istream;
+using std::ifstream;
+using std::ofstream;
+using std::ios;
+using std::cout;
+using std::cerr;
+using std::cin;
+using std::endl;
+
+/* Target language and output style. */
+char defExtension[] = ".cpp";
+
+/* Io globals. */
+istream *inStream = 0;
+ostream *outStream = 0;
+const char *inputFileName = 0;
+const char *outputFileName = 0;
+
+bool generateGraphviz = false;
+bool branchPointInfo = false;
+bool addUniqueEmptyProductions = false;
+
+/* Print version information. */
+void version();
+
+/* Total error count. */
+int gblErrorCount = 0;
+
+/* Print the opening to an error in the input, then return the error ostream. */
+ostream &error( const InputLoc &loc )
+{
+	/* Keep the error count. */
+	gblErrorCount += 1;
+
+	cerr << "error: " << inputFileName << ":" << 
+			loc.line << ":" << loc.col << ": ";
+	return cerr;
+}
+
+/* Print the opening to a program error, then return the error stream. */
+ostream &error()
+{
+	gblErrorCount += 1;
+	cerr << "error: " PROGNAME ": ";
+	return cerr;
+}
+
+
+/* Start a warning message: writes "warning: <input file>: " to cerr and
+ * returns cerr. Warnings do not affect the error count. */
+ostream &warning( )
+{
+	return cerr << "warning: " << inputFileName << ": ";
+}
+
+/* Start a warning message for a position in the input: writes
+ * "warning: <input file>:<line>:<col>: " to cerr and returns cerr. The input
+ * file name must already be set. Warnings do not affect the error count. */
+ostream &warning( const InputLoc &loc )
+{
+	assert( inputFileName != 0 );
+	return cerr << "warning: " << inputFileName << ":" << loc.line << ":" << loc.col << ": ";
+}
+
+/* Write path to out with every backslash doubled; all other characters are
+ * copied unchanged. path must be a NUL-terminated string. */
+void escapeLineDirectivePath( std::ostream &out, char *path )
+{
+	char *cur = path;
+	while ( *cur != 0 ) {
+		const char ch = *cur++;
+		if ( ch == '\\' )
+			out << "\\\\";
+		else
+			out << ch;
+	}
+}
+
+void escapeLineDirectivePath( std::ostream &out, char *path );
+void scan( char *fileName, istream &input );
+
+bool printStatistics = false;
+
+/* Write the command-line help text to cout. */
+void usage()
+{
+	static const char helpText[] =
+"usage: colm [options] file\n"
+"general:\n"
+"   -h, -H, -?, --help   print this usage and exit\n"
+"   -v, --version        print version information and exit\n"
+"   -o <file>            write output to <file>\n"
+"   -i                   show conflict information\n"
+	;
+	cout << helpText;
+}
+
+/* Write the version banner and copyright line to cout. */
+void version()
+{
+	cout << "Colm version " VERSION << " " PUBDATE << endl;
+	cout << "Copyright (c) 2007, 2008 by Adrian Thurston" << endl;
+}
+
+/* Decide on the output file name and open outStream on it.
+ *
+ * When no output name was given one is derived from inputFileName: an input
+ * ending in ".rh" produces a ".h" file, anything else gets defExtension.
+ *
+ * Exits the process with status 1 if the output would be the input file
+ * itself, or if the file cannot be opened for writing. */
+void openOutput( )
+{
+	/* If the output format is code and no output file name is given, then
+	 * make a default. */
+	if ( outputFileName == 0 ) {
+		const char *ext = findFileExtension( inputFileName );
+		if ( ext != 0 && strcmp( ext, ".rh" ) == 0 )
+			outputFileName = fileNameFromStem( inputFileName, ".h" );
+		else
+			outputFileName = fileNameFromStem( inputFileName, defExtension );
+	}
+
+	#ifdef COLM_LOG_COMPILE
+	cerr << "opening output file: " << outputFileName << endl;
+	#endif
+
+	/* Make sure we are not writing to the same file as the input file.
+	 * Opening the ofstream below would truncate it, so reporting the error
+	 * is not enough: stop before the input is destroyed. */
+	if ( outputFileName != 0 && strcmp( inputFileName, outputFileName  ) == 0 ) {
+		error() << "output file \"" << outputFileName  << 
+				"\" is the same as the input file" << endl;
+		exit(1);
+	}
+
+	if ( outputFileName != 0 ) {
+		/* Open the output stream, attaching it to the filter. */
+		ofstream *outFStream = new ofstream( outputFileName );
+
+		if ( !outFStream->is_open() ) {
+			error() << "error opening " << outputFileName << " for writing" << endl;
+			exit(1);
+		}
+
+		outStream = outFStream;
+	}
+	else {
+		/* Writing out to std out. */
+		outStream = &cout;
+	}
+}
+
+/* Compile the generated source file with g++.
+ *
+ * argv0 is the path this program was started with. Its directory part is used
+ * to locate the aapl, colm and common directories and colm/runtime.a, all
+ * relative to the binary. The executable is written to outputFileName with
+ * its extension replaced by ".bin". A failed compile is reported on cout;
+ * nothing is returned to the caller.
+ *
+ * NOTE(review): the file names are placed unquoted into a command run by
+ * system(), so names containing spaces or shell metacharacters will not
+ * behave as intended. */
+void compileOutput( const char *argv0 )
+{
+	/* Find the location of us: everything before the last '/'. With no
+	 * slash at all, or only a leading one, the location is ".". */
+	const char *slash = strrchr( argv0, '/' );
+	size_t dirLen = ( slash != 0 ) ? (size_t)( slash - argv0 ) : 0;
+
+	char *location = new char[dirLen + 2];
+	if ( dirLen == 0 )
+		strcpy( location, "." );
+	else {
+		memcpy( location, argv0, dirLen );
+		location[dirLen] = 0;
+	}
+
+	/* Ownership of the returned name is not visible from here, so it is
+	 * deliberately not released. */
+	char *exec = fileNameFromStem( outputFileName, ".bin" );
+
+	/* location appears four times in the command below. */
+	size_t length = 1024 + 4*strlen(location) + strlen(outputFileName) + strlen(exec);
+	char *command = new char[length];
+	snprintf( command, length,
+		"g++ -Wall -Wwrite-strings"
+		" -I%s/../aapl"
+		" -I%s/../colm"
+		" -I%s/../common"
+		" -g"
+		" -o %s"
+		" %s"
+		" %s/../colm/runtime.a",
+		location, location, location, exec, outputFileName, location );
+	#ifdef COLM_LOG_COMPILE
+	cout << "compiling: " << outputFileName << endl;
+	#endif
+	int res = system( command );
+	if ( res != 0 )
+		cout << "there was a problem compiling the output" << endl;
+
+	delete[] command;
+	delete[] location;
+}
+
+/* Read the command line into the option globals.
+ *
+ * Handles -i, -o <file>, -s, -v, -h/-H/-? and the long forms --help and
+ * --version. A bare argument is taken as the input file name. Problems are
+ * reported through error(), which counts them; the caller decides whether to
+ * stop. The help and version options exit with status 0 straight away. */
+void process_args( int argc, const char **argv )
+{
+	ParamCheck pc( "io:S:M:vHh?-:s", argc, argv );
+
+	while ( pc.check() ) {
+		if ( pc.state == ParamCheck::invalid ) {
+			error() << "-" << pc.parameter << " is an invalid argument" << endl;
+			continue;
+		}
+
+		if ( pc.state == ParamCheck::noparam ) {
+			/* It is interpreted as an input file. Only one is allowed. */
+			if ( *pc.curArg == 0 )
+				error() << "a zero length input file name was given" << endl;
+			else if ( inputFileName != 0 )
+				error() << "more than one input file name was given" << endl;
+			else
+				inputFileName = pc.curArg;
+			continue;
+		}
+
+		if ( pc.state != ParamCheck::match )
+			continue;
+
+		/* A recognised option. */
+		switch ( pc.parameter ) {
+		case 'i':
+			branchPointInfo = true;
+			break;
+
+		case 's':
+			printStatistics = true;
+			break;
+
+		/* Output file; may be given once and must not be empty. */
+		case 'o':
+			if ( *pc.parameterArg == 0 )
+				error() << "a zero length output file name was given" << endl;
+			else if ( outputFileName != 0 )
+				error() << "more than one output file name was given" << endl;
+			else
+				outputFileName = pc.parameterArg;
+			break;
+
+		/* Version and help. */
+		case 'v':
+			version();
+			exit(0);
+		case 'H': case 'h': case '?':
+			usage();
+			exit(0);
+
+		/* Long options arrive as '-' with the name as the argument. */
+		case '-': {
+			const bool wantsHelp = strcasecmp(pc.parameterArg, "help") == 0;
+			if ( wantsHelp ) {
+				usage();
+				exit(0);
+			}
+			if ( strcasecmp(pc.parameterArg, "version") == 0 ) {
+				version();
+				exit(0);
+			}
+			error() << "--" << pc.parameterArg << 
+					" is an invalid argument" << endl;
+			break;
+		}
+		}
+	}
+}
+
+/* Program entry point.
+ *
+ * Processes the command line, opens the input (the named file, or standard
+ * input when none was given), scans and parses it, runs semantic analysis and
+ * finally compiles the generated output. Returns 1, or exits with status 1,
+ * as soon as a stage has recorded an error; returns 0 otherwise. */
+int main(int argc, const char **argv)
+{
+	process_args( argc, argv );
+
+	/* Bail on above errors. */
+	if ( gblErrorCount > 0 )
+		exit(1);
+
+	/* Make sure we are not writing to the same file as the input file. */
+	if ( inputFileName != 0 && outputFileName != 0 && 
+			strcmp( inputFileName, outputFileName  ) == 0 )
+	{
+		error() << "output file \"" << outputFileName  << 
+				"\" is the same as the input file" << endl;
+	}
+
+	/* Open the input file for reading. The local is named so that it does
+	 * not hide the global inStream, which this function leaves untouched. */
+	istream *input;
+	if ( inputFileName != 0 ) {
+		/* Open the input file for reading. */
+		ifstream *inFile = new ifstream( inputFileName );
+		input = inFile;
+		if ( ! inFile->is_open() )
+			error() << "could not open " << inputFileName << " for reading" << endl;
+	}
+	else {
+		inputFileName = "<stdin>";
+		input = &cin;
+	}
+
+	/* Bail on above errors. */
+	if ( gblErrorCount > 0 )
+		exit(1);
+
+	Scanner scanner( inputFileName, *input, cout, 0, 0, 0 );
+	scanner.do_scan();
+
+	/* Parsing complete, check for errors.. */
+	if ( gblErrorCount > 0 )
+		return 1;
+
+	/* Initiate a compile following a parse. */
+	scanner.parser->pd->semanticAnalysis();
+
+	/* Release the output stream before the compiler is run. Only a stream
+	 * that was allocated with new may be deleted; openOutput() can also
+	 * point outStream at cout. Clear the pointer so it is not left dangling. */
+	if ( outStream != 0 && outStream != &cout )
+		delete outStream;
+	outStream = 0;
+
+	compileOutput( argv[0] );
+
+	return 0;
+}
diff --git a/colm/map.cpp b/colm/map.cpp
new file mode 100644
index 00000000..6327b301
--- /dev/null
+++ b/colm/map.cpp
@@ -0,0 +1,806 @@
+/*
+ *  Copyright 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "pdarun.h"
+
+void Map::listAbandon()
+{
+	head = tail = 0;	/* Forget both list ends; no element is freed here. */
+}
+
+void Map::listAddBefore( MapEl *next_el, MapEl *new_el )
+{
+	/* Link new_el into the list just before next_el; a null next_el appends
+	 * at the tail. The next pointer is set regardless of the list state. */
+	new_el->next = next_el; 
+
+	/* Set reverse pointers. */
+	if (next_el == 0) {
+		/* There is no next element. We are inserting at the tail. */
+		new_el->prev = tail;
+		tail = new_el;
+	} 
+	else {
+		/* There is a next element and we can access next's previous. */
+		new_el->prev = next_el->prev;
+		next_el->prev = new_el;
+	} 
+
+	/* Set forward pointers. */
+	if (new_el->prev == 0) {
+		/* There is no previous element. Set the head pointer. */
+		head = new_el;
+	}
+	else {
+		/* There is a previous element, set its next pointer to new_el. */
+		new_el->prev->next = new_el;
+	}
+}
+
+void Map::listAddAfter( MapEl *prev_el, MapEl *new_el )
+{
+	/* Link new_el into the list just after prev_el; a null prev_el inserts
+	 * at the head. The prev pointer is set regardless of the list state. */
+	new_el->prev = prev_el; 
+
+	/* Set forward pointers. */
+	if (prev_el == 0) {
+		/* There was no prev_el, we are inserting at the head. */
+		new_el->next = head;
+		head = new_el;
+	} 
+	else {
+		/* There was a prev_el, we can access previous next. */
+		new_el->next = prev_el->next;
+		prev_el->next = new_el;
+	} 
+
+	/* Set reverse pointers. */
+	if (new_el->next == 0) {
+		/* There is no next element. Set the tail pointer. */
+		tail = new_el;
+	}
+	else {
+		/* There is a next element. Set its prev pointer. */
+		new_el->next->prev = new_el;
+	}
+}
+
+MapEl *Map::listDetach(MapEl *el)
+{
+	/* Set forward pointers to skip over el. */
+	if (el->prev == 0) 
+		head = el->next; 
+	else
+		el->prev->next = el->next; 
+
+	/* Set reverse pointers to skip over el. */
+	if (el->next == 0) 
+		tail = el->prev; 
+	else
+		el->next->prev = el->prev; 
+
+	/* Return the element we detached. Its own next/prev are left as is. */
+	return el;
+}
+
+
+/* Recursive worker for tree copying. Returns the copy of the branch at el. */
+MapEl *Map::copyBranch( Program *p, MapEl *el, Kid *oldNextDown, Kid *&newNextDown )
+{
+	/* Duplicate the element. The pool hands back a fresh element, so el's
+	 * contents (key, tree, height, child links) must be copied in explicitly. */
+	MapEl *newEl = p->mapElPool.allocate();
+	*newEl = *el;
+
+	if ( (Kid*)el == oldNextDown )
+		newNextDown = (Kid*)newEl;
+
+	/* If the left tree is there, copy it. */
+	if ( newEl->left ) {
+		newEl->left = copyBranch( p, newEl->left, oldNextDown, newNextDown );
+		newEl->left->parent = newEl;
+	}
+
+	listAddAfter( tail, newEl );
+
+	/* If the right tree is there, copy it. */
+	if ( newEl->right ) {
+		newEl->right = copyBranch( p, newEl->right, oldNextDown, newNextDown );
+		newEl->right->parent = newEl;
+	}
+
+	return newEl;
+}
+
+/* Once an insertion position is found, attach an element there and rebalance. */
+void Map::attachRebal( MapEl *element, MapEl *parentEl, MapEl *lastLess )
+{
+	/* Increment the number of elements in the tree. */
+	treeSize += 1;
+
+	/* Set element's parent. */
+	element->parent = parentEl;
+
+	/* New element always starts as a leaf with height 1. */
+	element->left = 0;
+	element->right = 0;
+	element->height = 1;
+
+	/* Are we inserting in the tree somewhere? */
+	if ( parentEl != 0 ) {
+		/* We have a parent so we are somewhere in the tree. If the parent
+		 * equals lastLess, then the last traversal in the insertion went
+		 * left, otherwise it went right. */
+		if ( lastLess == parentEl ) {
+			parentEl->left = element;
+
+			listAddBefore( parentEl, element );
+		}
+		else {
+			parentEl->right = element;
+
+			listAddAfter( parentEl, element );
+		}
+	}
+	else {
+		/* No parent element so we are inserting the root. */
+		root = element;
+
+		listAddAfter( tail, element );
+	}
+
+	/* Recalculate the heights, starting at the parent. */
+	recalcHeights(parentEl);
+
+	/* Find the first element whose grandparent is unbalanced. */
+	MapEl *ub = findFirstUnbalGP(element);
+
+	/* Rebalance if one was found. */
+	if ( ub != 0 )
+	{
+		/* The original author expects this single rotation to leave
+		 * the tree properly balanced; no further search is done. */
+		rebalance(ub);
+	}
+}
+
+/**
+ * \brief Insert an existing element into the tree.
+ *
+ * Walks down from the root comparing element's key with the key of each
+ * element visited. On reaching an empty slot the element is attached there and
+ * the tree is rebalanced. On meeting an equal key nothing is inserted. If
+ * lastFound is given it receives the inserted element on success, or the
+ * existing element with the same key on failure. If the element's avl pointers
+ * are already in use then undefined behaviour results.
+ *
+ * \returns The element inserted upon success, null upon failure.
+ */
+MapEl *Map::insert( MapEl *element, MapEl **lastFound )
+{
+	MapEl *above = 0;      /* Parent of the slot being examined. */
+	MapEl *leftTurn = 0;   /* Last element at which the walk went left. */
+	MapEl *cursor = root;
+
+	/* Descend until an empty slot or an equal key turns up. */
+	while ( cursor != 0 ) {
+		long rel = compare( element->getKey(), cursor->getKey() );
+
+		if ( rel == 0 ) {
+			/* Key already present, report the element that holds it. */
+			if ( lastFound != 0 )
+				*lastFound = cursor;
+			return 0;
+		}
+
+		/* Remember where we came from, then step to the proper child. */
+		above = cursor;
+		if ( rel < 0 ) {
+			leftTurn = cursor;
+			cursor = cursor->left;
+		}
+		else {
+			cursor = cursor->right;
+		}
+	}
+
+	/* Fell off the tree without finding the key. Attach underneath the last
+	 * element visited and rebalance. */
+	attachRebal( element, above, leftTurn );
+
+	if ( lastFound != 0 )
+		*lastFound = element;
+	return element;
+}
+
+/**
+ * \brief Insert a new element into the tree with given key.
+ *
+ * Walks down from the root comparing key with the key of each element visited.
+ * If no element holds an equal key, a new element is taken from the program's
+ * map element pool, given the key and a null tree, attached at the empty slot
+ * reached, and the tree is rebalanced. If lastFound is given it receives the
+ * new element on success, or the existing element with the same key on failure.
+ *
+ * \returns The new element upon success, null upon failure.
+ */
+MapEl *Map::insert( Program *p, Tree *key, MapEl **lastFound )
+{
+	MapEl *above = 0;      /* Parent of the slot being examined. */
+	MapEl *leftTurn = 0;   /* Last element at which the walk went left. */
+	MapEl *cursor = root;
+
+	/* Descend until an empty slot or an equal key turns up. */
+	while ( cursor != 0 ) {
+		long rel = compare( key, cursor->getKey() );
+
+		if ( rel == 0 ) {
+			/* Key already present, report the element that holds it. */
+			if ( lastFound != 0 )
+				*lastFound = cursor;
+			return 0;
+		}
+
+		/* Remember where we came from, then step to the proper child. */
+		above = cursor;
+		if ( rel < 0 ) {
+			leftTurn = cursor;
+			cursor = cursor->left;
+		}
+		else {
+			cursor = cursor->right;
+		}
+	}
+
+	/* Fell off the tree without finding the key. Create the new element
+	 * from the pool; it starts out with the key and no tree. */
+	MapEl *element = p->mapElPool.allocate();
+	element->key = key;
+	element->tree = 0;
+
+	/* Attach it underneath the last element visited and rebalance. */
+	attachRebal( element, above, leftTurn );
+
+	if ( lastFound != 0 )
+		*lastFound = element;
+	return element;
+}
+
+/**
+ * \brief Look up the element in the tree that holds the given key.
+ *
+ * \returns The element if key exists, null if the key does not exist.
+ */
+MapEl *Map::find( Tree *key ) const
+{
+	/* Plain search tree descent starting at the root. */
+	MapEl *cursor = root;
+	while ( cursor != 0 ) {
+		long rel = compare( key, cursor->getKey() );
+
+		/* An equal key ends the search. */
+		if ( rel == 0 )
+			break;
+
+		/* A smaller key sends us left, a larger one right. */
+		if ( rel < 0 )
+			cursor = cursor->left;
+		else
+			cursor = cursor->right;
+	}
+
+	/* Either the match, or null after running off the bottom. */
+	return cursor;
+}
+
+
+/**
+ * \brief Look up a key and, if present, detach its element from the tree.
+ *
+ * The element is only unlinked, it is not deleted.
+ *
+ * \returns The element detached if the key is found, otherwise returns null.
+ */
+MapEl *Map::detach( Tree *key )
+{
+	MapEl *found = find( key );
+	if ( found == 0 )
+		return 0;
+
+	/* The element overload does the unlinking and hands the element back. */
+	return detach( found );
+}
+
+/**
+ * \brief Find, detach and delete an element from the tree.
+ *
+ * \returns True if the element was found and deleted, false otherwise.
+ */
+bool Map::remove( Tree *key )
+{
+	/* Assume not found. */
+	bool retVal = false;
+
+	/* Look for the key. */
+	MapEl *element = find( key );
+	if ( element != 0 ) {
+		/* Found: detach, then delete. NOTE(review): the keyed insert takes elements from p->mapElPool; confirm plain delete is right. */
+		detach( element );
+		delete element;
+		retVal = true;
+	}
+
+	return retVal;
+}
+
+/**
+ * \brief Detach and delete an element from the tree.
+ *
+ * If the element is not in the tree then undefined behaviour results.
+ */
+void Map::remove(MapEl *element)
+{
+	/* Unlink first, then delete. NOTE(review): the keyed insert takes elements from p->mapElPool; confirm plain delete is right. */
+	detach(element);
+	delete element;
+}
+
+/**
+ * \brief Detach an element from the tree.
+ *
+ * If the element is not in the tree then undefined behaviour results.
+ *
+ * \returns The element given.
+ */
+MapEl *Map::detach(MapEl *element)
+{
+	MapEl *replacement, *fixfrom;
+	long lheight, rheight;
+
+	/* Remove the element from the ordered list. */
+	listDetach( element );
+
+	/* Update treeSize. */
+	treeSize--;
+
+	/* Find a replacement element. */
+	if (element->right)
+	{
+		/* Find the leftmost element of the right subtree. */
+		replacement = element->right;
+		while (replacement->left)
+			replacement = replacement->left;
+
+		/* If replacing the element with its child then we need to start
+		 * fixing at the replacement, otherwise we start fixing at the
+		 * parent of the replacement. */
+		if (replacement->parent == element)
+			fixfrom = replacement;
+		else
+			fixfrom = replacement->parent;
+
+		removeEl(replacement, replacement->right);
+		replaceEl(element, replacement);
+	}
+	else if (element->left)
+	{
+		/* Find the rightmost element of the left subtree. */
+		replacement = element->left;
+		while (replacement->right)
+			replacement = replacement->right;
+
+		/* If replacing the element with its child then we need to start
+		 * fixing at the replacement, otherwise we start fixing at the
+		 * parent of the replacement. */
+		if (replacement->parent == element)
+			fixfrom = replacement;
+		else
+			fixfrom = replacement->parent;
+
+		removeEl(replacement, replacement->left);
+		replaceEl(element, replacement);
+	}
+	else
+	{
+		/* We need to start fixing at the parent of the element. */
+		fixfrom = element->parent;
+
+		/* The element we are deleting is a leaf element. */
+		removeEl(element, 0);
+	}
+
+	/* If fixfrom is null it means we just deleted
+	 * the root of the tree. */
+	if ( fixfrom == 0 )
+		return element;
+
+	/* Fix the heights after the deletion. */
+	recalcHeights(fixfrom);
+
+	/* Fix every unbalanced element going up in the tree. */
+	MapEl *ub = findFirstUnbalEl(fixfrom);
+	while ( ub )
+	{
+		/* Find the element to rebalance by moving down from the first unbalanced
+		 * element 2 levels in the direction of the greatest heights. On the
+		 * second move down, the heights may be equal ( but not on the first ).
+		 * In which case go in the direction of the first move. */
+		lheight = ub->left ? ub->left->height : 0;
+		rheight = ub->right ? ub->right->height : 0;
+		assert( lheight != rheight );
+		if (rheight > lheight)
+		{
+			ub = ub->right;
+			lheight = ub->left ?
+				ub->left->height : 0;
+			rheight = ub->right ?
+				ub->right->height : 0;
+			if (rheight > lheight)
+				ub = ub->right;
+			else if (rheight < lheight)
+				ub = ub->left;
+			else
+				ub = ub->right;
+		}
+		else
+		{
+			ub = ub->left;
+			lheight = ub->left ?
+				ub->left->height : 0;
+			rheight = ub->right ?
+				ub->right->height : 0;
+			if (rheight > lheight)
+				ub = ub->right;
+			else if (rheight < lheight)
+				ub = ub->left;
+			else
+				ub = ub->left;
+		}
+
+
+		/* rebalance returns the great grand-parent of the element passed
+		 * in, i.e. the parent of the subtree that was just rotated.
+		 * We must continue upward from there rebalancing. */
+		fixfrom = rebalance(ub);
+
+		/* Find the next unbalanced element. */
+		ub = findFirstUnbalEl(fixfrom);
+	}
+
+	return element;
+}
+
+
+void Map::empty()
+{
+	if ( root == 0 )
+		return;
+
+	/* Delete everything below the root, the root itself, then reset. */
+	deleteChildrenOf(root);
+	delete root;
+	root = 0;
+	treeSize = 0;
+	listAbandon();
+}
+
+/* Recursively delete every descendant of element and null both child links. */
+void Map::deleteChildrenOf( MapEl *element )
+{
+	/* Recurse left. */
+	if (element->left) {
+		deleteChildrenOf(element->left);
+
+		/* Delete left element and clear the link to it. */
+		delete element->left;
+		element->left = 0;
+	}
+
+	/* Recurse right. */
+	if (element->right) {
+		deleteChildrenOf(element->right);
+
+		/* Delete right element and clear the link to it (not the left one). */
+		delete element->right;
+		element->right = 0;
+	}
+}
+
+/* Rebalance from an element whose grandparent is unbalanced. Only call on an
+ * element that has a grandparent. Returns the great grand-parent (may be null). */
+MapEl *Map::rebalance(MapEl *n)
+{
+	long lheight, rheight;
+	MapEl *a, *b, *c;
+	MapEl *t1, *t2, *t3, *t4;
+
+	MapEl *p = n->parent; /* Parent (Non-NULL). */
+	MapEl *gp = p->parent; /* Grand-parent (Non-NULL). */
+	MapEl *ggp = gp->parent; /* Great grand-parent (may be NULL). */
+
+	if (gp->right == p)
+	{
+		/*  gp
+		 *   \      (p is the right child of gp)
+		 *    p
+		 */
+		if (p->right == n)
+		{
+			/*  gp
+			 *   \       (right-right case)
+			 *    p
+			 *     \     (n is the right child of p)
+			 *      n
+			 */
+			a = gp;
+			b = p;
+			c = n;
+			t1 = gp->left;
+			t2 = p->left;
+			t3 = n->left;
+			t4 = n->right;
+		}
+		else
+		{
+			/*  gp
+			 *     \     (right-left case)
+			 *       p
+			 *      /
+			 *     n
+			 */
+			a = gp;
+			b = n;
+			c = p;
+			t1 = gp->left;
+			t2 = n->left;
+			t3 = n->right;
+			t4 = p->right;
+		}
+	}
+	else
+	{
+		/*    gp
+		 *   /
+		 *  p
+		 */
+		if (p->right == n)
+		{
+			/*      gp
+			 *    /
+			 *  p
+			 *   \       (left-right case)
+			 *    n
+			 */
+			a = p;
+			b = n;
+			c = gp;
+			t1 = p->left;
+			t2 = n->left;
+			t3 = n->right;
+			t4 = gp->right;
+		}
+		else
+		{
+			/*      gp
+			 *     /
+			 *    p
+			 *   /
+			 *  n
+			 */
+			a = n;
+			b = p;
+			c = gp;
+			t1 = n->left;
+			t2 = n->right;
+			t3 = p->right;
+			t4 = gp->right;
+		}
+	}
+
+	/* Perform rotation: b becomes the subtree root with a on its left and c
+	 * on its right; t1..t4 are re-hung beneath a and c in that order. */
+
+	/* Tie b to the great grandparent. */
+	if ( ggp == 0 )
+		root = b;
+	else if ( ggp->left == gp )
+		ggp->left = b;
+	else
+		ggp->right = b;
+	b->parent = ggp;
+
+	/* Tie a as a leftchild of b. */
+	b->left = a;
+	a->parent = b;
+
+	/* Tie c as a rightchild of b. */
+	b->right = c;
+	c->parent = b;
+
+	/* Tie t1 as a leftchild of a. */
+	a->left = t1;
+	if ( t1 != 0 ) t1->parent = a;
+
+	/* Tie t2 as a rightchild of a. */
+	a->right = t2;
+	if ( t2 != 0 ) t2->parent = a;
+
+	/* Tie t3 as a leftchild of c. */
+	c->left = t3;
+	if ( t3 != 0 ) t3->parent = c;
+
+	/* Tie t4 as a rightchild of c. */
+	c->right = t4;
+	if ( t4 != 0 ) t4->parent = c;
+
+	/* The heights are all recalculated manually and the great
+	 * grand-parent is passed to recalcHeights() to ensure
+	 * the heights are correct up the tree.
+	 *
+	 * Note that recalcHeights() cuts out when it comes across
+	 * a height that hasn't changed.
+	 */
+
+	/* Fix height of a. */
+	lheight = a->left ? a->left->height : 0;
+	rheight = a->right ? a->right->height : 0;
+	a->height = (lheight > rheight ? lheight : rheight) + 1;
+
+	/* Fix height of c. */
+	lheight = c->left ? c->left->height : 0;
+	rheight = c->right ? c->right->height : 0;
+	c->height = (lheight > rheight ? lheight : rheight) + 1;
+
+	/* Fix height of b. */
+	lheight = a->height;
+	rheight = c->height;
+	b->height = (lheight > rheight ? lheight : rheight) + 1;
+
+	/* Fix height of b's parents. */
+	recalcHeights(ggp);
+	return ggp;
+}
+
+/* Recompute stored heights, starting at element and moving up via parent. */
+void Map::recalcHeights(MapEl *element)
+{
+	/* Each pass handles one element and then steps to its parent. A null
+	 * element means there is nothing to do. */
+	for ( MapEl *cur = element; cur != 0; cur = cur->parent ) {
+		/* A missing child contributes a height of zero. */
+		long leftH = cur->left ? cur->left->height : 0;
+		long rightH = cur->right ? cur->right->height : 0;
+
+		/* One more than the taller of the two subtrees. */
+		long fresh = ( leftH > rightH ? leftH : rightH ) + 1;
+
+		/* An unchanged height means no ancestor's height can change
+		 * either, so the walk stops right here. */
+		if ( fresh == cur->height )
+			return;
+
+		/* Otherwise store the new value and keep climbing. */
+		cur->height = fresh;
+	}
+}
+
+/* Finds the first element, going upward, whose grandparent is unbalanced. */
+MapEl *Map::findFirstUnbalGP(MapEl *element)
+{
+	long lheight, rheight, balanceProp;
+	MapEl *gp;
+	/* Don't do anything if we have no grandparent. */
+	if ( element == 0 || element->parent == 0 ||
+			element->parent->parent == 0 )
+		return 0;
+
+	/* Walk element and its grandparent upward in lock step. */
+	gp = element->parent->parent;
+	while ( gp != 0 )
+	{
+		lheight = gp->left ? gp->left->height : 0;
+		rheight = gp->right ? gp->right->height : 0;
+		balanceProp = lheight - rheight;
+		/* Unbalanced means the subtree heights differ by more than one. */
+		if ( balanceProp < -1 || balanceProp > 1 )
+			return element;
+
+		element = element->parent;
+		gp = gp->parent;
+	}
+	return 0;
+}
+
+
+/* Finds the first element that is unbalanced, searching from element upward. */
+MapEl *Map::findFirstUnbalEl(MapEl *element)
+{
+	/* A null start simply skips the loop and yields null. */
+	for ( MapEl *cur = element; cur != 0; cur = cur->parent ) {
+		/* Height of an absent subtree counts as zero. */
+		long leftH = 0, rightH = 0;
+		if ( cur->left != 0 )
+			leftH = cur->left->height;
+		if ( cur->right != 0 )
+			rightH = cur->right->height;
+
+		/* Balanced means the subtree heights differ by at most one. */
+		long diff = leftH - rightH;
+		if ( diff < -1 || diff > 1 )
+			return cur;
+	}
+
+	/* Reached the top without meeting an unbalanced element. */
+	return 0;
+}
+
+/* Replace an element in the tree with another element not in the tree. */
+void Map::replaceEl(MapEl *element, MapEl *replacement)
+{
+	MapEl *parent = element->parent,
+			*left = element->left,
+			*right = element->right;
+	/* The replacement adopts both children of element. */
+	replacement->left = left;
+	if (left)
+		left->parent = replacement;
+	replacement->right = right;
+	if (right)
+		right->parent = replacement;
+	/* Hook the replacement in under element's parent, or as the root. */
+	replacement->parent = parent;
+	if (parent)
+	{
+		if (parent->left == element)
+			parent->left = replacement;
+		else
+			parent->right = replacement;
+	}
+	else
+		root = replacement;
+	/* It sits in the same position, so it takes over the stored height. */
+	replacement->height = element->height;
+}
+
+/* Unhook element from the tree, leaving filler in the slot it occupied.
+ * Filler should be null or a child of element. Element's own pointers are
+ * not modified. */
+void Map::removeEl(MapEl *element, MapEl *filler)
+{
+	MapEl *up = element->parent;
+
+	/* Whatever pointed at element must now point at filler. With no
+	 * parent that is the root pointer. */
+	if ( up == 0 )
+		root = filler;
+	else if ( up->left == element )
+		up->left = filler;
+	else
+		up->right = filler;
+
+	/* A non-null filler moves up one level and needs its parent link
+	 * fixed to match. */
+	if ( filler != 0 )
+		filler->parent = up;
+}
+
+
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
new file mode 100644
index 00000000..54b55b23
--- /dev/null
+++ b/colm/parsedata.cpp
@@ -0,0 +1,1830 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <iomanip>
+#include <errno.h>
+#include <stdlib.h>
+#include <limits.h>
+#include <sstream>
+
+#include "colm.h"
+#include "lmparse.h"
+#include "parsedata.h"
+#include "parsetree.h"
+#include "mergesort.h"
+#include "redbuild.h"
+#include "pdacodegen.h"
+#include "fsmcodegen.h"
+#include "fsmrun.h"
+
+using namespace std;
+using std::ostringstream;
+
+char machineMain[] = "main";
+
+/* Minimize fsm after an operation, but only when that operation was the
+ * last one in its sequence (lastInSeq). Otherwise fsm is left untouched. */
+void afterOpMinimize( FsmGraph *fsm, bool lastInSeq )
+{
+	/* Intermediate results in a sequence are not minimized. */
+	if ( lastInSeq ) {
+		/* First clean up the graph. FsmGraph operations may leave these
+		 * lying around. There should be no dead end states. The subtract
+		 * intersection operators are the only places where they may be
+		 * created and those operators clean them up. */
+		fsm->removeUnreachableStates();
+		fsm->minimizePartition2();
+	}
+}
+
+/* Total number of out-transitions over every state in the fsm's state list. */
+int countTransitions( FsmGraph *fsm )
+{
+	int total = 0;
+
+	/* Follow the next links from the head of the list, summing as we go. */
+	for ( FsmState *st = fsm->stateList.head; st != 0; st = st->next )
+		total += st->outList.length();
+
+	return total;
+}
+
+Key makeFsmKeyHex( char *str, const InputLoc &loc, ParseData *pd )
+{
+	/* Parse a hex literal into a key. errno is reset first so that ERANGE from
+	 * strtoul can be detected. All shifts are done in unsigned long and only by
+	 * less than its width; anything else would be undefined behaviour. */
+	errno = 0;
+	unsigned int size = keyOps->alphType->size;
+	bool unusedBits = size < sizeof(unsigned long);
+
+	unsigned long ul = strtoul( str, 0, 16 );
+
+	if ( errno == ERANGE || ( unusedBits && ul >> (size * 8) ) ) {
+		error(loc) << "literal " << str << " overflows the alphabet type" << endl;
+		ul = unusedBits ? 1UL << (size * 8) : ULONG_MAX;
+	}
+
+	if ( unusedBits && keyOps->alphType->isSigned && ul >> (size * 8 - 1) )
+		ul |= ~0UL << (size * 8);   /* Sign extend across the whole long. */
+
+	return Key( (long)ul );
+}
+
+Key makeFsmKeyDec( char *str, const InputLoc &loc, ParseData *pd )
+{
+	/* Clear errno before converting so a range failure in strtoll can be
+	 * told apart from a stale value. */
+	errno = 0;
+	long long value = strtoll( str, 0, 10 );
+	bool rangeErr = ( errno == ERANGE );
+
+	/* Bounds of the alphabet type the literal has to fit into. */
+	long long lowest = keyOps->alphType->minVal;
+	long long highest = keyOps->alphType->maxVal;
+
+	if ( ( rangeErr && value < 0 ) || value < lowest ) {
+		/* Too small, report it and clamp to the lower bound. */
+		error(loc) << "literal " << str << " underflows the alphabet type" << endl;
+		value = lowest;
+	}
+	else if ( ( rangeErr && value > 0 ) || value > highest ) {
+		/* Too large, report it and clamp to the upper bound. */
+		error(loc) << "literal " << str << " overflows the alphabet type" << endl;
+		value = highest;
+	}
+
+	/* Hand the value over with the signedness of the alphabet type. */
+	return keyOps->alphType->isSigned ? Key( (long)value ) : Key( (unsigned long)value );
+}
+
+/* Convert an alphabet number produced by the parser into an fsm key (the int
+ * format used by the fsm graph). The conversion routines check that the number
+ * fits the alphabet type. */
+Key makeFsmKeyNum( char *str, const InputLoc &loc, ParseData *pd )
+{
+	/* A leading "0x" selects hex, everything else is treated as decimal. */
+	bool isHex = str[0] == '0' && str[1] == 'x';
+	if ( !isHex )
+		return makeFsmKeyDec( str, loc, pd );
+	return makeFsmKeyHex( str, loc, pd );
+}
+
+/* Build an fsm key (the int format used by the fsm graph) from a single
+ * character, converting according to the signed/unsigned property of the
+ * alphabet. */
+Key makeFsmKeyChar( char c, ParseData *pd )
+{
+	/* Unsigned alphabets take the character as an unsigned byte. */
+	if ( !keyOps->isSigned ) {
+		unsigned char byte = (unsigned char)c;
+		return Key( byte );
+	}
+
+	/* Signed alphabets take the char value as it is. */
+	return Key( c );
+}
+
+/* Fill result with fsm keys (the int format used by the fsm graph), one per
+ * character of data. Characters are read as signed or unsigned according to
+ * the alphabet. */
+void makeFsmKeyArray( Key *result, char *data, int len, ParseData *pd )
+{
+	/* Unsigned alphabet: view the data as unsigned bytes. */
+	if ( !keyOps->isSigned ) {
+		unsigned char *bytes = (unsigned char*) data;
+		for ( int pos = 0; pos < len; pos++ )
+			result[pos] = Key(bytes[pos]);
+		return;
+	}
+
+	/* Signed alphabet: use the chars directly. */
+	char *chars = data;
+	for ( int pos = 0; pos < len; pos++ )
+		result[pos] = Key(chars[pos]);
+}
+
+/* Like makeFsmKeyArray except the keys are inserted into a key set. When
+ * caseInsensitive is set, the other-case form of each letter is added too. */
+void makeFsmUniqueKeyArray( KeySet &result, char *data, int len, 
+		bool caseInsensitive, ParseData *pd )
+{
+	/* Each character is inserted into the result key set. */
+	if ( keyOps->isSigned ) {
+		/* Copy from a char star type. */
+		char *src = data;
+		for ( int si = 0; si < len; si++ ) {
+			Key key( src[si] );
+			result.insert( key );
+			if ( caseInsensitive ) {
+				if ( key.isLower() )
+					result.insert( key.toUpper() );
+				else if ( key.isUpper() )
+					result.insert( key.toLower() );
+			}
+		}
+	}
+	else {
+		/* Copy from an unsigned byte ptr type. */
+		unsigned char *src = (unsigned char*) data;
+		for ( int si = 0; si < len; si++ ) {
+			Key key( src[si] );
+			result.insert( key );
+			if ( caseInsensitive ) {
+				if ( key.isLower() )
+					result.insert( key.toUpper() );
+				else if ( key.isUpper() )
+					result.insert( key.toLower() );
+			}
+		}
+	}
+}
+
+FsmGraph *dotFsm( ParseData *pd )
+{
+	FsmGraph *graph = new FsmGraph();	/* Returned to the caller. */
+	graph->rangeFsm( keyOps->minKey, keyOps->maxKey );	/* minKey through maxKey. */
+	return graph;
+}
+
+FsmGraph *dotStarFsm( ParseData *pd )
+{
+	FsmGraph *graph = new FsmGraph();	/* Returned to the caller. */
+	graph->rangeStarFsm( keyOps->minKey, keyOps->maxKey );	/* minKey through maxKey. */
+	return graph;
+}
+
+/* Make a builtin machine. Only BT_Extend depends on the alphabet signedness. */
+FsmGraph *makeBuiltin( BuiltinMachine builtin, ParseData *pd )
+{
+	/* FsmGraph created to return. Stays null if no case below matches. */
+	FsmGraph *retFsm = 0;
+	bool isSigned = keyOps->isSigned;
+
+	switch ( builtin ) {
+	case BT_Any: {
+		/* All characters. */
+		retFsm = dotFsm( pd );
+		break;
+	}
+	case BT_Ascii: {
+		/* Ascii characters 0 to 127. */
+		retFsm = new FsmGraph();
+		retFsm->rangeFsm( 0, 127 );
+		break;
+	}
+	case BT_Extend: {
+		/* Ascii extended characters. This is the full byte range. Dependent
+		 * on signed vs. unsigned: -128..127 for a signed alphabet and
+		 * 0..255 for an unsigned one. */
+		if ( isSigned ) {
+			retFsm = new FsmGraph();
+			retFsm->rangeFsm( -128, 127 );
+		}
+		else {
+			retFsm = new FsmGraph();
+			retFsm->rangeFsm( 0, 255 );
+		}
+		break;
+	}
+	case BT_Alpha: {
+		/* Alpha [A-Za-z]. */
+		FsmGraph *upper = new FsmGraph(), *lower = new FsmGraph();
+		upper->rangeFsm( 'A', 'Z' );
+		lower->rangeFsm( 'a', 'z' );
+		upper->unionOp( lower );
+		upper->minimizePartition2();
+		retFsm = upper;
+		break;
+	}
+	case BT_Digit: {
+		/* Digits [0-9]. */
+		retFsm = new FsmGraph();
+		retFsm->rangeFsm( '0', '9' );
+		break;
+	}
+	case BT_Alnum: {
+		/* Alpha numerics [0-9A-Za-z]. */
+		FsmGraph *digit = new FsmGraph(), *lower = new FsmGraph();
+		FsmGraph *upper = new FsmGraph();
+		digit->rangeFsm( '0', '9' );
+		upper->rangeFsm( 'A', 'Z' );
+		lower->rangeFsm( 'a', 'z' );
+		digit->unionOp( upper );
+		digit->unionOp( lower );
+		digit->minimizePartition2();
+		retFsm = digit;
+		break;
+	}
+	case BT_Lower: {
+		/* Lower case characters. */
+		retFsm = new FsmGraph();
+		retFsm->rangeFsm( 'a', 'z' );
+		break;
+	}
+	case BT_Upper: {
+		/* Upper case characters. */
+		retFsm = new FsmGraph();
+		retFsm->rangeFsm( 'A', 'Z' );
+		break;
+	}
+	case BT_Cntrl: {
+		/* Control characters: 0 through 31, plus 127. */
+		FsmGraph *cntrl = new FsmGraph();
+		FsmGraph *highChar = new FsmGraph();
+		cntrl->rangeFsm( 0, 31 );
+		highChar->concatFsm( 127 );
+		cntrl->unionOp( highChar );
+		cntrl->minimizePartition2();
+		retFsm = cntrl;
+		break;
+	}
+	case BT_Graph: {
+		/* Graphical ascii characters [!-~]. */
+		retFsm = new FsmGraph();
+		retFsm->rangeFsm( '!', '~' );
+		break;
+	}
+	case BT_Print: {
+		/* Printable characters. Same as graph except includes space. */
+		retFsm = new FsmGraph();
+		retFsm->rangeFsm( ' ', '~' );
+		break;
+	}
+	case BT_Punct: {
+		/* Punctuation: the four ranges [!-/], [:-@], [[-`] and [{-~]. */
+		FsmGraph *range1 = new FsmGraph();
+		FsmGraph *range2 = new FsmGraph();
+		FsmGraph *range3 = new FsmGraph(); 
+		FsmGraph *range4 = new FsmGraph();
+		range1->rangeFsm( '!', '/' );
+		range2->rangeFsm( ':', '@' );
+		range3->rangeFsm( '[', '`' );
+		range4->rangeFsm( '{', '~' );
+		range1->unionOp( range2 );
+		range1->unionOp( range3 );
+		range1->unionOp( range4 );
+		range1->minimizePartition2();
+		retFsm = range1;
+		break;
+	}
+	case BT_Space: {
+		/* Whitespace: [\t\v\f\n\r ]. */
+		FsmGraph *cntrl = new FsmGraph();
+		FsmGraph *space = new FsmGraph();
+		cntrl->rangeFsm( '\t', '\r' );
+		space->concatFsm( ' ' );
+		cntrl->unionOp( space );
+		cntrl->minimizePartition2();
+		retFsm = cntrl;
+		break;
+	}
+	case BT_Xdigit: {
+		/* Hex digits [0-9A-Fa-f]. */
+		FsmGraph *digit = new FsmGraph();
+		FsmGraph *upper = new FsmGraph();
+		FsmGraph *lower = new FsmGraph();
+		digit->rangeFsm( '0', '9' );
+		upper->rangeFsm( 'A', 'F' );
+		lower->rangeFsm( 'a', 'f' );
+		digit->unionOp( upper );
+		digit->unionOp( lower );
+		digit->minimizePartition2();
+		retFsm = digit;
+		break;
+	}
+	case BT_Lambda: {
+		retFsm = new FsmGraph();
+		retFsm->lambdaFsm();
+		break;
+	}
+	case BT_Empty: {
+		retFsm = new FsmGraph();
+		retFsm->emptyFsm();
+		break;
+	}}
+
+	return retFsm;
+}
+
+/* True when this name inst, or any name inst beneath it, is referenced. */
+bool NameInst::anyRefsRec()
+{
+	if ( numRefs > 0 )
+		return true;
+	/* No refs here: ask each child subtree, stopping at the first hit. */
+	NameVect::Iter child = childVect;
+	while ( child.lte() ) {
+		if ( (*child)->anyRefsRec() )
+			return true;
+		child++;
+	}
+	return false;
+}
+
+/*
+ * ParseData
+ */
+
+/* Initialize the structure that will collect info during the parse of a
+ * machine. Counters and pointers get the starting values listed below. */
+ParseData::ParseData( const String &fileName, const String &sectionName, 
+			const InputLoc &sectionLoc, ostream &out )
+:	
+	nextPriorKey(0),
+	nextLocalErrKey(1),          /* 0 is reserved for global error actions. */
+	nextNameId(0),
+	alphTypeSet(false),
+	getKeyExpr(0),
+	accessExpr(0),
+	curStateExpr(0),
+	lowerNum(0),
+	upperNum(0),
+	fileName(fileName),
+	sectionName(sectionName),
+	sectionLoc(sectionLoc),
+	errorCount(0),
+	curActionOrd(0),
+	curPriorOrd(0),
+	nextEpsilonResolvedLink(0),
+	nextTokenId(1),
+	rootCodeBlock(0),
+	parserName(sectionName),
+	out(out),
+	access(0),
+	tokenStruct(0),
+	rootKlangEl(0),
+	eofKlangEl(0),
+	errorKlangEl(0),
+	defaultCharKlangEl(0),
+	rootRegion(0),
+	defaultRegion(0),
+	firstNonTermId(0),
+	prodIdIndex(0),
+	nextPatReplId(0),
+	nextGenericId(1),
+	nextFuncId(0),
+	loopCleanup(0),
+	nextObjectId(1),     /* 0 is reserved for no object. */
+	nextFrameId(0),
+	nextParserId(0),
+	nextLabelId(0)
+{
+}
+
+/* Clean up the data collected during a parse. Only the action list is emptied here. */
+ParseData::~ParseData()
+{
+	/* Delete all the nodes in the action list. Per the original note this
+	 * also deallocates the string data that represents the actions. */
+	actionList.empty();
+}
+
+/* Create a new name instantiation as a child of the current scope. It always
+ * goes on the child vector; the name map only gets it when data is non-null. */
+NameInst *ParseData::addNameInst( const InputLoc &loc, char *data, bool isLabel )
+{
+	/* Create the name instantiation object with the next free id and insert it. */
+	NameInst *newNameInst = new NameInst( loc, curNameInst, data, nextNameId++, isLabel );
+	curNameInst->childVect.append( newNameInst );
+	if ( data != 0 )
+		curNameInst->children.insertMulti( data, newNameInst );
+	return newNameInst;
+}
+
+void ParseData::initNameWalk( NameInst *rootName )
+{
+	curNameInst = rootName;	/* The walk starts at the given root scope... */
+	curNameChild = 0;	/* ...positioned at its first child. */
+}
+
+/* Goes into the next child scope. The number of the child is already set up.
+ * We need this for the synchronous name tree and parse tree walk to work
+ * properly. It is reset on entry into a scope and advanced on popping of a
+ * scope. A call to enterNameScope should be accompanied by a corresponding
+ * popNameScope. Returns the saved state to hand to popNameScope. */
+NameFrame ParseData::enterNameScope( bool isLocal, int numScopes )
+{
+	/* Save off the current data. */
+	NameFrame retFrame;
+	retFrame.prevNameInst = curNameInst;
+	retFrame.prevNameChild = curNameChild;
+	retFrame.prevLocalScope = localNameScope;
+
+	/* Enter into the new name scope, descending numScopes levels. */
+	for ( int i = 0; i < numScopes; i++ ) {
+		curNameInst = curNameInst->childVect[curNameChild];
+		curNameChild = 0;
+	}
+	/* A local scope also becomes the scope local names are recorded against. */
+	if ( isLocal )
+		localNameScope = curNameInst;
+
+	return retFrame;
+}
+
+/* Return from a child scope to its parent. The frame must be the one that
+ * the matching enterNameScope call returned. The child cursor is restored
+ * and advanced by one so the walk continues with the next sibling. */
+void ParseData::popNameScope( const NameFrame &frame )
+{
+	localNameScope = frame.prevLocalScope;
+	curNameChild = frame.prevNameChild + 1;
+	curNameInst = frame.prevNameInst;
+}
+
+/* Restore the walk state saved in frame exactly as it was. Unlike
+ * popNameScope, the child cursor is not advanced. */
+void ParseData::resetNameScope( const NameFrame &frame )
+{
+	localNameScope = frame.prevLocalScope;
+	curNameChild = frame.prevNameChild;
+	curNameInst = frame.prevNameInst;
+}
+
+
+/* Count one more use of every name referenced from the current name scope.
+ * A name whose use count has caught up with its reference count is no longer
+ * needed, so its entry point is unset in graph. */
+void ParseData::unsetObsoleteEntries( FsmGraph *graph )
+{
+	NameVect::Iter ref = curNameInst->referencedNames;
+	while ( ref.lte() ) {
+		NameInst *used = *ref;
+		used->numUses += 1;
+
+		/* All references consumed: drop the corresponding entry. */
+		if ( used->numUses == used->numRefs ) {
+			assert( graph->entryPoints.find( used->id ) != 0 );
+			graph->unsetEntry( used->id );
+		}
+
+		ref++;
+	}
+}
+
+/* Breadth-first search of the name tree below refFrom for children named
+ * data. Every match at every depth is collected; the search does not stop at
+ * the first hit. When recLabelsOnly is set, only children that are labels
+ * are descended into. Returns the (possibly empty) set of matches. */
+NameSet ParseData::resolvePart( NameInst *refFrom, const char *data, bool recLabelsOnly )
+{
+	/* Work queue for the breadth-first walk, seeded with the start node. */
+	NameInstList pending;
+	pending.append( refFrom );
+
+	NameSet found;
+	while ( pending.length() > 0 ) {
+		NameInst *scope = pending.detachFirst();
+
+		/* Collect every child of this scope that carries the wanted name. */
+		NameMapEl *first, *last;
+		if ( scope->children.findMulti( data, first, last ) ) {
+			for ( NameMapEl *el = first; el <= last; el++ )
+				found.insert( el->value );
+		}
+
+		/* Queue the children so that the next level is searched too. */
+		for ( NameVect::Iter child = scope->childVect; child.lte(); child++ ) {
+			if ( recLabelsOnly && !(*child)->isLabel )
+				continue;
+			pending.append( *child );
+		}
+	}
+
+	/* Queue exhausted, hand back whatever was collected. */
+	return found;
+}
+
+/* Resolve the components of nameRef from position namePos onwards, starting
+ * the search at refFrom. Matches for the final component are added to
+ * result; matches for earlier components become the starting points for
+ * resolving the rest of the name. */
+void ParseData::resolveFrom( NameSet &result, NameInst *refFrom, 
+		const NameRef &nameRef, int namePos )
+{
+	/* Find everything matching this component below refFrom. */
+	NameSet matches = resolvePart( refFrom, nameRef[namePos], false );
+
+	const int nextPos = namePos + 1;
+	if ( nextPos >= nameRef.length() ) {
+		/* This was the last component, its matches are final results. */
+		result.insert( matches );
+		return;
+	}
+
+	/* More components follow, continue the search from every match. */
+	for ( NameSet::Iter match = matches; match.lte(); match++ )
+		resolveFrom( result, *match, nameRef, nextPos );
+}
+
+/* Write out the text of a token. */
+ostream &operator<<( ostream &out, const Token &token )
+{
+	return out << token.data;
+}
+
+/* Write out a name reference with its components separated by "::". A null
+ * first component is printed as a leading "::" only. */
+ostream &operator<<( ostream &out, const NameRef &nameRef )
+{
+	int pos = 0;
+	if ( nameRef[0] == 0 ) {
+		out << "::";
+		pos = 1;
+	}
+
+	/* First printed component carries no separator. */
+	out << nameRef[pos];
+	pos += 1;
+
+	while ( pos < nameRef.length() ) {
+		out << "::" << nameRef[pos];
+		pos += 1;
+	}
+	return out;
+}
+
+/* Write out the qualified name of a name instantiation: each ancestor below
+ * the root and then the instance itself, every part prefixed with "::".
+ * Parts without a name are written as "<ANON>". */
+ostream &operator<<( ostream &out, const NameInst &nameInst )
+{
+	/* Count the ancestors, root included. */
+	int depth = 0;
+	for ( NameInst *up = nameInst.parent; up != 0; up = up->parent )
+		depth += 1;
+
+	/* Lay the ancestors out root-first. */
+	NameInst **chain = new NameInst*[depth];
+	NameInst *walk = nameInst.parent;
+	for ( int slot = depth; slot > 0; walk = walk->parent )
+		chain[--slot] = walk;
+
+	/* Index zero is the root, which is not written. */
+	for ( int i = 1; i < depth; i++ ) {
+		const char *part = chain[i]->name;
+		out << "::" << ( part != 0 ? part : "<ANON>" );
+	}
+
+	/* Finish with the instance's own name and release the scratch array. */
+	const char *own = nameInst.name;
+	out << "::" << ( own != 0 ? own : "<ANON>" );
+	delete[] chain;
+	return out;
+}
+
+/* Ordering of name instantiations by source location: line first, column as
+ * the tie breaker. */
+struct CmpNameInstLoc
+{
+	static int compare( const NameInst *ni1, const NameInst *ni2 )
+	{
+		if ( ni1->loc.line != ni2->loc.line )
+			return ni1->loc.line < ni2->loc.line ? -1 : 1;
+		if ( ni1->loc.col != ni2->loc.col )
+			return ni1->loc.col < ni2->loc.col ? -1 : 1;
+		return 0;
+	}
+};
+
+void errorStateLabels( const NameSet &resolved )
+{
+	MergeSort<NameInst*, CmpNameInstLoc> mergeSort;
+	mergeSort.sort( resolved.data, resolved.length() );
+	for ( NameSet::Iter res = resolved; res.lte(); res++ )
+		error((*res)->loc) << "  -> " << **res << endl;
+}
+
+
+/* Add one reference to every direct child of rootName. The extra reference
+ * causes the entry point to survive to the end of the graph generating
+ * walk. */
+void ParseData::referenceRegions( NameInst *rootName )
+{
+	NameVect::Iter inst = rootName->childVect;
+	while ( inst.lte() ) {
+		(*inst)->numRefs += 1;
+		inst++;
+	}
+}
+
+/* Walk the name tree rooted at from and record every node in nameIndex at
+ * the slot given by its id. */
+void ParseData::fillNameIndex( NameInst **nameIndex, NameInst *from )
+{
+	nameIndex[from->id] = from;
+
+	/* The implicit final state comes first, when there is one. */
+	NameInst *implicitFinal = from->final;
+	if ( implicitFinal != 0 )
+		fillNameIndex( nameIndex, implicitFinal );
+
+	/* Then every child subtree. */
+	NameVect::Iter child = from->childVect;
+	while ( child.lte() ) {
+		fillNameIndex( nameIndex, *child );
+		child++;
+	}
+}
+
+/* Allocate and fill an id-indexed array of the name instantiations in the
+ * tree under rootName. The array has nextNameId+1 slots and is zeroed before
+ * filling, so the last slot stays a null pointer that terminates the list.
+ * The caller receives ownership of the array. */
+NameInst **ParseData::makeNameIndex( NameInst *rootName )
+{
+	NameInst **index = new NameInst*[nextNameId+1];
+	memset( index, 0, sizeof(NameInst*)*(nextNameId+1) );
+
+	fillNameIndex( index, rootName );
+	return index;
+}
+
+/* Register a builtin machine under name in the root namespace's graph
+ * dictionary, wrapping it in the Expression / Join / JoinOrLm / VarDef chain
+ * that a machine definition is made of. */
+void ParseData::createBuiltin( const char *name, BuiltinMachine builtin )
+{
+	VarDef *definition = new VarDef( name,
+			new JoinOrLm( new Join( new Expression( builtin ) ) ) );
+	rootNamespace->graphDict.insert( new GraphDictEl( name, definition ) );
+}
+
+/* Initialize the graph dict with the builtin machines. "null" and "zlen"
+ * both name the lambda machine. */
+void ParseData::initGraphDict( )
+{
+	static const struct {
+		const char *name;
+		BuiltinMachine machine;
+	} builtins[] = {
+		{ "any",    BT_Any },
+		{ "ascii",  BT_Ascii },
+		{ "extend", BT_Extend },
+		{ "alpha",  BT_Alpha },
+		{ "digit",  BT_Digit },
+		{ "alnum",  BT_Alnum },
+		{ "lower",  BT_Lower },
+		{ "upper",  BT_Upper },
+		{ "cntrl",  BT_Cntrl },
+		{ "graph",  BT_Graph },
+		{ "print",  BT_Print },
+		{ "punct",  BT_Punct },
+		{ "space",  BT_Space },
+		{ "xdigit", BT_Xdigit },
+		{ "null",   BT_Lambda },
+		{ "zlen",   BT_Lambda },
+		{ "empty",  BT_Empty }
+	};
+
+	/* Registration order follows the table order. */
+	const int numBuiltins = sizeof(builtins) / sizeof(builtins[0]);
+	for ( int b = 0; b < numBuiltins; b++ )
+		createBuiltin( builtins[b].name, builtins[b].machine );
+}
+
+/* Set the alphabet type from a two-word type name. The first host type whose
+ * two name parts equal s1 and s2 is selected. Returns false when no host
+ * type matches; alphTypeSet is raised either way. */
+bool ParseData::setAlphType( char *s1, char *s2 )
+{
+	alphTypeSet = true;
+
+	for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
+		HostType *candidate = hostLang->hostTypes + i;
+
+		if ( strcmp( s1, candidate->data1 ) != 0 )
+			continue;
+
+		/* A one-word host type cannot match a two-word name. */
+		if ( candidate->data2 == 0 || strcmp( s2, candidate->data2 ) != 0 )
+			continue;
+
+		userAlphType = candidate;
+		return true;
+	}
+
+	return false;
+}
+
+/* Set the alphabet type from a one-word type name. The first host type that
+ * has no second name part and whose first part equals s1 is selected.
+ * Returns false when no host type matches; alphTypeSet is raised either
+ * way. */
+bool ParseData::setAlphType( char *s1 )
+{
+	alphTypeSet = true;
+
+	for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
+		HostType *candidate = hostLang->hostTypes + i;
+
+		if ( strcmp( s1, candidate->data1 ) != 0 )
+			continue;
+
+		/* Two-word host types are not eligible here. */
+		if ( candidate->data2 != 0 )
+			continue;
+
+		userAlphType = candidate;
+		return true;
+	}
+
+	return false;
+}
+
+/* Initialize the key operators object that will be referenced by all fsms
+ * created: pick the alphabet type, apply an explicit key range if one was
+ * given and place the first condition key just past the maximum key. */
+void ParseData::initKeyOps( )
+{
+	/* Signedness and bounds come from the alphabet type. The user's choice
+	 * wins over the host language default. */
+	HostType *alphType = hostLang->defaultAlphType;
+	if ( alphTypeSet )
+		alphType = userAlphType;
+	thisKeyOps.setAlphType( alphType );
+
+	/* If ranges are given then interpret them in the alphabet type. */
+	if ( lowerNum != 0 ) {
+		thisKeyOps.minKey = makeFsmKeyNum( lowerNum, rangeLowLoc, this );
+		thisKeyOps.maxKey = makeFsmKeyNum( upperNum, rangeHighLoc, this );
+	}
+
+	thisCondData.nextCondKey = thisKeyOps.maxKey;
+	thisCondData.nextCondKey.increment();
+}
+
+/* Debug print of a name instantiation and its subtree to cerr. Each node is
+ * written on its own line, indented by two spaces per level, with its id and
+ * reference count. */
+void ParseData::printNameInst( NameInst *nameInst, int level )
+{
+	int indent = level;
+	while ( indent-- > 0 )
+		cerr << "  ";
+
+	const char *label = nameInst->name != 0 ? nameInst->name : "<ANON>";
+	cerr << label << 
+			"  id: " << nameInst->id << 
+			"  refs: " << nameInst->numRefs << endl;
+
+	NameVect::Iter child = nameInst->childVect;
+	while ( child.lte() ) {
+		printNameInst( *child, level+1 );
+		child++;
+	}
+}
+
+/* Remove duplicate actions from an action table. The first occurrence of
+ * each action value is kept and every later entry with the same value is
+ * removed. */
+void ParseData::removeDups( ActionTable &table )
+{
+	for ( int keep = 0; keep < table.length(); keep++ ) {
+		int scan = keep + 1;
+		while ( scan < table.length() ) {
+			if ( table[scan].value != table[keep].value ) {
+				scan += 1;
+				continue;
+			}
+
+			/* Removal shifts the next entry into scan, don't advance. */
+			table.vremove( scan );
+		}
+	}
+}
+
+/* Remove duplicates from the action tables of every state in graph: the
+ * tables on outgoing transitions plus the to-state, from-state and eof
+ * tables. This should be called once all actions have been transferred to
+ * their final resting place. */
+void ParseData::removeActionDups( FsmGraph *graph )
+{
+	StateList::Iter st = graph->stateList;
+	while ( st.lte() ) {
+		/* Tables on the outgoing transitions. */
+		TransList::Iter tr = st->outList;
+		while ( tr.lte() ) {
+			removeDups( tr->actionTable );
+			tr++;
+		}
+
+		/* Tables on the state itself. */
+		removeDups( st->toStateActionTable );
+		removeDups( st->fromStateActionTable );
+		removeDups( st->eofActionTable );
+
+		st++;
+	}
+}
+
+/* Create an action with the given name and inline list, located at line 1,
+ * column 1, and append it to the action list. Returns the new action. */
+Action *ParseData::newAction( const String &name, InlineList *inlineList )
+{
+	InputLoc loc;
+	loc.col = 1;
+	loc.line = 1;
+
+	Action *created = new Action( loc, name, inlineList );
+	actionList.append( created );
+	return created;
+}
+
+/* Create the actions that longest-match scanning relies on (initact,
+ * tokstart, tokend) and reserve an action ordering number for each. Nothing
+ * is created when there are no regions. */
+void ParseData::initLongestMatchData()
+{
+	if ( regionList.length() <= 0 )
+		return;
+
+	/* The initActId action gives act a default value. */
+	InlineList *initActItems = new InlineList;
+	initActItems->append( new InlineItem( InputLoc(), InlineItem::LmInitAct ) );
+	initActId = newAction( "initact", initActItems );
+	initActId->isLmAction = true;
+
+	/* The setTokStart action sets tokstart. */
+	InlineList *tokStartItems = new InlineList;
+	tokStartItems->append( new InlineItem( InputLoc(), InlineItem::LmSetTokStart ) );
+	setTokStart = newAction( "tokstart", tokStartItems );
+	setTokStart->isLmAction = true;
+
+	/* The setTokEnd action sets tokend. */
+	InlineList *tokEndItems = new InlineList;
+	tokEndItems->append( new InlineItem( InputLoc(), InlineItem::LmSetTokEnd ) );
+	setTokEnd = newAction( "tokend", tokEndItems );
+	setTokEnd->isLmAction = true;
+
+	/* The actions also need an ordering: ahead of all user action
+	 * embeddings. */
+	initActIdOrd = curActionOrd++;
+	setTokStartOrd = curActionOrd++;
+	setTokEndOrd = curActionOrd++;
+}
+
+/* Wrap up the construction of a graph: make entry points deterministic,
+ * transfer error actions, drop duplicate actions and unreachable states,
+ * clear the ordering and priority data that is no longer needed and finally
+ * minimize and compress. */
+void ParseData::finishGraphBuild( FsmGraph *graph )
+{
+	/* Labels that are still around are referenced only by gotos and calls.
+	 * Any of them pointing to multiple states must be turned into
+	 * deterministic entry points. */
+	graph->deterministicEntry();
+
+	/*
+	 * All state construction is now complete.
+	 */
+
+	/* Transfer global error actions. */
+	StateList::Iter st = graph->stateList;
+	while ( st.lte() ) {
+		graph->transferErrorActions( st, 0 );
+		st++;
+	}
+
+	removeActionDups( graph );
+
+	/* Remove unreachable states. There should be no dead end states. The
+	 * subtract and intersection operators are the only places where they may
+	 * be created and those operators clean them up. */
+	graph->removeUnreachableStates();
+
+	/* No more fsm operations are to be done. Action ordering numbers and
+	 * transition priorities are of no further use and would only hinder
+	 * minimization, so clear both. */
+	graph->nullActionKeys();
+	graph->clearAllPriorities();
+
+	/* Minimize here even if we minimized at every op. Now that function
+	 * keys have been cleared we may get a more minimal fsm. */
+	graph->minimizePartition2();
+	graph->compressTransitions();
+}
+
+/* Debug print to cerr of the name tree below rootName. The root itself is
+ * not printed; its children start at indent level zero. */
+void ParseData::printNameTree( NameInst *rootName )
+{
+	cerr << "name tree:" << endl;
+
+	NameVect::Iter child = rootName->childVect;
+	while ( child.lte() ) {
+		printNameInst( *child, 0 );
+		child++;
+	}
+}
+
+/* Debug print to cerr of a name index, one "slot: name" line per entry.
+ * Printing stops at the first null pointer, which terminates the index. */
+void ParseData::printNameIndex( NameInst **nameIndex )
+{
+	cerr << "name index:" << endl;
+
+	for ( int ni = 0; nameIndex[ni] != 0; ni++ ) {
+		NameInst *entry = nameIndex[ni];
+		cerr << ni << ": ";
+		cerr << ( entry->name != 0 ? entry->name : "<ANON>" ) << endl;
+	}
+}
+
+/* Build the name tree for a single join. Name ids restart at zero and the
+ * anonymous root takes the first one. Returns the root of the new tree. */
+NameInst *ParseData::makeJoinNameTree( Join *join )
+{
+	nextNameId = 0;
+	NameInst *root = new NameInst( InputLoc(), 0, 0, nextNameId++, false );
+
+	/* Let the join add its names beneath the root. */
+	initNameWalk( root );
+	join->makeNameTree( this );
+
+	return root;
+}
+
+
+/* Build the name tree covering every entry of the instance list. Name ids
+ * restart at zero and the anonymous root takes the first one. Returns the
+ * root of the new tree. */
+NameInst *ParseData::makeNameTree()
+{
+	nextNameId = 0;
+	NameInst *root = new NameInst( InputLoc(), 0, 0, nextNameId++, false );
+
+	/* Each instance adds its names beneath the root, in list order. */
+	initNameWalk( root );
+	GraphList::Iter glel = instanceList;
+	while ( glel.lte() ) {
+		glel->value->makeNameTree( glel->loc, this );
+		glel++;
+	}
+
+	return root;
+}
+
+
+/* Build the finished graph for a single join: make the name tree and name
+ * index, resolve name references, walk the parse tree to construct the
+ * graph and wrap up the construction. The name tree root and the name index
+ * are attached to the graph that is returned. */
+FsmGraph *ParseData::makeJoin( Join *join )
+{
+	/* Name tree and supporting data structures. */
+	NameInst *root = makeJoinNameTree( join );
+	NameInst **index = makeNameIndex( root );
+
+	/* Resolve name references in the tree. */
+	initNameWalk( root );
+	join->resolveNameRefs( this );
+
+	/* Restart the name walk and build the graph from the parse tree. */
+	initNameWalk( root );
+	FsmGraph *graph = join->walk( this );
+
+	/* Wrap up the construction. */
+	finishGraphBuild( graph );
+
+	graph->nameIndex = index;
+	graph->rootName = root;
+	return graph;
+}
+
+/* Build one graph per entry of the instance list and combine them all into
+ * the first one. The name tree root and the name index are attached to the
+ * combined graph, and lmRequiresErrorState is raised on it when any token
+ * region has lmSwitchHandlesError set. The instance list must not be
+ * empty. */
+FsmGraph *ParseData::makeAllRegions()
+{
+	/* Build the name tree and supporting data structures. */
+	NameInst *rootName = makeNameTree( );
+	NameInst **nameIndex = makeNameIndex( rootName );
+
+	/* Resolve name references in the tree. */
+	initNameWalk( rootName );
+	for ( GraphList::Iter glel = instanceList; glel.lte(); glel++ )
+		glel->value->resolveNameRefs( this );
+
+	/* Resolve the implicit name references to the instantiations. */
+	referenceRegions( rootName );
+
+	int numGraphs = 0;
+	FsmGraph **graphs = new FsmGraph*[instanceList.length()];
+
+	/* Make all the instantiations. */
+	initNameWalk( rootName );
+	for ( GraphList::Iter glel = instanceList; glel.lte();  glel++ ) {
+		/* Build the graph from a walk of the parse tree. */
+		FsmGraph *newGraph = glel->value->walk( this );
+
+		/* Wrap up the construction. */
+		finishGraphBuild( newGraph );
+
+		/* Save off the new graph. */
+		graphs[numGraphs++] = newGraph;
+	}
+
+	/* NOTE: If putting in minimization here we need to include eofTarget
+	 * into the minimization algorithm. It is currently set by the longest
+	 * match operator and not considered anywhere else. */
+
+	/* The combination below reads graphs[0] and passes numGraphs-1, which is
+	 * only meaningful when at least one graph was built. Make that
+	 * precondition explicit rather than reading an uninitialized slot. */
+	assert( numGraphs > 0 );
+
+	/* Add all the other graphs into the first. */
+	FsmGraph *all = graphs[0];
+	all->globOp( graphs+1, numGraphs-1 );
+	delete[] graphs;
+
+	/* Go through all the token regions and check for lmRequiresErrorState. */
+	for ( RegionList::Iter reg = regionList; reg.lte(); reg++ ) {
+		if ( reg->lmSwitchHandlesError )
+			all->lmRequiresErrorState = true;
+	}
+
+	all->rootName = rootName;
+	all->nameIndex = nameIndex;
+
+	return all;
+}
+
+/* Walk the items of inlineList on behalf of action, recursing into the
+ * actions of longest-match items and into child item lists. */
+void ParseData::analyzeAction( Action *action, InlineList *inlineList )
+{
+	/* FIXME: Actions used as conditions should be very constrained. */
+	for ( InlineList::Iter item = *inlineList; item.lte(); item++ ) {
+		//if ( item->type == InlineItem::Call || item->type == InlineItem::CallExpr )
+		//	action->anyCall = true;
+
+		switch ( item->type ) {
+			case InlineItem::LmSwitch: {
+				/* Recurse into the action of every token def in the region. */
+				TokenRegion *region = item->tokenRegion;
+				TokenDefList::Iter def = region->tokenDefList;
+				while ( def.lte() ) {
+					if ( def->action != 0 )
+						analyzeAction( action, def->action->inlineList );
+					def++;
+				}
+				break;
+			}
+			case InlineItem::LmOnLast:
+			case InlineItem::LmOnNext:
+			case InlineItem::LmOnLagBehind: {
+				/* Recurse into the action of the one longest-match part. */
+				TokenDef *part = item->longestMatchPart;
+				if ( part->action != 0 )
+					analyzeAction( action, part->action->inlineList );
+				break;
+			}
+			default:
+				break;
+		}
+
+		if ( item->children != 0 )
+			analyzeAction( action, item->children );
+	}
+}
+
+/* Analyze every action in the action list, then count how often actions are
+ * referenced from graph: from transitions, from the to-state, from-state and
+ * eof tables, and as conditions. */
+void ParseData::analyzeGraph( FsmGraph *graph )
+{
+	for ( ActionList::Iter act = actionList; act.lte(); act++ )
+		analyzeAction( act, act->inlineList );
+
+	for ( StateList::Iter state = graph->stateList; state.lte(); state++ ) {
+		/* References from the transition list. */
+		for ( TransList::Iter tr = state->outList; tr.lte(); tr++ ) {
+			for ( ActionTable::Iter ref = tr->actionTable; ref.lte(); ref++ )
+				ref->value->numTransRefs += 1;
+		}
+
+		/* References from the tables on the state itself. */
+		for ( ActionTable::Iter ref = state->toStateActionTable; ref.lte(); ref++ )
+			ref->value->numToStateRefs += 1;
+
+		for ( ActionTable::Iter ref = state->fromStateActionTable; ref.lte(); ref++ )
+			ref->value->numFromStateRefs += 1;
+
+		for ( ActionTable::Iter ref = state->eofActionTable; ref.lte(); ref++ )
+			ref->value->numEofRefs += 1;
+
+		/* References as conditions. */
+		for ( StateCondList::Iter cond = state->stateCondList; cond.lte(); cond++ ) {
+			for ( CondSet::Iter member = cond->condSpace->condSet; member.lte(); member++ )
+				(*member)->numCondRefs += 1;
+		}
+	}
+}
+
+/* Make the final fsm graph, from join when one is given and from all the
+ * regions otherwise. Returns null when errors have been recorded. On success
+ * the graph has been analyzed, given an error state if it needs one and had
+ * its states ordered and numbered. */
+FsmGraph *ParseData::makeFsmGraph( Join *join )
+{
+	/* Make the graph, do minimization. */
+	FsmGraph *fsmGraph;
+	if ( join != 0 )
+		fsmGraph = makeJoin( join );
+	else
+		fsmGraph = makeAllRegions();
+
+	/* If any errors have occurred in the input file then don't write
+	 * anything. */
+	if ( gblErrorCount > 0 )
+		return 0;
+
+	analyzeGraph( fsmGraph );
+
+	/* An error state is added when the longest match operator requires one
+	 * or when the graph reports having error transitions. */
+	const bool needErrState = fsmGraph->lmRequiresErrorState || 
+			fsmGraph->hasErrorTrans();
+	if ( needErrState )
+		fsmGraph->errState = fsmGraph->addState();
+
+	/* State numbers need to be assigned such that all final states have a
+	 * larger state id number than all non-final states. This enables the
+	 * first_final mechanism to function correctly. We also want states to be
+	 * ordered in a predictable fashion. So we first apply a depth-first
+	 * search, then do a stable sort by final state status, then assign
+	 * numbers. */
+	fsmGraph->depthFirstOrdering();
+	fsmGraph->sortStatesByFinal();
+	fsmGraph->setStateNumbers( 0 );
+
+	return fsmGraph;
+}
+
+/* Create the default namespace and the default scanner region. The region
+ * is registered as a machine instance in the root namespace's graph dict and
+ * receives a single token definition that matches any one character. */
+void ParseData::createDefaultScanner()
+{
+	/* Value-initialize the location. It is handed to the token definition
+	 * below and must not carry indeterminate contents. */
+	InputLoc loc = InputLoc();
+
+	const char *name = "___DEFAULT_SCANNER";
+
+	/* Create the default namespace. */
+	defaultNamespace = new Namespace( InputLoc(), name,
+			namespaceList.length(), 0 );
+	namespaceList.append( defaultNamespace );
+
+	/* Create a scanner which will be used when no other scanner can be
+	 * figured out. It returns single characters. */
+	defaultRegion = new TokenRegion( InputLoc(), name, 
+			regionList.length(), 0 );
+	regionList.append( defaultRegion );
+	JoinOrLm *joinOrLm = new JoinOrLm( defaultRegion );
+
+	/* Insert the machine definition into the graph dictionary. */
+	GraphDictEl *newEl = rootNamespace->graphDict.insert( name );
+	assert( newEl != 0 );
+	newEl->value = new VarDef( name, joinOrLm );
+	newEl->isInstance = true;
+	instanceList.append( newEl );
+
+	/* Now create the one and only token -> "<chr>" / any /  */
+	name = "___DEFAULT_SCANNER_CHR";
+	defaultCharKlangEl = getKlangEl( this, defaultNamespace, 
+			name, KlangEl::Term );
+	assert( defaultCharKlangEl != 0 );
+	assert( defaultCharKlangEl->type == KlangEl::Term );
+
+	Join *join = new Join( new Expression( BT_Any ) );
+		
+	TokenDef *tokenDef = new TokenDef( join, defaultCharKlangEl, loc, 
+			nextTokenId++, rootNamespace, defaultRegion );
+	defaultRegion->tokenDefList.append( tokenDef );
+	defaultCharKlangEl->tokenDef = tokenDef;
+}
+
+/* Resolve a literal factor to the language element of the token that
+ * defines the literal. The literal text is first interpreted (escape
+ * sequences processed, quotes removed) and then looked up in the literal
+ * dictionary of the namespace the factor is qualified into. Both a missing
+ * namespace and an unknown literal are reported at the factor's location. */
+void ParseData::resolveLiteralFactor( PdaFactor *fact )
+{
+	/* Interpret escape sequences and remove quotes. */
+	bool unusedCI;
+	String interp;
+	prepareLitString( interp, unusedCI, fact->literal->token.data, 
+			fact->literal->token.loc );
+
+	//cerr << "resolving literal: " << fact->literal->token << endl;
+
+	/* Look for the namespace the literal is qualified into. */
+	Namespace *nspace = fact->nspaceQual->getQual( this );
+
+	if ( nspace == 0 )
+		error(fact->loc) << "do not have region for resolving literal" << endp;
+
+	/* Report an unknown literal through error(), with a source location,
+	 * the same way the namespace failure above is reported. */
+	LiteralDictEl *ldel = nspace->literalDict.find( interp );
+	if ( ldel == 0 ) {
+		error(fact->loc) << "could not resolve literal: " << 
+				fact->literal->token << endp;
+	}
+
+	TokenDef *tokenDef = ldel->value->tokenDef;
+	fact->langEl = tokenDef->token;
+}
+
+/* Resolve a reference factor to a language element in the namespace it is
+ * qualified into. A plain reference links straight to the referenced
+ * element. An opt or repeat reference links to a generated non-terminal
+ * ("_opt_<name>" or "_repeat_<name>"), which is created together with its
+ * two productions the first time it is needed and reused afterwards. */
+void ParseData::resolveReferenceFactor( PdaFactor *fact )
+{
+	/* Look for the namespace the reference is qualified into. */
+	Namespace *nspace = fact->nspaceQual->getQual( this );
+	if ( nspace == 0 )
+		error(fact->loc) << "do not have namespace for resolving reference" << endp;
+
+	fact->nspace = nspace;
+
+	/* Look up the language element in the namespace. */
+	KlangEl *langEl = getKlangEl( this, nspace, fact->refName, KlangEl::Unknown );
+
+	if ( !fact->opt && !fact->repeat ) {
+		/* Neither opt nor repeat. Link to the language element. */
+		fact->langEl = langEl;
+		return;
+	}
+
+	if ( fact->opt ) {
+		/* The factor is an opt: find or create the opt element and link the
+		 * factor to it. */
+		String optName( 32, "_opt_%s", fact->refName.data );
+
+		SymbolMapEl *existing = nspace->symbolMap.find( optName );
+		if ( existing != 0 ) {
+			fact->langEl = existing->value;
+			return;
+		}
+
+		KlangEl *optEl = getKlangEl( this, nspace, optName, KlangEl::NonTerm );
+		optEl->type = KlangEl::NonTerm;
+		optEl->isOpt = true;
+
+		/* First production of the opt: the referenced element. */
+		ProdElList *presentEls = new ProdElList;
+		PdaFactor *item = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+				fact->refName, 0, false, false );
+		presentEls->append( item );
+
+		Definition *presentDef = new Definition( InputLoc(),
+				optEl, presentEls, false, 0,
+				prodList.length(), Definition::Production );
+		optEl->defList.append( presentDef );
+		prodList.append( presentDef );
+
+		/* Second production of the opt: empty. */
+		ProdElList *absentEls = new ProdElList;
+
+		Definition *absentDef = new Definition( InputLoc(),
+				optEl, absentEls, false, 0,
+				prodList.length(), Definition::Production );
+		optEl->defList.append( absentDef );
+		prodList.append( absentDef );
+
+		fact->langEl = optEl;
+		return;
+	}
+
+	/* The factor is a repeat: find or create the repeat element and link the
+	 * factor to it. */
+	String repeatName( 32, "_repeat_%s", fact->refName.data );
+
+	SymbolMapEl *existing = nspace->symbolMap.find( repeatName );
+	if ( existing != 0 ) {
+		fact->langEl = existing->value;
+		return;
+	}
+
+	KlangEl *repeatEl = getKlangEl( this, nspace,
+			repeatName, KlangEl::NonTerm );
+	repeatEl->type = KlangEl::NonTerm;
+	repeatEl->isRepeat = true;
+
+	/* First production of the repeat: the referenced element followed by
+	 * the repeat itself. */
+	ProdElList *recurseEls = new ProdElList;
+	PdaFactor *item = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			fact->refName, 0, false, false );
+	PdaFactor *rest = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			repeatName, 0, false, false );
+	recurseEls->append( item );
+	recurseEls->append( rest );
+
+	Definition *recurseDef = new Definition( InputLoc(),
+			repeatEl, recurseEls, false, 0,
+			prodList.length(), Definition::Production );
+	repeatEl->defList.append( recurseDef );
+	prodList.append( recurseDef );
+
+	/* Second production of the repeat: empty. */
+	ProdElList *emptyEls = new ProdElList;
+
+	Definition *emptyDef = new Definition( InputLoc(),
+			repeatEl, emptyEls, false, 0,
+			prodList.length(), Definition::Production );
+	repeatEl->defList.append( emptyDef );
+	prodList.append( emptyDef );
+
+	fact->langEl = repeatEl;
+}
+
+/* Resolve a factor according to its type. Factors that are neither literals
+ * nor references are left untouched. */
+void ParseData::resolveFactor( PdaFactor *fact )
+{
+	if ( fact->type == PdaFactor::LiteralType )
+		resolveLiteralFactor( fact );
+	else if ( fact->type == PdaFactor::ReferenceType )
+		resolveReferenceFactor( fact );
+}
+
+/* Resolve every factor of every production in the production list. */
+void ParseData::resolveProductionEls()
+{
+	DefList::Iter prod = prodList;
+	while ( prod.lte() ) {
+		ProdElList::Iter fact = *prod->prodElList;
+		while ( fact.lte() ) {
+			resolveFactor( fact );
+			fact++;
+		}
+		prod++;
+	}
+}
+
+/* Find the direct child namespace called name. Returns the first match in
+ * child order, or null when there is none. */
+Namespace *Namespace::findNamespace( const String &name )
+{
+	NamespaceVect::Iter child = childNamespaces;
+	while ( child.lte() ) {
+		if ( strcmp( name, (*child)->name ) == 0 )
+			return *child;
+		child++;
+	}
+	return 0;
+}
+
+/* Search downwards from a previously resolved qualification (name 1+ in a
+ * qual list). Each remaining part must name a child of the namespace reached
+ * so far. Returns the namespace reached once all parts are consumed, or null
+ * as soon as a part cannot be found; qualPart is then left on that part. */
+Namespace *NamespaceQual::searchFrom( Namespace *from, StringVect::Iter &qualPart )
+{
+	for ( ; qualPart.lte(); qualPart.increment() ) {
+		from = from->findNamespace( *qualPart );
+		if ( from == 0 )
+			return 0;
+	}
+
+	return from;
+}
+
+/* Resolve the qualification to a namespace. A non-null result is cached and
+ * returned directly on later calls. Without any qualifying names the result
+ * is the namespace the qualification was declared in. A first name of "root"
+ * starts a downward search at the root namespace. Otherwise the declaring
+ * namespace and then its ancestors are tried until one has a child named by
+ * the first part; the remaining parts are searched for below that child.
+ * Returns null when the qualification cannot be resolved. */
+Namespace *NamespaceQual::getQual( ParseData *pd )
+{
+	/* Do the search only once. */
+	if ( cachedNspaceQual != 0 )
+		return cachedNspaceQual;
+
+	/* No qualification, use the namespace it was declared in. */
+	if ( qualNames.length() == 0 ) {
+		cachedNspaceQual = declInNspace;
+		return cachedNspaceQual;
+	}
+
+	StringVect::Iter qualPart = qualNames;
+
+	/* First item is "root". Start the downward search from there. */
+	if ( strcmp( qualNames[0], "root" ) == 0 ) {
+		qualPart.increment();
+		cachedNspaceQual = searchFrom( pd->rootNamespace, qualPart );
+		return cachedNspaceQual;
+	}
+
+	/* Move upwards through the declaring namespaces looking for the first
+	 * part. */
+	for ( Namespace *scope = declInNspace; scope != 0; 
+			scope = scope->parentNamespace )
+	{
+		Namespace *start = scope->findNamespace( *qualPart );
+		if ( start == 0 )
+			continue;
+
+		/* Found the first part. Continue the search below it. */
+		qualPart.increment();
+		cachedNspaceQual = searchFrom( start, qualPart );
+		return cachedNspaceQual;
+	}
+
+	/* Failed to find the place to start from. */
+	cachedNspaceQual = 0;
+	return cachedNspaceQual;
+}
+
+/* Resolve the factors found in every pattern. Items of other types, such as
+ * input text, need no resolving. */
+void ParseData::resolvePatternEls()
+{
+	PatternList::Iter pat = patternList;
+	while ( pat.lte() ) {
+		PatternItemList::Iter item = *pat->list;
+		while ( item.lte() ) {
+			/* Use pdaFactor reference resolving. */
+			if ( item->type == PatternItem::FactorType )
+				resolveFactor( item->factor );
+			item++;
+		}
+		pat++;
+	}
+}
+
+/* Resolve the factors found in every replacement. Items of other types,
+ * such as input text and variable references, need no resolving. */
+void ParseData::resolveReplacementEls()
+{
+	ReplList::Iter repl = replList;
+	while ( repl.lte() ) {
+		ReplItemList::Iter item = *repl->list;
+		while ( item.lte() ) {
+			/* Use pdaFactor reference resolving. */
+			if ( item->type == ReplItem::FactorType )
+				resolveFactor( item->factor );
+			item++;
+		}
+		repl++;
+	}
+}
+
+/* Give every region that has no token definitions a single definition
+ * matching any one character. The token is a terminal named
+ * "__<region>_DEF_PAT" that lives in the root namespace. */
+void ParseData::initEmptyScanners()
+{
+	for ( RegionList::Iter reg = regionList; reg.lte(); reg++ ) {
+		if ( reg->tokenDefList.length() != 0 )
+			continue;
+
+		/* Value-initialize the location. It is handed to the token
+		 * definition below and must not carry indeterminate contents. */
+		InputLoc loc = InputLoc();
+		String name( reg->name.length() + 16, "__%s_DEF_PAT", reg->name.data );
+
+		KlangEl *lel = getKlangEl( this, rootNamespace,
+				name.data, KlangEl::Term );
+		assert( lel != 0 );
+		assert( lel->type == KlangEl::Term );
+
+		Join *join = new Join( new Expression( BT_Any ) );
+
+		TokenDef *tokenDef = new TokenDef( join, lel, loc, nextTokenId++,
+				rootNamespace, reg );
+		reg->tokenDefList.append( tokenDef );
+		lel->tokenDef = tokenDef;
+	}
+}
+
+
+/*
+ * Pattern
+ */
+
+/* Set up an input stream that reads from a pattern. Reading starts at the
+ * head of the pattern's item list, at offset zero, with no flush pending. */
+InputStreamPattern::InputStreamPattern( Pattern *pattern )
+: 
+	pattern(pattern),
+	patItem(pattern->list->head),
+	offset(0),
+	flush(false)
+{}
+
+/* True when there is a current pattern item and it is a factor. */
+int InputStreamPattern::isLangEl()
+{ 
+	if ( patItem == 0 )
+		return 0;
+	return patItem->type == PatternItem::FactorType;
+}
+
+/* True when the pattern is exhausted or the current item is a factor. */
+int InputStreamPattern::shouldFlush()
+{ 
+	if ( patItem == 0 )
+		return 1;
+	return patItem->type == PatternItem::FactorType;
+}
+
+/* Take the language element of the current factor item and advance to the
+ * next pattern item. bindId receives the item's bind id. No text accompanies
+ * a pattern factor, so data and length are cleared. */
+KlangEl *InputStreamPattern::getLangEl( long &bindId, char *&data, long &length )
+{ 
+	data = 0;
+	length = 0;
+	bindId = patItem->bindId;
+	KlangEl *result = patItem->factor->langEl;
+
+	/* Advance to the start of the next item. */
+	patItem = patItem->next;
+	offset = 0;
+	flush = false;
+
+	return result;
+}
+
+
+/* Copy up to length bytes of the current text item into dest, starting at
+ * the current offset. When the item is used up the stream advances to the
+ * next item and the flush flag is recomputed; otherwise the flag is cleared.
+ * Returns the number of bytes copied. */
+int InputStreamPattern::getData( char *dest, int length )
+{ 
+	assert ( patItem->type == PatternItem::InputText );
+
+	/* Never hand out more than what is left in this item. */
+	int remaining = patItem->data.length() - offset;
+	const int take = length < remaining ? length : remaining;
+
+	memcpy( dest, patItem->data.data+offset, take );
+	offset += take;
+
+	if ( offset != patItem->data.length() ) {
+		/* There is more data in this buffer. Don't flush. */
+		flush = false;
+		return take;
+	}
+
+	/* Read up to the end of the data. Advance the pattern item. */
+	patItem = patItem->next;
+	offset = 0;
+	flush = shouldFlush();
+	return take;
+}
+
+/* End of input is reached once there is no current pattern item. */
+int InputStreamPattern::isEOF()
+{
+	return patItem == 0;
+}
+
+/* Report the flush flag as last set by getData or getLangEl. */
+int InputStreamPattern::needFlush()
+{
+	return flush;
+}
+
+
+/* Step back one pattern item. From the end of the pattern (no current item)
+ * this lands on the tail of the item list. */
+void InputStreamPattern::backup()
+{
+	patItem = ( patItem == 0 ) ? pattern->list->tail : patItem->prev;
+}
+
+/* Push length bytes starting at data back onto the stream. The read position
+ * moves backwards, crossing into earlier pattern items as needed. The
+ * asserts check that the bytes being returned are the ones the pattern
+ * holds at those positions. */
+void InputStreamPattern::pushBack( char *data, long length )
+{
+	if ( length == 0 )
+		return;
+
+	/* While pushing back past the current pattern item start. */
+	while ( length > offset ) {
+		/* The first offset bytes of the current item were the last ones
+		 * read, so they correspond to the tail of what is still to be pushed
+		 * back. Once length is reduced that tail begins at data+length. */
+		length -= offset;
+		if ( offset > 0 )
+			assert( memcmp( patItem->data, data+length, offset ) == 0 );
+		backup();
+		offset = patItem->data.length();
+	}
+
+	/* What remains lies inside the current item and matches the head of the
+	 * pushed back data. */
+	offset -= length;
+	assert( memcmp( &patItem->data[offset], data, length ) == 0 );
+}
+
+/* Step back one pattern item and set the offset to the length of that
+ * item's data. */
+void InputStreamPattern::pushBackNamed()
+{
+	backup();
+	offset = patItem->data.length();
+}
+
+
+/*
+ * Replacement
+ */
+
+/* Set up an input stream that reads from a replacement. Reading starts at
+ * the head of the replacement's item list, at offset zero, with no flush
+ * pending. */
+InputStreamRepl::InputStreamRepl( Replacement *replacement )
+: 
+	replacement(replacement),
+	replItem(replacement->list->head),
+	offset(0),
+	flush(false)
+{}
+
+/* True when there is a current replacement item and it is either a variable
+ * reference or a factor. */
+int InputStreamRepl::isLangEl()
+{ 
+	if ( replItem == 0 )
+		return 0;
+	return replItem->type == ReplItem::VarRefType || 
+			replItem->type == ReplItem::FactorType;
+}
+
+/* True when the replacement is exhausted or the current item is either a
+ * variable reference or a factor. */
+int InputStreamRepl::shouldFlush()
+{ 
+	if ( replItem == 0 )
+		return 1;
+	return replItem->type == ReplItem::VarRefType || 
+			replItem->type == ReplItem::FactorType;
+}
+
+/* Take the language element of the current item and advance to the next
+ * replacement item. A variable reference supplies its own element, anything
+ * else the element of its factor. bindId receives the item's bind id. For a
+ * factor that is a literal, the literal's text is prepared into the item's
+ * data and returned through data and length; otherwise both are cleared. */
+KlangEl *InputStreamRepl::getLangEl( long &bindId, char *&data, long &length )
+{ 
+	KlangEl *result;
+	if ( replItem->type == ReplItem::VarRefType )
+		result = replItem->langEl;
+	else
+		result = replItem->factor->langEl;
+
+	bindId = replItem->bindId;
+	data = 0;
+	length = 0;
+
+	const bool literalFactor = replItem->type == ReplItem::FactorType &&
+			replItem->factor->literal != 0;
+	if ( literalFactor ) {
+		bool unusedCI;
+		prepareLitString( replItem->data, unusedCI, 
+				replItem->factor->literal->token.data,
+				replItem->factor->literal->token.loc );
+
+		data = replItem->data;
+		length = replItem->data.length();
+	}
+
+	/* Advance to the start of the next item. */
+	replItem = replItem->next;
+	offset = 0;
+	flush = false;
+
+	return result;
+}
+
+int InputStreamRepl::getData( char *dest, int length )
+{
+	assert ( replItem->type == ReplItem::InputText );
+
+	/* Never hand out more than what is left in the current item. */
+	const int remaining = replItem->data.length() - offset;
+	if ( length > remaining )
+		length = remaining;
+
+	memcpy( dest, replItem->data.data+offset, length );
+	offset += length;
+
+	/* Data still left in this item means no flush yet. */
+	if ( offset != replItem->data.length() ) {
+		flush = false;
+		return length;
+	}
+
+	/* Item exhausted: advance and let the next item decide on the flush. */
+	replItem = replItem->next;
+	offset = 0;
+	flush = shouldFlush();
+	return length;
+}
+
+int InputStreamRepl::isEOF()
+{
+	return !replItem; /* A null item pointer means we are past the last item. */
+}
+
+int InputStreamRepl::needFlush()
+{
+	return flush; /* Reports the flag as last set by getData() or getLangEl(). */
+}
+
+void InputStreamRepl::backup()
+{
+	/* Step back one item. A null replItem is treated as the position just
+	 * past the end of the list, so backing up from there lands on the
+	 * tail. */
+	replItem = ( replItem != 0 ) ? replItem->prev : replacement->list->tail;
+}
+
+void InputStreamRepl::pushBack( char *data, long length )
+{
+	if ( length == 0 )
+		return;
+	/* Walk backwards over item boundaries; the current item's bytes are the
+	 * last ones in data. At offset 0 replItem may be null, so skip the check. */
+	while ( length > offset ) {
+		length -= offset;
+		assert( offset == 0 || memcmp( replItem->data, data+length, offset ) == 0 );
+		backup();
+		offset = replItem->data.length();
+	}
+
+	offset -= length;
+	assert( memcmp( &replItem->data[offset], data, length ) == 0 );
+}
+
+void InputStreamRepl::pushBackNamed()
+{
+	backup(); /* Return to the previous item ... */
+	offset = replItem->data.length(); /* ... positioned at the end of its data. */
+}
+
+
+void ParseData::makePatternParsers()
+{
+	/* The reduction action compilation phase is assumed to have run already
+	 * and to have decorated every pattern with its target type. */
+	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
+		assert( pat->langEl != 0 );
+		KlangEl *target = pat->langEl;
+		if ( target->type != KlangEl::NonTerm )
+			error(pat->loc) << "pattern type is not a non-terminal" << endp;
+
+		/* Build the parser rooted at the pattern's language element. */
+		makeParser( target );
+	}
+
+	/* Replacements are expected to have been decorated with their target
+	 * type by that same phase. */
+	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
+		assert( repl->langEl != 0 );
+		KlangEl *target = repl->langEl;
+		makeParser( target );
+	}
+}
+
+void ParseData::parsePatterns()
+{
+	/* A single scanner run and a single program serve every parse below. */
+	FsmRun fsmRun( runtimeData->fsmTables );
+	Program program( false, runtimeData );
+
+	/* Replacements go first. Each one is fed to the scanner through its own
+	 * input stream and keeps hold of the parser run created for it. */
+	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
+		InputStreamRepl replInput( repl );
+		fsmRun.attachInputStream( &replInput );
+
+		/* The run is stored on the replacement before it is started. */
+		repl->pdaRun = new PdaRun( 0, &program,
+				repl->langEl->pdaTables, &fsmRun, 0 );
+		repl->pdaRun->run();
+	}
+
+	/* Patterns are treated the same way, using the pattern input stream. */
+	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
+		InputStreamPattern patInput( pat );
+		fsmRun.attachInputStream( &patInput );
+
+		/* The run is stored on the pattern before it is started. */
+		pat->pdaRun = new PdaRun( 0, &program,
+				pat->langEl->pdaTables, &fsmRun, 0 );
+		pat->pdaRun->run();
+	}
+
+	/* Everything is parsed; pass the program on so that the patterns can
+	 * be filled in. */
+	fillInPatterns( &program );
+}
+
+void ParseData::verifyParseStopGrammar( KlangEl *langEl )
+{
+	PdaGraph *graph = langEl->pdaGraph;
+
+	/* Enter the graph at its start state and traverse over the root
+	 * definition. The state reached that way is the only one that is
+	 * allowed to have a transition on eof. */
+	PdaState *afterRoot = graph->followFsm( graph->startState,
+			langEl->rootDef->fsm );
+
+	/* The graph must reduce to root all on its own, it cannot depend on
+	 * seeing EOF. Any other state with a transition keyed on the eof
+	 * language element is therefore rejected. */
+	for ( PdaStateList::Iter st = graph->stateList; st.lte(); st++ ) {
+		if ( st == afterRoot )
+			continue;
+
+		for ( TransMap::Iter trans = st->transMap; trans.lte(); trans++ ) {
+			/* This needs a better error message. Appears to be voodoo. */
+			if ( trans->value->lowKey == eofKlangEl->id )
+				error() << "grammar is not usable with parse_stop" << endp;
+		}
+	}
+}
+
+void ParseData::resolveUses()
+{
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->objectDefUses != 0 ) {
+			/* Find the namespace that the qualification refers to. */
+			Namespace *usesNspace = lel->objectDefUsesQual->getQual( this );
+			if ( usesNspace == 0 )
+				error() << "do not have namespace for resolving reference" << endp;
+
+			/* Fetch the named language element from that namespace and
+			 * share its object definition with this element. */
+			KlangEl *used = getKlangEl( this, usesNspace, lel->objectDefUses, KlangEl::Unknown );
+			lel->objectDef = used->objectDef;
+		}
+	}
+}
+
+void ParseData::semanticAnalysis()
+{
+	beginProcessing();
+	initKeyOps();
+
+	/* Resolve uses statements. */
+	resolveUses();
+	
+	/* Init the longest match data and create the default scanner which will
+	 * return single characters for us when we have no other scanner. */
+	initLongestMatchData();
+	createDefaultScanner();
+
+	/* This needs to happen before the scanner is built. */
+	resolveProductionEls();
+
+	/* Resolve pattern and replacement elements. */
+	resolvePatternEls();
+	resolveReplacementEls();
+
+	/* Fill any empty scanners with a default token. */
+	initEmptyScanners();
+
+	FsmGraph *fsmGraph = makeScanner();
+
+	#ifdef COLM_LOG_COMPILE
+	printNameTree( fsmGraph->rootName );
+	printNameIndex( fsmGraph->nameIndex );
+	#endif
+
+	prepGrammar();
+
+	/* Compile bytecode. */
+	compileByteCode();
+
+	/* Make the reduced fsm. */
+	RedFsmBuild reduce( sectionName, this, fsmGraph );
+	RedFsm *redFsm = reduce.reduceMachine();
+
+	/* Build the parsers used for patterns and replacements. */
+	makePatternParsers();
+
+	/* Make a parser for every language element that has a parser id. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->parserId >= 0 ) {
+			makeParser( lel );
+
+			if ( lel->parseStop )
+				verifyParseStopGrammar( lel );
+		}
+	}
+
+	/* Make the scanner tables. */
+	fsmTables = redFsm->makeFsmTables();
+
+	/* Now that all parsers are built, make the global runtimeData. */
+	makeRuntimeData();
+
+	/* 
+	 * All compilation is now complete.
+	 */
+	
+	/* Parse patterns and replacements. */
+	parsePatterns();
+
+	/*
+	 * Write output.
+	 */
+
+	openOutput();
+
+	FsmCodeGen *fsmGen = new FsmCodeGen("<INPUT>", sectionName,
+			*outStream, redFsm, fsmTables );
+
+	PdaCodeGen *pdaGen = new PdaCodeGen( outputFileName, "parser", this, *outStream ); /* NOTE(review): fsmGen and pdaGen are never deleted here. */
+
+	pdaGen->writeFirst();
+	fsmGen->writeCode();
+
+	/* Write out the tables of the parsers that were made above. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->parserId >= 0 )
+			pdaGen->writeParserData( lel->parserId, lel->pdaTables );
+	}
+
+	/* Write the runtime data. */
+	pdaGen->writeRuntimeData( runtimeData );
+
+	outStream->flush();
+}
diff --git a/colm/parsedata.h b/colm/parsedata.h
new file mode 100644
index 00000000..801956f0
--- /dev/null
+++ b/colm/parsedata.h
@@ -0,0 +1,904 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _PARSEDATA_H
+#define _PARSEDATA_H
+
+#include <iostream>
+#include <limits.h>
+#include "bstset.h"
+#include "colm.h"
+#include "avlmap.h"
+#include "avlset.h"
+#include "bstmap.h"
+#include "vector.h"
+#include "dlist.h"
+#include "dlistmel.h"
+#include "fsmgraph.h"
+#include "compare.h"
+#include "vector.h"
+#include "common.h"
+#include "parsetree.h"
+#include "astring.h"
+#include "pdagraph.h"
+#include "compare.h"
+#include "pdarun.h"
+#include "bytecode.h"
+
+using std::ostream;
+
+/* Forwards. */
+struct RedFsm;
+struct KlangEl;
+struct ParseData;
+struct PdaCodeGen;
+struct FsmCodeGen;
+
+#define SHIFT_CODE 0x1
+#define REDUCE_CODE 0x2
+#define SHIFT_REDUCE_CODE 0x3
+
+inline long makeReduceCode( long reduction, bool isShiftReduce )
+{
+	/* Low two bits select the action kind; the reduction sits above them. */
+	return ( reduction << 2 ) | ( isShiftReduce ? SHIFT_REDUCE_CODE : REDUCE_CODE );
+}
+
+struct PdaFactor;
+struct ProdElList;
+struct PdaLiteral;
+struct Definition;
+
+struct DefListEl { Definition *prev, *next; }; /* List links used by DefList. */
+struct LelDefListEl { Definition *prev, *next; }; /* List links used by LelDefList. */
+typedef Vector< KlangEl* > KlangElVect;
+typedef Vector< PdaFactor* > FactorVect;
+
+typedef AvlMap<String, long, CmpStr> StringMap;
+typedef AvlMapEl<String, long> StringMapEl;
+
+/* A production and the data that gets attached to it. */
+struct Definition 
+:
+	public DefListEl, public LelDefListEl
+{
+	enum Type { Production };
+
+	Definition( const InputLoc &loc, KlangEl *prodName, ProdElList *prodElList, 
+			bool prodCommit, CodeBlock *redBlock, int prodId, Type type ) : 
+		loc(loc), prodName(prodName), prodElList(prodElList), 
+		prodCommit(prodCommit), redBlock(redBlock), prodId(prodId), 
+		type(type), fsm(0), fsmLength(0), uniqueEmptyLeader(0), 
+		isLeftRec(false), localFrame(0), lhsField(0) {}
+
+	InputLoc loc;
+	KlangEl *prodName;
+	ProdElList *prodElList;
+	bool prodCommit;
+
+	CodeBlock *redBlock;
+
+	int prodId; /* The key CmpDefById orders productions by. */
+	Type type;
+
+	PdaGraph *fsm; /* Null until set; the constructor does not build it. */
+	int fsmLength;
+	String data;
+	LongSet reducesTo;
+
+	KlangEl *uniqueEmptyLeader;
+
+	ProdIdSet nonTermFirstSet;
+	AlphSet firstSet;
+	bool isLeftRec;
+
+	ObjectDef *localFrame;
+	ObjField *lhsField;
+};
+
+struct CmpDefById
+{
+	/* Three-way comparison of two productions by their production id.
+	 * Yields -1, 0 or 1. */
+	static int compare( Definition *d1, Definition *d2 )
+	{
+		const int lhs = d1->prodId, rhs = d2->prodId;
+		if ( lhs == rhs )
+			return 0;
+		return lhs < rhs ? -1 : 1;
+	}
+};
+
+
+/* Map dotItems to productions. */
+typedef BstMap< int, Definition*, CmpOrd<int> > DotItemIndex;
+typedef BstMapEl< int, Definition*> DotItemIndexEl;
+
+/* Lists of productions. Each non terminal can have many productions. */
+typedef DListMel<Definition, DefListEl> DefList;
+typedef DListMel<Definition, LelDefListEl> LelDefList;
+
+/* A set of machines made during a closure round. */
+typedef Vector< PdaGraph* > Machines;
+
+/* List of language elements. */
+typedef DList<KlangEl> LelList;
+
+typedef Vector< TokenDef* > TokenDefVect;
+
+struct UniqueType;
+
+typedef Vector<KlangEl*> KlangElVect;
+
+/* A language element class. Can be a nonTerm or a term. */
+struct KlangEl : public DListEl<KlangEl>
+{
+	enum Type { Unknown, Term, NonTerm };
+
+	KlangEl( Namespace *nspace, const String &name, Type type );
+	~KlangEl();
+
+	/* The namespace the language element was defined in. */
+	Namespace *nspace;
+
+	String name;
+	String lit;
+
+	String fullName;
+	String fullLit;
+
+	Type type;
+	long id;
+	bool isUserTerm;
+	bool isContext;
+	String displayString;
+	long numAppearances;
+	bool commit;
+	bool ignore;
+	bool reduceFirst;
+	bool isLiteral;
+	bool isRepeat;
+	bool isOpt;
+	bool parseStop; /* When set, semanticAnalysis() runs verifyParseStopGrammar(). */
+
+	/* Productions from the language element if it is a non-terminal. */
+	LelDefList defList;
+
+	TokenDef *tokenDef;
+	Definition *rootDef;
+	KlangEl *termDup;
+
+	PdaGraph *pdaGraph;
+	PdaTables *pdaTables;
+
+	CodeBlock *transBlock;
+
+	ObjectDef *objectDef;
+	NamespaceQual *objectDefUsesQual; /* Qualification used by resolveUses(). */
+	String objectDefUses; /* Name looked up by resolveUses() to borrow an objectDef. */
+
+	long thisSize;
+	long ofiOffset;
+
+	GenericType *generic;
+
+
+	long parserId; /* Elements with parserId >= 0 get a parser in semanticAnalysis(). */
+};
+
+struct PdaFactor
+{
+	/* The kinds of factor: a literal or a reference by name. */
+	enum Type {
+		LiteralType, 
+		ReferenceType
+	}; 
+
+	/* Construct with a literal. */
+	PdaFactor( const InputLoc &loc, bool commit, NamespaceQual *nspaceQual, 
+			PdaLiteral *literal, int priorVal, bool opt, bool repeat ) :
+		loc(loc), commit(commit), nspaceQual(nspaceQual), 
+		literal(literal), langEl(0), priorVal(priorVal), opt(opt), repeat(repeat),
+		nspace(0), type(LiteralType), objField(0) {}
+
+	/* Construct with a reference by name; langEl starts out null. */
+	PdaFactor( const InputLoc &loc, bool commit, NamespaceQual *nspaceQual, 
+			const String &refName, int priorVal, bool opt, bool repeat ) :
+		loc(loc), commit(commit), nspaceQual(nspaceQual), refName(refName),
+		literal(0), langEl(0), priorVal(priorVal), opt(opt), repeat(repeat), 
+		nspace(0), type(ReferenceType), objField(0) {}
+
+	PdaFactor( const InputLoc &loc, KlangEl *langEl ) : /* Reference to a known language element. */
+		loc(loc), commit(false), nspaceQual(0), literal(0), langEl(langEl), 
+		priorVal(0), opt(false), repeat(false), nspace(0), type(ReferenceType), objField(0) {}
+
+	PdaFactor() : /* Empty factor; type is LiteralType with a null literal. */
+		commit(false), nspaceQual(0), 
+		literal(0), langEl(0), priorVal(0), opt(false), repeat(false),
+		nspace(0), type(LiteralType), objField(0) {}
+
+	InputLoc loc;
+	bool commit;
+	NamespaceQual *nspaceQual;
+	String refName;
+	PdaLiteral *literal;
+	KlangEl *langEl;
+	int priorVal;
+	bool opt;
+	bool repeat;
+	Namespace *nspace;
+	Type type;
+	ObjField *objField;
+
+	PdaFactor *prev, *next; /* Links for the DList that ProdElList derives from. */
+};
+
+struct ProdElList : public DList<PdaFactor> /* A list of factors; see Definition::prodElList. */
+{
+	PdaGraph *walk( ParseData *pd ); /* Defined outside this header. */
+};
+
+/* Some literal. Can be a number or literal string. */
+struct PdaLiteral
+{
+	PdaLiteral( const InputLoc &loc, const Token &token )
+		: loc(loc), token(token), value(0) { }
+
+	InputLoc loc;
+	Token token; /* The token the literal was constructed from. */
+	long value; /* Starts out as zero. */
+};
+
+/* Forwards. */
+using std::ostream;
+
+/* Nodes in the tree that use this action. */
+typedef Vector<NameInst*> ActionRefs;
+
+/* Element in list of actions. Contains the string for the code to execute. */
+struct Action 
+:
+	public DListEl<Action>,
+	public AvlTreeEl<Action>
+{
+public:
+
+	Action( const InputLoc &loc, const String &name, InlineList *inlineList ) /* markType is left unset. */
+	:
+		loc(loc),
+		name(name),
+		objField(0),
+		inlineList(inlineList), 
+		actionId(-1),
+		numTransRefs(0),
+		numToStateRefs(0),
+		numFromStateRefs(0),
+		numEofRefs(0),
+		numCondRefs(0),
+		anyCall(false),
+		isLmAction(false)
+	{
+	}
+
+	Action( MarkType markType, ObjField *objField ) /* Named "mark", with a fresh inline list. */
+	:
+		name("mark"),
+		markType(markType),
+		objField(objField),
+		inlineList(new InlineList), 
+		actionId(-1),
+		numTransRefs(0),
+		numToStateRefs(0),
+		numFromStateRefs(0),
+		numEofRefs(0),
+		numCondRefs(0),
+		anyCall(false),
+		isLmAction(false)
+	{
+	}
+
+	/* Key for action dictionary. */
+	const String &getKey() const { return name; }
+
+	/* Data collected during parse. */
+	InputLoc loc;
+	String name;
+	
+	MarkType markType;
+	ObjField *objField;
+
+	InlineList *inlineList;
+	int actionId;
+
+	void actionName( ostream &out ) /* Writes the name, or line:col when there is no name. */
+	{
+		if ( name != 0 )
+			out << name;
+		else
+			out << loc.line << ":" << loc.col;
+	}
+
+	/* Places in the input text that reference the action. */
+	ActionRefs actionRefs;
+
+	/* Number of references in the final machine. NOTE(review): returns bool, so only "any references" survives; numCondRefs is not counted. */
+	bool numRefs() 
+		{ return numTransRefs + numToStateRefs + numFromStateRefs + numEofRefs; }
+	int numTransRefs;
+	int numToStateRefs;
+	int numFromStateRefs;
+	int numEofRefs;
+	int numCondRefs;
+	bool anyCall;
+
+	bool isLmAction;
+};
+
+/* A list of actions. */
+typedef DList<Action> ActionList;
+typedef AvlTree<Action, String, CmpStr> ActionDict;
+
+struct VarDef;
+struct Join;
+struct Expression;
+struct Term;
+struct FactorWithAug;
+struct FactorWithLabel;
+struct FactorWithRep;
+struct FactorWithNeg;
+struct Factor;
+struct Literal;
+struct Range;
+struct RegExpr;
+struct ReItem;
+struct ReOrBlock;
+struct ReOrItem;
+struct TokenRegion;
+
+/* Priority name dictionary. */
+typedef AvlMapEl<String, int> PriorDictEl;
+typedef AvlMap<String, int, CmpStr> PriorDict;
+
+/* Local error name dictionary. */
+typedef AvlMapEl<String, int> LocalErrDictEl;
+typedef AvlMap<String, int, CmpStr> LocalErrDict;
+
+/* Tree of instantiated names. */
+typedef BstMapEl<String, NameInst*> NameMapEl;
+typedef BstMap<String, NameInst*, CmpStr> NameMap;
+typedef Vector<NameInst*> NameVect;
+typedef BstSet<NameInst*> NameSet;
+
+/* Node in the tree of instantiated names. */
+struct NameInst
+{
+	NameInst( const InputLoc &loc, NameInst *parent, const String &name, 
+				int id, bool isLabel ) : 
+		loc(loc), parent(parent), name(name), id(id), isLabel(isLabel),
+		isLongestMatch(false), numRefs(0), numUses(0), start(0), final(0) {}
+
+	InputLoc loc;
+
+	/* Keep parent pointers in the name tree to retrieve 
+	 * fully qualified names. */
+	NameInst *parent;
+
+	String name;
+	int id;
+	bool isLabel;
+	bool isLongestMatch;
+
+	int numRefs;
+	int numUses;
+
+	/* Names underneath us, excludes anonymous names. */
+	NameMap children;
+
+	/* All names underneath us in order of appearance. */
+	NameVect childVect;
+
+	/* Join scopes need an implicit "final" target. */
+	NameInst *start, *final;
+
+	/* During a fsm generation walk, lists the names that are referenced by
+	 * epsilon operations in the current scope. After the link is made by the
+	 * epsilon reference and the join operation is complete, the label can
+	 * have its refcount decremented. Once there are no more references the
+	 * entry point can be removed from the fsm returned. */
+	NameVect referencedNames;
+
+	/* Pointers for the name search queue. */
+	NameInst *prev, *next;
+
+	/* Check if this name inst or any name inst below is referenced. */
+	bool anyRefsRec();
+};
+
+typedef DList<NameInst> NameInstList;
+
+/* Stack frame used in walking the name tree. */
+struct NameFrame 
+{
+	NameInst *prevNameInst; /* presumably a saved ParseData::curNameInst — TODO confirm */
+	int prevNameChild; /* presumably a saved ParseData::curNameChild — TODO confirm */
+	NameInst *prevLocalScope; /* presumably a saved ParseData::localNameScope — TODO confirm */
+};
+
+/* Class to collect information about the machine during the 
+ * parse of input. */
+struct ParseData
+{
+	/* Create a new parse data object. This is done at the beginning of every
+	 * fsm specification. */
+	ParseData( const String &fileName, const String &sectionName, 
+			const InputLoc &sectionLoc, ostream &out );
+	~ParseData();
+
+	/*
+	 * Setting up the graph dict.
+	 */
+
+	void compileLiteralTokens();
+	void initEmptyScanners();
+	void initUniqueTypes();
+
+	/* Initialize a graph dict with the basic fsms. */
+	void initGraphDict();
+	void createBuiltin( const char *name, BuiltinMachine builtin );
+
+	/* Make a name id in the current name instantiation scope if it is not
+	 * already there. */
+	NameInst *addNameInst( const InputLoc &loc, char *data, bool isLabel );
+	NameInst *makeJoinNameTree( Join *join );
+	NameInst *makeNameTree( );
+	void fillNameIndex( NameInst **nameIndex, NameInst *from );
+	NameInst **makeNameIndex( NameInst *rootName );
+
+	void printNameTree( NameInst *rootName );
+	void printNameIndex( NameInst **nameIndex );
+
+	/* Increments the usage count on entry names. Names that are no longer
+	 * needed will have their entry points unset. */
+	void unsetObsoleteEntries( FsmGraph *graph );
+
+	/* Resolve name references in action code and epsilon transitions. */
+	NameSet resolvePart( NameInst *refFrom, const char *data, bool recLabelsOnly );
+	void resolveFrom( NameSet &result, NameInst *refFrom, 
+			const NameRef &nameRef, int namePos );
+	void referenceRegions( NameInst *root );
+
+	/* Set the alphabet type. If the types are not valid returns false. */
+	bool setAlphType( char *s1, char *s2 );
+	bool setAlphType( char *s1 );
+
+	/* Unique actions. */
+	void removeDups( ActionTable &actionTable );
+	void removeActionDups( FsmGraph *graph );
+
+	/* Dumping the name instantiation tree. */
+	void printNameInst( NameInst *nameInst, int level );
+
+	/* Make the graph from a graph dict node. Does minimization. */
+	void finishGraphBuild( FsmGraph *graph );
+	FsmGraph *makeJoin( Join *join );
+	FsmGraph *makeAllRegions();
+	FsmGraph *makeFsmGraph( Join *join );
+	FsmGraph *makeScanner() 
+		{ return makeFsmGraph(0); }
+
+	void analyzeAction( Action *action, InlineList *inlineList );
+	void analyzeGraph( FsmGraph *graph );
+
+	void initKeyOps();
+
+	/*
+	 * Data collected during the parse.
+	 */
+
+	/* The list of instances. */
+	GraphList instanceList;
+
+	/* Dictionary of actions. Lets actions be defined and then referenced. */
+	ActionDict actionDict;
+
+	/* Dictionary of named priorities. */
+	PriorDict priorDict;
+
+	/* Dictionary of named local errors. */
+	LocalErrDict localErrDict;
+
+	/* List of actions. Will be pasted into a switch statement. */
+	ActionList actionList;
+
+	/* The id of the next priority name and label. */
+	int nextPriorKey, nextLocalErrKey, nextNameId;
+	
+	/* The default priority number key for a machine. This is active during
+	 * the parse of the rhs of a machine assignment. */
+	int curDefPriorKey;
+
+	int curDefLocalErrKey;
+
+	/* Alphabet type. */
+	HostType *userAlphType;
+	bool alphTypeSet;
+
+	/* Element type and get key expression. */
+	InlineList *getKeyExpr;
+	InlineList *accessExpr;
+	InlineList *curStateExpr;
+
+	/* The alphabet range. */
+	char *lowerNum, *upperNum;
+	Key lowKey, highKey;
+	InputLoc rangeLowLoc, rangeHighLoc;
+
+	/* The name of the file the fsm is from, and the spec name. */
+	String fileName;
+	String sectionName;
+	InputLoc sectionLoc;
+
+	/* Number of errors encountered parsing the fsm spec. */
+	int errorCount;
+
+	/* Counting the action and priority ordering. */
+	int curActionOrd;
+	int curPriorOrd;
+
+	/* Root of the name tree. */
+	NameInst *curNameInst;
+	int curNameChild;
+
+	/* The place where resolved epsilon transitions go. These cannot go into
+	 * the parse tree because a single epsilon op can resolve more than once
+	 * to different nameInsts if the machine it's in is used more than once. */
+	NameVect epsilonResolvedLinks;
+	int nextEpsilonResolvedLink;
+
+	/* Root of the name tree used for doing local name searches. */
+	NameInst *localNameScope;
+
+	void setLmInRetLoc( InlineList *inlineList );
+	void initLongestMatchData();
+	void initNameWalk( NameInst *rootName );
+	NameInst *nextNameScope() { return curNameInst->childVect[curNameChild]; }
+	NameFrame enterNameScope( bool isLocal, int numScopes );
+	void popNameScope( const NameFrame &frame );
+	void resetNameScope( const NameFrame &frame );
+
+	/* Counter for assigning ids to longest match items. */
+	int nextTokenId;
+
+	/* List of all longest match parse tree items. */
+	RegionList regionList;
+
+	NamespaceList namespaceList;
+
+	Action *newAction( const String &name, InlineList *inlineList );
+
+	Action *setTokStart;
+	int setTokStartOrd;
+
+	Action *initActId;
+	int initActIdOrd;
+
+	Action *setTokEnd;
+	int setTokEndOrd;
+
+	CodeBlock *rootCodeBlock;
+
+	void beginProcessing() /* Points the global condData and keyOps at this object's copies. */
+	{
+		::condData = &thisCondData;
+		::keyOps = &thisKeyOps;
+	}
+
+	CondData thisCondData;
+	KeyOps thisKeyOps;
+
+	/* CONTEXT FREE */
+	void wrapNonTerminals();
+	void makeDefinitionNames();
+	void noUndefindKlangEls();
+	void makeKlangElIds();
+	void makeKlangElNames();
+
+	/* Parser generation. */
+	void advanceReductions( PdaGraph *pdaGraph );
+	void sortActions( PdaGraph *pdaGraph );
+	void addDupTerms( PdaGraph *pdaGraph );
+	void linkExpansions( PdaGraph *pdaGraph );
+	void lalr1FollowEpsilonOp( PdaGraph *pdaGraph );
+
+	void transferCommits( PdaGraph *pdaGraph, PdaTrans *trans, PdaState *state, long prodId );
+
+	void lalr1AddFollow2( PdaGraph *pdaGraph, PdaTrans *trans, FollowToAdd &followKeys );
+	void lalr1AddFollow1( PdaGraph *pdaGraph, PdaState *state );
+
+	void lalr1AddFollow2( PdaGraph *pdaGraph, PdaTrans *trans, long followKey, long prior );
+	void lalr1AddFollow1( PdaGraph *pdaGraph, PdaTrans *trans );
+
+	void lalr1AddFollowSets( PdaGraph *pdaGraph, KlangEl *rootEl );
+
+	void lr0BringInItem( PdaGraph *pdaGraph, PdaState *dest, PdaState *prodState, 
+			PdaTrans *expandFrom, Definition *prod );
+	void lr0InvokeClosure( PdaGraph *pdaGraph, PdaState *state );
+	void lr0CloseAllStates( PdaGraph *pdaGraph );
+
+	void lalr1GenerateParser( PdaGraph *pdaGraph, KlangEl *rootEl );
+
+	void reduceActions( PdaGraph *pdaGraph );
+
+	bool makeNonTermFirstSetProd( Definition *prod, PdaState *state );
+	void makeNonTermFirstSets();
+
+	bool makeFirstSetProd( Definition *prod, PdaState *state );
+	void makeFirstSets();
+
+	void trySetTime( PdaTrans *trans, long code, long &time );
+	void addRegion( PdaState *tabState, long pdaKey );
+	PdaState *followProd( PdaState *tabState, PdaState *prodState );
+	void findFollow( AlphSet &result, PdaState *overTab, 
+			PdaState *overSrc, Definition *parentDef );
+	void pdaActionOrder( PdaGraph *pdaGraph, KlangEl *rootEl );
+	void pdaOrderFollow( KlangEl *rootEl, PdaState *tabState, 
+			PdaTrans *tabTrans, PdaTrans *srcTrans,
+			Definition *parentDef, Definition *definition, long &time );
+	void pdaOrderProd( KlangEl *rootEl, PdaState *tabState, 
+			PdaState *srcState, Definition *parentDef, long &time );
+	void analyzeMachine( PdaGraph *pdaGraph, KlangEl *rootEl );
+
+	void makeProdFsms();
+	void insertUniqueEmptyProductions();
+	void printNonTermFirstSets();
+	void printFirstSets();
+
+	void resolveLiteralFactor( PdaFactor *fact );
+	void resolveReferenceFactor( PdaFactor *fact );
+	void resolveFactor( PdaFactor *fact );
+	void resolveProductionEls();
+	void resolvePatternEls();
+	void resolveReplacementEls();
+
+	void addMatchText( ObjectDef *frame, KlangEl *lel );
+	void addMatchLength( ObjectDef *frame, KlangEl *lel );
+	void addTransTokVar( ObjectDef *frame, KlangEl *lel );
+	void addProdRHSLoads( Definition *prod, long pos );
+	void addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList );
+	void addProdRedObjectVar( ObjectDef *localFrame, KlangEl *langEl );
+	void addProdObjects();
+
+	void prepGrammar();
+
+	void makePatternParsers();
+	void parsePatterns();
+
+	void makeParser( KlangEl *rootEl );
+	PdaGraph *makePdaGraph( KlangEl *rootEl );
+	PdaTables *makePdaTables( PdaGraph *pdaGraph );
+
+	void fillInPatterns( Program *prg );
+	void makeRuntimeData();
+
+	/* Generate and write out the fsm. */
+	void generateGraphviz();
+
+	void verifyParseStopGrammar( KlangEl *langEl );
+
+	void initFieldInstructions( ObjField *el );
+	void initLocalInstructions( ObjField *el );
+	void initLocalRefInstructions( ObjField *el );
+
+	void initMapFunctions( GenericType *gen );
+	void initListField( GenericType *gen, const char *name, int offset );
+	void initListFields( GenericType *gen );
+	void initListFunctions( GenericType *gen );
+	void initVectorFunctions( GenericType *gen );
+
+	void addStdin();
+	void addStdout();
+	void addStderr();
+	void initGlobalFunctions();
+	void makeDefaultIterators();
+	void addLengthField( ObjectDef *objDef, Code getLength );
+	ObjectDef *findObject( const String &name );
+	void initAllLanguageObjects();
+	void resolveListElementOf( ObjectDef *container, ObjectDef *obj, ElementOf *elof );
+	void resolveMapElementOf( ObjectDef *container, ObjectDef *obj, ElementOf *elof );
+	void resolveElementOf( ObjectDef *obj );
+	void makeFuncVisible( Function *func, bool isUserIter );
+	void compileFunction( Function *func );
+	void compileUserIter( Function *func );
+	void compilePreEof( TokenRegion *region );
+	void compileRootBlock();
+	void compileTranslateBlock( KlangEl *langEl );
+	void findLocalTrees( CharSet &trees );
+	void compileReductionCode( Definition *prod );
+	void resolveGenericTypes();
+	void compileByteCode();
+
+	void resolveUses();
+	void createDefaultScanner();
+	void semanticAnalysis();
+
+	/*
+	 * Data collected during the parse.
+	 */
+
+	/* List of all language elements. */
+	LelList langEls;
+
+	/* The list of productions. */
+	DefList prodList;
+
+	/* Dumping. */
+	DotItemIndex dotItemIndex;
+
+	/* The name of the file the fsm is from, and the spec name. */
+	// EXISTS IN RL: char *fileName; 
+	String parserName;
+	ostream &out;
+	// EXISTS IN RL: InputLoc sectionLoc;
+
+	/* How to access the instance data. */
+	String access;
+
+	/* The name of the token structure. */
+	String tokenStruct;
+
+	GenericType *anyList;
+	GenericType *anyMap;
+	GenericType *anyVector;
+
+	KlangEl *ptrKlangEl;
+	KlangEl *boolKlangEl;
+	KlangEl *intKlangEl;
+	KlangEl *strKlangEl;
+	KlangEl *streamKlangEl;
+	KlangEl *anyKlangEl;
+	KlangEl *rootKlangEl;
+	KlangEl *eofKlangEl;
+	KlangEl *errorKlangEl;
+	KlangEl *defaultCharKlangEl;
+
+	TokenRegion *rootRegion;
+	TokenRegion *defaultRegion;
+	TokenRegion *eofTokenRegion;
+
+	Namespace *defaultNamespace;
+	Namespace *rootNamespace;
+
+	int nextSymbolId;
+	int firstNonTermId;
+
+	KlangEl **langElIndex;
+	PdaState *actionDestState;
+	DefSetSet prodSetSet;
+
+	Definition **prodIdIndex;
+	AlphSet literalSet;
+
+	PatternList patternList;
+	ReplList replList;
+
+	ObjectDef *globalObjectDef;
+
+	VectorTypeIdMap vectorTypeIdMap;
+	ObjectDef *curLocalFrame;
+
+	UniqueType *findUniqueType( int typeId );
+	UniqueType *findUniqueType( int typeId, KlangEl *langEl );
+	UniqueType *findUniqueType( int typeId, IterDef *iterDef );
+
+	UniqueType *uniqueTypeNil;
+	UniqueType *uniqueTypePtr;
+	UniqueType *uniqueTypeBool;
+	UniqueType *uniqueTypeInt;
+	UniqueType *uniqueTypeStr;
+	UniqueType *uniqueTypeStream;
+	UniqueType *uniqueTypeAny;
+
+	UniqueTypeMap uniqeTypeMap;
+
+	void initStrObject();
+	void initStreamObject();
+	void initIntObject();
+	void initTokenObjects();
+
+	ObjectDef *intObj;
+	ObjectDef *strObj;
+	ObjectDef *streamObj;
+	ObjectDef *tokenObj;
+
+	FsmTables *fsmTables;
+	RuntimeData *runtimeData;
+
+	int nextPatReplId;
+	int nextGenericId;
+
+	FunctionList functionList;
+	int nextFuncId;
+
+	enum CompileContext {
+		CompileTranslation,
+		CompileReduction,
+		CompileFunction,
+		CompileRoot
+	};
+
+	CompileContext compileContext;
+	LongVect returnJumps;
+	LongVect breakJumps;
+	Function *curFunction;
+
+	/* Loops fill this in for return statements to use. */
+	CodeVect *loopCleanup;
+
+	ObjField *makeDataEl();
+	ObjField *makePosEl();
+
+	IterDef *findIterDef( IterDef::Type type, GenericType *generic );
+	IterDef *findIterDef( IterDef::Type type, Function *func );
+	IterDef *findIterDef( IterDef::Type type );
+	IterDefSet iterDefSet;
+
+	enum GeneratesType { GenToken, GenIgnore, GenCfl };
+
+	int nextObjectId;
+	GeneratesType generatesType;
+	bool generatesIgnore;
+	bool insideRegion;
+	String tokenDefName;
+
+	StringMap literalStrings;
+
+	long nextFrameId;
+	long nextParserId;
+
+	ObjectDef *rootLocalFrame;
+
+	long nextLabelId;
+	ObjFieldMap *objFieldMap;
+};
+
+void afterOpMinimize( FsmGraph *fsm, bool lastInSeq = true );
+Key makeFsmKeyHex( char *str, const InputLoc &loc, ParseData *pd );
+Key makeFsmKeyDec( char *str, const InputLoc &loc, ParseData *pd );
+Key makeFsmKeyNum( char *str, const InputLoc &loc, ParseData *pd );
+Key makeFsmKeyChar( char c, ParseData *pd );
+void makeFsmKeyArray( Key *result, char *data, int len, ParseData *pd );
+void makeFsmUniqueKeyArray( KeySet &result, char *data, int len, 
+		bool caseInsensitive, ParseData *pd );
+FsmGraph *makeBuiltin( BuiltinMachine builtin, ParseData *pd );
+FsmGraph *dotFsm( ParseData *pd );
+FsmGraph *dotStarFsm( ParseData *pd );
+
+void errorStateLabels( const NameSet &locations );
+
+struct Parser;
+
+typedef AvlMap<String, Parser *, CmpStr> ParserDict;
+typedef AvlMapEl<String, Parser *> ParserDictEl;
+
+KlangEl *getKlangEl( ParseData *pd, Namespace *nspace,
+		const String &data, KlangEl::Type defType );
+
+#endif /* _PARSEDATA_H */
diff --git a/colm/parsetree.cpp b/colm/parsetree.cpp
new file mode 100644
index 00000000..86284867
--- /dev/null
+++ b/colm/parsetree.cpp
@@ -0,0 +1,2172 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <iomanip>
+#include <errno.h>
+#include <limits.h>
+#include <stdlib.h>
+
+/* Parsing. */
+#include "lmparse.h"
+#include "parsetree.h"
+
+using namespace std;
+ostream &operator<<( ostream &out, const NameRef &nameRef );
+ostream &operator<<( ostream &out, const NameInst &nameInst );
+ostream &operator<<( ostream &out, const Token &token );
+
+/* Decode a literal as delivered by the scanner: strip the surrounding quotes,
+ * interpret backslash escapes and pick up trailing option letters. The
+ * original notes that the result is also null terminated, but the parser must
+ * not depend on that when interpreting literals, since a literal may itself
+ * contain \0. */
+void prepareLitString( String &result, bool &caseInsensitive, 
+		const String &srcString, const InputLoc &loc )
+{
+	result.setAs( String::Fresh(), srcString.length() );
+	caseInsensitive = false;
+
+	char *in = srcString.data + 1;
+	char *last = srcString.data + srcString.length() - 1;
+
+	/* Walk back over the option letters until the closing quote. */
+	for ( ; *last != '\'' && *last != '\"'; last-- ) {
+		if ( *last != 'i' ) {
+			error( loc ) << "literal string '" << *last << 
+					"' option not supported" << endl;
+		}
+		else
+			caseInsensitive = true;
+	}
+
+	char *out = result.data;
+	int used = 0;
+	while ( in != last ) {
+		if ( *in != '\\' ) {
+			out[used++] = *in++;
+			continue;
+		}
+		/* Escape: the character after the backslash selects the output. */
+		switch ( in[1] ) {
+		case '0': out[used++] = '\0'; break;
+		case 'a': out[used++] = '\a'; break;
+		case 'b': out[used++] = '\b'; break;
+		case 't': out[used++] = '\t'; break;
+		case 'n': out[used++] = '\n'; break;
+		case 'v': out[used++] = '\v'; break;
+		case 'f': out[used++] = '\f'; break;
+		case 'r': out[used++] = '\r'; break;
+		case '\n':  break;
+		default: out[used++] = in[1]; break;
+		}
+		in += 2;
+	}
+
+	result.chop( used );
+}
+
+int CmpUniqueType::compare( const UniqueType &ut1, const UniqueType &ut2 )
+{
+	/* Order by type id first. */
+	if ( ut1.typeId != ut2.typeId )
+		return ut1.typeId < ut2.typeId ? -1 : 1;
+
+	/* Same type id: tree, pointer and reference types are told apart by
+	 * the language element they refer to. */
+	const bool byLangEl = ut1.typeId == TYPE_TREE ||
+			ut1.typeId == TYPE_PTR ||
+			ut1.typeId == TYPE_REF;
+
+	if ( byLangEl ) {
+		if ( ut1.langEl != ut2.langEl )
+			return ut1.langEl < ut2.langEl ? -1 : 1;
+	}
+	else if ( ut1.typeId == TYPE_ITER ) {
+		/* Iterator types are told apart by their iterator definition. */
+		if ( ut1.iterDef != ut2.iterDef )
+			return ut1.iterDef < ut2.iterDef ? -1 : 1;
+	}
+	else {
+		/* Fail on anything unimplemented. */
+		assert( false );
+	}
+
+	return 0;
+}
+
+
+FsmGraph *VarDef::walk( ParseData *pd )
+{
+	/* The definition body is evaluated inside its own name scope. */
+	NameFrame savedFrame = pd->enterNameScope( true, 1 );
+
+	/* Build the machine for the right-hand side. */
+	FsmGraph *fsm = joinOrLm->walk( pd );
+
+	/* Transfer local error actions registered under this name, if any. */
+	LocalErrDictEl *errEl = pd->localErrDict.find( name );
+	if ( errEl != 0 ) {
+		for ( StateList::Iter st = fsm->stateList; st.lte(); st++ )
+			fsm->transferErrorActions( st, errEl->value );
+	}
+
+	/* A join of several expressions has already had its epsilon
+	 * transitions resolved. A join holding a single expression has not,
+	 * so run the epsilon op here. */
+	if ( joinOrLm->type == JoinOrLm::JoinType && 
+			joinOrLm->join->exprList.length() == 1 )
+		fsm->epsilonOp();
+
+	/* Entry points that are no longer used can be unset now. */
+	pd->unsetObsoleteEntries( fsm );
+
+	/* Only a referenced variable name gets an entry point in the graph. */
+	if ( pd->curNameInst->numRefs > 0 )
+		fsm->setEntry( pd->curNameInst->id, fsm->startState );
+
+	/* Leave the name scope. */
+	pd->popNameScope( savedFrame );
+	return fsm;
+}
+
+void VarDef::makeNameTree( const InputLoc &loc, ParseData *pd )
+{
+	/* Open a named scope for this definition, remembering the outer one. */
+	NameInst *outerInst = pd->curNameInst;
+	NameInst *ownInst = pd->addNameInst( loc, name, false );
+	pd->curNameInst = ownInst;
+
+	/* Flag scopes whose body is a longest-match construct. */
+	if ( joinOrLm->type == JoinOrLm::LongestMatchType )
+		ownInst->isLongestMatch = true;
+
+	/* Descend into the body, then restore the enclosing scope. */
+	joinOrLm->makeNameTree( pd );
+	pd->curNameInst = outerInst;
+}
+
+void VarDef::resolveNameRefs( ParseData *pd )
+{
+	/* Name references in the body are resolved inside this definition's
+	 * own scope. */
+	NameFrame savedFrame = pd->enterNameScope( true, 1 );
+
+	joinOrLm->resolveNameRefs( pd );
+
+	/* Restore the enclosing scope. */
+	pd->popNameScope( savedFrame );
+}
+
+InputLoc TokenDef::getLoc()
+{	/* Location of the action when present, otherwise that of semiLoc. */
+	return action == 0 ? semiLoc : action->loc;
+}
+
+/*
+ * If there are any LMs then all of the following entry points must reset
+ * tokstart:
+ *
+ *  1. fentry(StateRef)
+ *  2. fgoto(StateRef), fcall(StateRef), fnext(StateRef)
+ *  3. target of any transition that has an fcall (the return loc).
+ *  4. start state of all longest match routines.
+ */
+
+Action *TokenRegion::newAction( ParseData *pd, const InputLoc &loc, 
+		const String &name, InlineList *inlineList )
+{
+	Action *lmAction = new Action( loc, name, inlineList );
+	pd->actionList.append( lmAction );
+	lmAction->isLmAction = true;	/* mark as a longest-match action */
+	return lmAction;
+}
+
+/* Create the actions embedded by the longest-match construction: for each
+ * token definition one action to set the act id, one to run on the last
+ * character, one to run on the next character and one for the lag-behind
+ * case, plus a single select action for the region. The per-token actions
+ * are created here so that they will go into the actionIndex. All of them
+ * are registered through newAction(). */
+void TokenRegion::makeActions( ParseData *pd )
+{
+	/* Scratch buffer for action names. newAction() takes the name as a
+	 * const String reference (String is assumed to copy the characters it
+	 * is built from), so the stack is enough and no heap array is leaked
+	 * per generated name. */
+	char actName[50];
+
+	/* Make actions that set the action id. */
+	for ( TokenDefList::Iter lmi = tokenDefList; lmi.lte(); lmi++ ) {
+		InlineList *inlineList = new InlineList;
+		inlineList->append( new InlineItem( lmi->getLoc(), this, lmi, 
+				InlineItem::LmSetActId ) );
+		snprintf( actName, sizeof(actName), "store%i", lmi->longestMatchId );
+		lmi->setActId = newAction( pd, lmi->getLoc(), actName, inlineList );
+	}
+
+	/* Make actions that execute the user action and restart on the last character. */
+	for ( TokenDefList::Iter lmi = tokenDefList; lmi.lte(); lmi++ ) {
+		InlineList *inlineList = new InlineList;
+		inlineList->append( new InlineItem( lmi->getLoc(), this, lmi, 
+				InlineItem::LmOnLast ) );
+		snprintf( actName, sizeof(actName), "imm%i", lmi->longestMatchId );
+		lmi->actOnLast = newAction( pd, lmi->getLoc(), actName, inlineList );
+	}
+
+	/* Make actions that execute the user action and restart on the next
+	 * character.  These actions will set tokend themselves (it is the current
+	 * char). */
+	for ( TokenDefList::Iter lmi = tokenDefList; lmi.lte(); lmi++ ) {
+		InlineList *inlineList = new InlineList;
+		inlineList->append( new InlineItem( lmi->getLoc(), this, lmi, 
+				InlineItem::LmOnNext ) );
+		snprintf( actName, sizeof(actName), "lagh%i", lmi->longestMatchId );
+		lmi->actOnNext = newAction( pd, lmi->getLoc(), actName, inlineList );
+	}
+
+	/* Make actions that execute the user action and restart at tokend. These
+	 * actions execute some time after matching the last char. */
+	for ( TokenDefList::Iter lmi = tokenDefList; lmi.lte(); lmi++ ) {
+		InlineList *inlineList = new InlineList;
+		inlineList->append( new InlineItem( lmi->getLoc(), this, lmi, 
+				InlineItem::LmOnLagBehind ) );
+		snprintf( actName, sizeof(actName), "lag%i", lmi->longestMatchId );
+		lmi->actLagBehind = newAction( pd, lmi->getLoc(), actName, inlineList );
+	}
+
+	InputLoc loc;
+	loc.line = 1;
+	loc.col = 1;
+
+	/* Create the error action. */
+	InlineList *il6 = new InlineList;
+	il6->append( new InlineItem( loc, this, 0, InlineItem::LmSwitch ) );
+	lmActSelect = newAction( pd, loc, "lagsel", il6 );
+}
+
+void TokenRegion::findName( ParseData *pd )
+{
+	/* Climb from the current name instance to the nearest named ancestor.
+	 * Every machine has a name, so the climb must end before running off
+	 * the top of the tree. */
+	NameInst *inst = pd->curNameInst;
+	for ( ; inst->name == 0; inst = inst->parent )
+		assert( inst->parent != 0 );
+
+	name = inst->name;
+}
+
+void TokenRegion::makeNameTree( ParseData *pd )
+{
+	/* Open an anonymous scope for the region. It is used for restarting
+	 * the machine after a token has been matched. */
+	NameInst *outerInst = pd->curNameInst;
+	pd->curNameInst = pd->addNameInst( loc, 0, false );
+
+	/* Remember the region's name inst. A token region is referenced only
+	 * once (near the root of the name tree), so there can be just one
+	 * corresponding name inst and it must not have been set already. */
+	assert( regionNameInst == 0 );
+	regionNameInst = pd->curNameInst;
+
+	/* Descend into the pattern of every token definition that has one;
+	 * patternless tokens carry no join. */
+	for ( TokenDefList::Iter td = tokenDefList; td.lte(); td++ ) {
+		if ( td->join == 0 )
+			continue;
+		td->join->makeNameTree( pd );
+	}
+
+	/* Search upwards in the name tree for a name for this region. */
+	findName( pd );
+
+	/* The region's actions are created at this point as well. */
+	makeActions( pd );
+
+	/* Close the scope. */
+	pd->curNameInst = outerInst;
+}
+
+void TokenRegion::resolveNameRefs( ParseData *pd )
+{
+	/* Resolve inside the region's own name scope. */
+	NameFrame savedFrame = pd->enterNameScope( true, 1 );
+
+	/* Visit each token definition, skipping those without a pattern. */
+	for ( TokenDefList::Iter td = tokenDefList; td.lte(); td++ ) {
+		if ( td->join == 0 )
+			continue;
+		td->join->resolveNameRefs( pd );
+	}
+
+	/* Leave the region's scope. */
+	pd->popNameScope( savedFrame );
+}
+
+void TokenRegion::restart( FsmGraph *graph, FsmTrans *trans )
+{
+	FsmState *src = trans->fromState;	/* saved before detaching */
+	graph->detachTrans( src, trans->toState, trans );
+	graph->attachTrans( src, graph->startState, trans );	/* back to start */
+}
+
+/* Turn the union of a region's token machines into a longest-match scanner.
+ * Fills the per-state lmItemSet, embeds the token start/end, act id and
+ * user actions, sends matches back to the start state and makes it final. */
+void TokenRegion::runLongestMatch( ParseData *pd, FsmGraph *graph )
+{
+	/* States marked when searching from the start state get the 0 item. */
+	graph->markReachableFromHereStopFinal( graph->startState );
+	for ( StateList::Iter ms = graph->stateList; ms.lte(); ms++ ) {
+		if ( ms->stateBits & SB_ISMARKED ) {
+			ms->lmItemSet.insert( 0 );
+			ms->stateBits &= ~ SB_ISMARKED;
+		}
+	}
+
+	/* Transfer the first item of non-empty lmAction tables to the item sets
+	 * of the states that follow. Exclude states that have no transitions out.
+	 * This must happen on a separate pass so that on each iteration of the
+	 * next pass we have the item set entries from all lmAction tables. */
+	for ( StateList::Iter st = graph->stateList; st.lte(); st++ ) {
+		for ( TransList::Iter trans = st->outList; trans.lte(); trans++ ) {
+			if ( trans->lmActionTable.length() > 0 ) {
+				LmActionTableEl *lmAct = trans->lmActionTable.data;
+				FsmState *toState = trans->toState;
+				assert( toState );
+
+				/* Check if there are transitions out, this may be a very
+				 * close approximation? Out transitions going nowhere?
+				 * FIXME: Check. */
+				if ( toState->outList.length() > 0 ) {
+					/* Fill the item sets. */
+					graph->markReachableFromHereStopFinal( toState );
+					for ( StateList::Iter ms = graph->stateList; ms.lte(); ms++ ) {
+						if ( ms->stateBits & SB_ISMARKED ) {
+							ms->lmItemSet.insert( lmAct->value );
+							ms->stateBits &= ~ SB_ISMARKED;
+						}
+					}
+				}
+			}
+		}
+	}
+
+	/* The lmItem sets are now filled, telling us which longest match rules
+	 * can succeed in which states. First determine if we need to make sure
+	 * act is defaulted to zero. */
+	int maxItemSetLength = 0;
+	graph->markReachableFromHereStopFinal( graph->startState );
+	for ( StateList::Iter ms = graph->stateList; ms.lte(); ms++ ) {
+		if ( ms->stateBits & SB_ISMARKED ) {
+			if ( ms->lmItemSet.length() > maxItemSetLength )
+				maxItemSetLength = ms->lmItemSet.length();
+			ms->stateBits &= ~ SB_ISMARKED;
+		}
+	}
+
+	/* The actions executed on starting to match a token. */
+	graph->isolateStartState();
+	graph->startState->fromStateActionTable.setAction( pd->setTokStartOrd, pd->setTokStart );
+	if ( maxItemSetLength > 1 ) {
+		/* The longest match action switch may be called when tokens are
+		 * matched, in which case act must be initialized, there must be a
+		 * case to handle the error, and the generated machine will require an
+		 * error state. */
+		lmSwitchHandlesError = true;
+		graph->startState->toStateActionTable.setAction( pd->initActIdOrd, pd->initActId );
+	}
+
+	/* The place to store transitions to restart. It may be possible for the
+	 * restarting to affect the searching through the graph that follows, so
+	 * take the safe route and defer all restarts until searching is done. */
+	Vector<FsmTrans*> restartTrans;
+
+	/* Set actions that do immediate token recognition, set the longest match part
+	 * id and set the token ending. */
+	for ( StateList::Iter st = graph->stateList; st.lte(); st++ ) {
+		for ( TransList::Iter trans = st->outList; trans.lte(); trans++ ) {
+			if ( trans->lmActionTable.length() > 0 ) {
+				LmActionTableEl *lmAct = trans->lmActionTable.data;
+				FsmState *toState = trans->toState;
+				assert( toState );
+
+				/* Are there transitions out? Same approximation as above. FIXME: Check. */
+				if ( toState->outList.length() == 0 ) {
+					/* Can execute the immediate action for the longest match
+					 * part. Redirect the action to the start state. */
+					trans->actionTable.setAction( lmAct->key, 
+							lmAct->value->actOnLast );
+					restartTrans.append( trans );
+				}
+				else {
+					/* Look for non final states that have a non-empty item
+					 * set; if present we need to record the end of the token.
+					 * Also find the highest item set length reachable from
+					 * here (excluding transitions to final states). */
+					bool nonFinalNonEmptyItemSet = false;
+					maxItemSetLength = 0;
+					graph->markReachableFromHereStopFinal( toState );
+					for ( StateList::Iter ms = graph->stateList; ms.lte(); ms++ ) {
+						if ( ms->stateBits & SB_ISMARKED ) {
+							if ( ms->lmItemSet.length() > 0 && !ms->isFinState() )
+								nonFinalNonEmptyItemSet = true;
+							if ( ms->lmItemSet.length() > maxItemSetLength )
+								maxItemSetLength = ms->lmItemSet.length();
+							ms->stateBits &= ~ SB_ISMARKED;
+						}
+					}
+
+					/* If there are reachable states that are not final and
+					 * have non empty item sets or that have an item set
+					 * length greater than one then we need to set tokend
+					 * because the error action that matches the token will
+					 * require it. */
+					if ( nonFinalNonEmptyItemSet || maxItemSetLength > 1 )
+						trans->actionTable.setAction( pd->setTokEndOrd, pd->setTokEnd );
+
+					/* Some states may not know which longest match item to
+					 * execute, must set it. */
+					if ( maxItemSetLength > 1 ) {
+						/* There are transitions out, another match may come. */
+						trans->actionTable.setAction( lmAct->key, 
+								lmAct->value->setActId );
+					}
+				}
+			}
+		}
+	}
+
+	/* Now that all graph searching is done it is certainly safe to set the
+	 * restarting. It may be safe above, however this must be verified. */
+	for ( Vector<FsmTrans*>::Iter pt = restartTrans; pt.lte(); pt++ )
+		restart( graph, *pt );
+
+	int lmErrActionOrd = pd->curActionOrd++;
+
+	/* Embed the error for recognizing a char. */
+	for ( StateList::Iter st = graph->stateList; st.lte(); st++ ) {
+		if ( st->lmItemSet.length() == 1 && st->lmItemSet[0] != 0 ) {
+			if ( st->isFinState() ) {
+				/* On error execute the actOnNext action, which knows that
+				 * the last character of the token was one back and restart. */
+				graph->setErrorTarget( st, graph->startState, &lmErrActionOrd, 
+						&st->lmItemSet[0]->actOnNext, 1 );
+				st->eofActionTable.setAction( lmErrActionOrd, 
+						st->lmItemSet[0]->actOnNext );
+				st->eofTarget = graph->startState;
+			}
+			else {
+				graph->setErrorTarget( st, graph->startState, &lmErrActionOrd, 
+						&st->lmItemSet[0]->actLagBehind, 1 );
+				st->eofActionTable.setAction( lmErrActionOrd, 
+						st->lmItemSet[0]->actLagBehind );
+				st->eofTarget = graph->startState;
+			}
+		}
+		else if ( st->lmItemSet.length() > 1 ) {
+			/* Need to use the select. Take note of which items the select
+			 * is needed for so only the necessary actions are included. */
+			for ( LmItemSet::Iter plmi = st->lmItemSet; plmi.lte(); plmi++ ) {
+				if ( *plmi != 0 )
+					(*plmi)->inLmSelect = true;
+			}
+			/* On error, execute the action select and go to the start state. */
+			graph->setErrorTarget( st, graph->startState, &lmErrActionOrd, 
+					&lmActSelect, 1 );
+			st->eofActionTable.setAction( lmErrActionOrd, lmActSelect );
+			st->eofTarget = graph->startState;
+		}
+	}
+	
+	/* Finally, the start state should be made final. */
+	graph->setFinState( graph->startState );
+}
+
+void TokenRegion::transferScannerLeavingActions( FsmGraph *graph )
+{
+	/* States with a non-empty out action table get it set as error actions. */
+	for ( StateList::Iter s = graph->stateList; s.lte(); s++ )
+		if ( s->outActionTable.length() > 0 )
+			graph->setErrorActions( s, s->outActionTable );
+}
+
+/* Build the scanner machine for this region from the patterns of its token
+ * definitions. A region without any pattern yields the lambda machine. */
+FsmGraph *TokenRegion::walk( ParseData *pd )
+{
+	/* The longest match has its own name scope. */
+	NameFrame nameFrame = pd->enterNameScope( true, 1 );
+
+	/* Make each part of the longest match. */
+	int numParts = 0;
+	FsmGraph **parts = new FsmGraph*[tokenDefList.length()];
+	for ( TokenDefList::Iter lmi = tokenDefList; lmi.lte(); lmi++ ) {
+		/* Watch out for patternless tokens. */
+		if ( lmi->join != 0 ) {
+			/* Create the machine and embed the setting of the longest match id. */
+			parts[numParts] = lmi->join->walk( pd );
+			parts[numParts]->longMatchAction( pd->curActionOrd++, lmi );
+			/* The first token accepting the zero-length word is the default. */
+			if ( defaultTokenDef == 0 && parts[numParts]->startState->isFinState() )
+				defaultTokenDef = lmi;
+
+			numParts += 1;
+		}
+	}
+
+	if ( defaultTokenDef != 0 && defaultTokenDef->token->ignore )
+		error() << "ignore token cannot be a scanner's zero-length token" << endp;
+
+	/* parts[0] holds a machine only when numParts is non-zero. */
+	FsmGraph *retFsm = 0;
+	if ( numParts == 0 ) {
+		/* The region is empty. Return the empty set. */
+		retFsm = new FsmGraph();
+		retFsm->lambdaFsm();
+	}
+	else {
+		/* Before the union, leaving actions are transferred to error
+		 * transitions out of the final states (like local error actions).
+		 * The scanner must forbid on_last for such final states. */
+		for ( int i = 0; i < numParts; i++ )
+			transferScannerLeavingActions( parts[i] );
+
+		/* Union machines one and up with machine zero. */
+		retFsm = parts[0];
+		for ( int i = 1; i < numParts; i++ ) {
+			retFsm->unionOp( parts[i] );
+			afterOpMinimize( retFsm );
+		}
+
+		runLongestMatch( pd, retFsm );
+	}
+
+	/* Release the part array on every path, then pop the name scope. */
+	delete[] parts;
+	pd->popNameScope( nameFrame );
+
+	return retFsm;
+}
+
+FsmGraph *JoinOrLm::walk( ParseData *pd )
+{
+	/* Delegate to the join or to the token region, depending on which
+	 * alternative this node holds. */
+	if ( type == JoinType )
+		return join->walk( pd );
+
+	if ( type == LongestMatchType )
+		return tokenRegion->walk( pd );
+
+	/* Neither alternative: there is no machine to return. */
+	return 0;
+}
+
+void JoinOrLm::makeNameTree( ParseData *pd )
+{
+	/* Forward to the join or the token region, whichever is held. A type
+	 * that is neither results in no action. */
+	if ( type == JoinType ) {
+		join->makeNameTree( pd );
+	}
+	else if ( type == LongestMatchType ) {
+		tokenRegion->makeNameTree( pd );
+	}
+}
+
+void JoinOrLm::resolveNameRefs( ParseData *pd )
+{
+	/* Forward to the join or the token region, whichever is held. A type
+	 * that is neither results in no action. */
+	if ( type == JoinType ) {
+		join->resolveNameRefs( pd );
+	}
+	else if ( type == LongestMatchType ) {
+		tokenRegion->resolveNameRefs( pd );
+	}
+}
+
+
+/* Construct a join from its source location and its first expression. */
+Join::Join( const InputLoc &loc, Expression *expr )
+:
+	loc(loc)	/* member loc is copied from the parameter of the same name */
+{
+	exprList.append( expr );
+}
+
+/* Construct a join from its first expression only; no location is given. */
+Join::Join( Expression *expr )
+:
+	loc()	/* value-initialise: there is no parameter to copy from */
+{
+	exprList.append( expr );
+}
+
+/* Build the machine: a real join for several expressions, else the lone one. */
+FsmGraph *Join::walk( ParseData *pd )
+{
+	const bool isRealJoin = exprList.length() > 1;
+	if ( !isRealJoin )
+		return exprList.head->walk( pd );
+	return walkJoin( pd );
+}
+
+/* Join the machines of all expressions in the list into one. */
+FsmGraph *Join::walkJoin( ParseData *pd )
+{
+	/* The join is evaluated in its own name scope, which is left again
+	 * before returning. */
+	NameFrame savedFrame = pd->enterNameScope( true, 1 );
+
+	/* Walk every expression, collecting the machines in list order. */
+	FsmGraph **machines = new FsmGraph*[exprList.length()];
+	int count = 0;
+	for ( ExprList::Iter expr = exprList; count < exprList.length(); expr++ )
+		machines[count++] = expr->walk( pd );
+
+	/* Pick up the scope's start and final names. Final is guaranteed to
+	 * exist, start is not. */
+	NameInst *startInst = pd->curNameInst->start;
+	NameInst *finalInst = pd->curNameInst->final;
+
+	/* An existing start name means an implicit link to the start machine;
+	 * record the reference. Otherwise the id stays at -1. */
+	int startId = -1;
+	if ( startInst != 0 ) {
+		pd->localNameScope->referencedNames.append( startInst );
+		startId = startInst->id;
+	}
+
+	/* A final id of -1 says that no epsilon references the final state,
+	 * in which case none is created and no entry point is set for it. */
+	int finalId = finalInst->numRefs > 0 ? finalInst->id : -1;
+
+	/* Machines 1 and up are joined onto machine 0. */
+	FsmGraph *joined = machines[0];
+	joined->joinOp( startId, finalId, machines+1, exprList.length()-1 );
+
+	/* Entry points that are no longer used can be unset now. */
+	pd->unsetObsoleteEntries( joined );
+
+	/* Leave the name scope and release the temporary array. */
+	pd->popNameScope( savedFrame );
+	delete[] machines;
+
+	return joined;
+}
+
+void Join::makeNameTree( ParseData *pd )
+{
+	if ( exprList.length() <= 1 ) {
+		/* Not a real join: descend into the single expression. */
+		exprList.head->makeNameTree( pd );
+		return;
+	}
+
+	/* A real join opens a new anonymous scope. */
+	NameInst *outerInst = pd->curNameInst;
+	NameInst *joinInst = pd->addNameInst( loc, 0, false );
+	pd->curNameInst = joinInst;
+
+	/* Join scopes need an implicit "final" target. */
+	joinInst->final = new NameInst( InputLoc(), joinInst, "final", 
+			pd->nextNameId++, false );
+
+	/* Descend into each expression, then close the scope again. */
+	for ( ExprList::Iter expr = exprList; expr.lte(); expr++ )
+		expr->makeNameTree( pd );
+
+	pd->curNameInst = outerInst;
+}
+
+
+void Join::resolveNameRefs( ParseData *pd )
+{
+	/* Without a real join there is only the single expression to visit,
+	 * and no scope of its own is entered. */
+	if ( exprList.length() <= 1 ) {
+		exprList.head->resolveNameRefs( pd );
+		return;
+	}
+
+	/* A real join resolves inside its own scope. */
+	NameFrame savedFrame = pd->enterNameScope( true, 1 );
+
+	/* Look for start labels in the join scope. A join is expected to
+	 * contain one. */
+	NameSet startLabels = pd->resolvePart( pd->localNameScope, "start", true );
+	if ( startLabels.length() > 0 ) {
+		/* The first one found is used. */
+		pd->curNameInst->start = startLabels[0];
+		if ( startLabels.length() > 1 ) {
+			/* Any further ones are reported as an error. */
+			error(loc) << "multiple start labels" << endl;
+			errorStateLabels( startLabels );
+		}
+	}
+
+	if ( pd->curNameInst->start == 0 ) {
+		/* No start label. Complain, then carry on: nothing is added to
+		 * recover from the problem. */
+		error(loc) << "no start label" << endl;
+	}
+	else {
+		/* The join refers to its start name implicitly. */
+		pd->curNameInst->start->numRefs += 1;
+	}
+
+	/* Visit each expression of the list. */
+	for ( ExprList::Iter expr = exprList; expr.lte(); expr++ )
+		expr->resolveNameRefs( pd );
+
+	/* Leave the join's scope. */
+	pd->popNameScope( savedFrame );
+}
+
+/* Release the sub-nodes this expression node holds. */
+Expression::~Expression()
+{
+	const bool isBinary = type == OrType || type == IntersectType ||
+			type == SubtractType || type == StrongSubtractType;
+	if ( isBinary ) {
+		/* Binary operators hold both an expression and a term. */
+		delete expression;
+		delete term;
+	}
+	else if ( type == TermType ) {
+		/* A plain term node holds only the term. */
+		delete term;
+	}
+	/* Nothing is released for builtins. */
+}
+
+/* Build the machine for one expression node. */
+FsmGraph *Expression::walk( ParseData *pd, bool lastInSeq )
+{
+	FsmGraph *machine = 0;
+	switch ( type ) {
+		case OrType: {
+			/* Left operand; walked with lastInSeq switched off. */
+			machine = expression->walk( pd, false );
+			/* Right operand. */
+			FsmGraph *operand = term->walk( pd );
+			/* Union the two. */
+			machine->unionOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case IntersectType: {
+			/* Left operand. */
+			machine = expression->walk( pd );
+			/* Right operand. */
+			FsmGraph *operand = term->walk( pd );
+			/* Intersect the two. */
+			machine->intersectOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case SubtractType: {
+			/* Left operand. */
+			machine = expression->walk( pd );
+			/* Right operand. */
+			FsmGraph *operand = term->walk( pd );
+			/* Take the right operand away from the left. */
+			machine->subtractOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case StrongSubtractType: {
+			/* Left operand. */
+			machine = expression->walk( pd );
+
+			/* Right operand, with an any* machine on either side of it. */
+			FsmGraph *operand = dotStarFsm( pd );
+			FsmGraph *inner = term->walk( pd );
+			FsmGraph *trailing = dotStarFsm( pd );
+			operand->concatOp( inner );
+			operand->concatOp( trailing );
+
+			/* Take the padded operand away from the left. */
+			machine->subtractOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case TermType: {
+			/* A plain term: its machine is the result. */
+			machine = term->walk( pd );
+			break;
+		}
+		case BuiltinType: {
+			/* A builtin: make a fresh machine for it. */
+			machine = makeBuiltin( builtin, pd );
+			break;
+		}
+	}
+
+	return machine;
+}
+
+void Expression::makeNameTree( ParseData *pd )
+{
+	/* Binary operators descend into the left operand first, then the
+	 * term. Nothing is visited for builtins. */
+	switch ( type ) {
+	case BuiltinType:
+		break;
+	case TermType:
+		term->makeNameTree( pd );
+		break;
+	case OrType: case IntersectType:
+	case SubtractType: case StrongSubtractType:
+		expression->makeNameTree( pd );
+		term->makeNameTree( pd );
+		break;
+	}
+}
+
+void Expression::resolveNameRefs( ParseData *pd )
+{
+	/* Binary operators descend into the left operand first, then the
+	 * term. Nothing is visited for builtins. */
+	switch ( type ) {
+	case BuiltinType:
+		break;
+	case TermType:
+		term->resolveNameRefs( pd );
+		break;
+	case OrType: case IntersectType:
+	case SubtractType: case StrongSubtractType:
+		expression->resolveNameRefs( pd );
+		term->resolveNameRefs( pd );
+		break;
+	}
+}
+
+/* Release the sub-nodes held by a term node. */
+Term::~Term()
+{
+	switch ( type ) {
+		case FactorWithAugType:
+			/* Only the factor is released for this form. */
+			delete factorWithAug;
+			break;
+		case ConcatType: case RightStartType:
+		case RightFinishType: case LeftType:
+			/* Concatenation forms release a term and a factor. */
+			delete term;
+			delete factorWithAug;
+			break;
+	}
+}
+
+/* Build the machine for one term node. */
+FsmGraph *Term::walk( ParseData *pd, bool lastInSeq )
+{
+	FsmGraph *machine = 0;
+	switch ( type ) {
+		case ConcatType: {
+			/* Left operand; walked with lastInSeq switched off. */
+			machine = term->walk( pd, false );
+			/* Right operand: the factor with augmentation. */
+			FsmGraph *operand = factorWithAug->walk( pd );
+			/* Concatenate the two. */
+			machine->concatOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case RightStartType: {
+			/* Left operand. */
+			machine = term->walk( pd );
+
+			/* Right operand: the factor with augmentation. */
+			FsmGraph *operand = factorWithAug->walk( pd );
+
+			/* First descriptor: a fresh key with priority 0, put on all
+			 * transitions of the left machine. */
+			priorDescs[0].key = pd->nextPriorKey++;
+			priorDescs[0].priority = 0;
+			machine->allTransPrior( pd->curPriorOrd++, &priorDescs[0] );
+
+			/* Second descriptor: the same key with priority 1, put on the
+			 * start transitions of the right machine. */
+			priorDescs[1].key = priorDescs[0].key;
+			priorDescs[1].priority = 1;
+			operand->startFsmPrior( pd->curPriorOrd++, &priorDescs[1] );
+
+			/* Concatenate the two. */
+			machine->concatOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case RightFinishType: {
+			/* Left operand. */
+			machine = term->walk( pd );
+
+			/* Right operand: the factor with augmentation. */
+			FsmGraph *operand = factorWithAug->walk( pd );
+
+			/* First descriptor: a fresh key with priority 0, put on all
+			 * transitions of the left machine. The finishing transitions
+			 * of the right machine get the higher priority below. */
+			priorDescs[0].key = pd->nextPriorKey++;
+			priorDescs[0].priority = 0;
+			machine->allTransPrior( pd->curPriorOrd++, &priorDescs[0] );
+
+			/* Second descriptor: the same key with priority 1, put on the
+			 * finishing transitions of the right machine. */
+			priorDescs[1].key = priorDescs[0].key;
+			priorDescs[1].priority = 1;
+			operand->finishFsmPrior( pd->curPriorOrd++, &priorDescs[1] );
+
+			/* Concatenate the two. */
+			machine->concatOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case LeftType: {
+			/* Left operand. */
+			machine = term->walk( pd );
+
+			/* Right operand: the factor with augmentation. */
+			FsmGraph *operand = factorWithAug->walk( pd );
+
+			/* First descriptor: a fresh key with priority 1, put on all
+			 * transitions of the left machine. */
+			priorDescs[0].key = pd->nextPriorKey++;
+			priorDescs[0].priority = 1;
+			machine->allTransPrior( pd->curPriorOrd++, &priorDescs[0] );
+
+			/* Second descriptor: the same key with priority 0 for the
+			 * right machine. Since startTransPrior might unnecessarily
+			 * increase the number of states during construction (due to
+			 * isolation), allTransPrior is used instead, which has the
+			 * same effect. */
+			priorDescs[1].key = priorDescs[0].key;
+			priorDescs[1].priority = 0;
+			operand->allTransPrior( pd->curPriorOrd++, &priorDescs[1] );
+
+			/* Concatenate the two. */
+			machine->concatOp( operand );
+			afterOpMinimize( machine, lastInSeq );
+			break;
+		}
+		case FactorWithAugType: {
+			machine = factorWithAug->walk( pd );
+			break;
+		}
+	}
+	return machine;
+}
+
+void Term::makeNameTree( ParseData *pd )
+{
+	/* Concatenation forms descend into the term first and then into the
+	 * factor; the remaining form has only the factor. */
+	switch ( type ) {
+	case FactorWithAugType:
+		factorWithAug->makeNameTree( pd );
+		break;
+	case ConcatType: case RightStartType:
+	case RightFinishType: case LeftType:
+		term->makeNameTree( pd );
+		factorWithAug->makeNameTree( pd );
+		break;
+	}
+}
+
+void Term::resolveNameRefs( ParseData *pd )
+{
+	/* Concatenation forms descend into the term first and then into the
+	 * factor; the remaining form has only the factor. */
+	switch ( type ) {
+	case FactorWithAugType:
+		factorWithAug->resolveNameRefs( pd );
+		break;
+	case ConcatType: case RightStartType:
+	case RightFinishType: case LeftType:
+		term->resolveNameRefs( pd );
+		factorWithAug->resolveNameRefs( pd );
+		break;
+	}
+}
+
+/* Release what a factor-with-augmentation node owns. */
+FactorWithAug::~FactorWithAug()
+{
+	/* The wrapped factor. */
+	delete factorWithRep;
+
+	/* The priority descriptor array. No null test is needed here, since
+	 * delete[] on a null pointer does nothing. Nothing is released for
+	 * the entries of the actions vector. */
+	delete[] priorDescs;
+}
+
+void FactorWithAug::assignActions( ParseData *pd, FsmGraph *graph, int *actionOrd )
+{
+	/* Embed actions[i] into graph with ordering actionOrd[i], dispatching on the action type. pd is not used here. */
+	for ( int i = 0; i < actions.length(); i++ )  {
+		switch ( actions[i].type ) {
+		/* Transition actions. As with every start variant below, the start case is followed by afterOpMinimize. */
+		case at_start:
+			graph->startFsmAction( actionOrd[i], actions[i].action );
+			afterOpMinimize( graph );
+			break;
+		case at_all:
+			graph->allTransAction( actionOrd[i], actions[i].action );
+			break;
+		case at_finish:
+			graph->finishFsmAction( actionOrd[i], actions[i].action );
+			break;
+		case at_leave:
+			graph->leaveFsmAction( actionOrd[i], actions[i].action );
+			break;
+
+		/* Global error actions. These pass 0 where the local variants pass localErrKey. */
+		case at_start_gbl_error:
+			graph->startErrorAction( actionOrd[i], actions[i].action, 0 );
+			afterOpMinimize( graph );
+			break;
+		case at_all_gbl_error:
+			graph->allErrorAction( actionOrd[i], actions[i].action, 0 );
+			break;
+		case at_final_gbl_error:
+			graph->finalErrorAction( actionOrd[i], actions[i].action, 0 );
+			break;
+		case at_not_start_gbl_error:
+			graph->notStartErrorAction( actionOrd[i], actions[i].action, 0 );
+			break;
+		case at_not_final_gbl_error:
+			graph->notFinalErrorAction( actionOrd[i], actions[i].action, 0 );
+			break;
+		case at_middle_gbl_error:
+			graph->middleErrorAction( actionOrd[i], actions[i].action, 0 );
+			break;
+
+		/* Local error actions. Same graph calls as the global ones, with the action's localErrKey as last argument. */
+		case at_start_local_error:
+			graph->startErrorAction( actionOrd[i], actions[i].action,
+					actions[i].localErrKey );
+			afterOpMinimize( graph );
+			break;
+		case at_all_local_error:
+			graph->allErrorAction( actionOrd[i], actions[i].action,
+					actions[i].localErrKey );
+			break;
+		case at_final_local_error:
+			graph->finalErrorAction( actionOrd[i], actions[i].action,
+					actions[i].localErrKey );
+			break;
+		case at_not_start_local_error:
+			graph->notStartErrorAction( actionOrd[i], actions[i].action,
+					actions[i].localErrKey );
+			break;
+		case at_not_final_local_error:
+			graph->notFinalErrorAction( actionOrd[i], actions[i].action,
+					actions[i].localErrKey );
+			break;
+		case at_middle_local_error:
+			graph->middleErrorAction( actionOrd[i], actions[i].action,
+					actions[i].localErrKey );
+			break;
+
+		/* EOF actions. */
+		case at_start_eof:
+			graph->startEOFAction( actionOrd[i], actions[i].action );
+			afterOpMinimize( graph );
+			break;
+		case at_all_eof:
+			graph->allEOFAction( actionOrd[i], actions[i].action );
+			break;
+		case at_final_eof:
+			graph->finalEOFAction( actionOrd[i], actions[i].action );
+			break;
+		case at_not_start_eof:
+			graph->notStartEOFAction( actionOrd[i], actions[i].action );
+			break;
+		case at_not_final_eof:
+			graph->notFinalEOFAction( actionOrd[i], actions[i].action );
+			break;
+		case at_middle_eof:
+			graph->middleEOFAction( actionOrd[i], actions[i].action );
+			break;
+
+		/* To state actions. */
+		case at_start_to_state:
+			graph->startToStateAction( actionOrd[i], actions[i].action );
+			afterOpMinimize( graph );
+			break;
+		case at_all_to_state:
+			graph->allToStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_final_to_state:
+			graph->finalToStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_not_start_to_state:
+			graph->notStartToStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_not_final_to_state:
+			graph->notFinalToStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_middle_to_state:
+			graph->middleToStateAction( actionOrd[i], actions[i].action );
+			break;
+
+		/* From state actions. */
+		case at_start_from_state:
+			graph->startFromStateAction( actionOrd[i], actions[i].action );
+			afterOpMinimize( graph );
+			break;
+		case at_all_from_state:
+			graph->allFromStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_final_from_state:
+			graph->finalFromStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_not_start_from_state:
+			graph->notStartFromStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_not_final_from_state:
+			graph->notFinalFromStateAction( actionOrd[i], actions[i].action );
+			break;
+		case at_middle_from_state:
+			graph->middleFromStateAction( actionOrd[i], actions[i].action );
+			break;
+
+		/* Remaining cases, prevented by the parser. Reaching one trips the assertion. */
+		default: 
+			assert( false );
+			break;
+		}
+	}
+}
+
+/* Embed the priority augmentations into graph. Entry n uses priorOrd[n] and priorDescs[n]. */
+void FactorWithAug::assignPriorities( FsmGraph *graph, int *priorOrd )
+{
+	for ( int n = 0; n < priorityAugs.length(); n++ ) {
+		PriorDesc *desc = priorDescs + n;
+		switch ( priorityAugs[n].type ) {
+		case at_start:
+			/* Start fsm priorities are the one case that may require
+			 * minimization afterwards. */
+			graph->startFsmPrior( priorOrd[n], desc );
+			afterOpMinimize( graph );
+			break;
+		case at_all:
+			graph->allTransPrior( priorOrd[n], desc );
+			break;
+		case at_finish:
+			graph->finishFsmPrior( priorOrd[n], desc );
+			break;
+		case at_leave:
+			graph->leaveFsmPrior( priorOrd[n], desc );
+			break;
+		default:
+			/* The parser prevents any other type. */
+			break;
+		}
+	}
+}
+
+/* Embed the conditions attached to this node into graph, by type. */
+void FactorWithAug::assignConditions( FsmGraph *graph )
+{
+	for ( int c = 0; c < conditions.length(); c++ ) {
+		if ( conditions[c].type == at_start ) {
+			/* The start case is followed by a minimization. */
+			graph->startFsmCondition( conditions[c].action );
+			afterOpMinimize( graph );
+		}
+		else if ( conditions[c].type == at_all ) {
+			/* Goes on with allTransCondition, no minimization. */
+			graph->allTransCondition( conditions[c].action );
+		}
+		else if ( conditions[c].type == at_leave ) {
+			/* Goes on with leaveFsmCondition, no minimization. */
+			graph->leaveFsmCondition( conditions[c].action );
+		}
+		/* Conditions of any other type are ignored. */
+	}
+}
+
+
+/* Evaluate a factor with augmentation node: walk the wrapped machine, then embed conditions, actions, priorities, epsilon transitions and label entry points. */
+FsmGraph *FactorWithAug::walk( ParseData *pd )
+{
+	/* Enter into the scopes created for the labels. */
+	NameFrame nameFrame = pd->enterNameScope( false, labels.length() );
+
+	/* Make the array of function orderings. It stays null when there are no actions. */
+	int *actionOrd = 0;
+	if ( actions.length() > 0 )
+		actionOrd = new int[actions.length()];
+	
+	/* First walk the list of actions, assigning order to all starting
+	 * actions. This happens before the wrapped machine is walked. */
+	for ( int i = 0; i < actions.length(); i++ ) {
+		if ( actions[i].type == at_start || 
+				actions[i].type == at_start_gbl_error ||
+				actions[i].type == at_start_local_error ||
+				actions[i].type == at_start_to_state ||
+				actions[i].type == at_start_from_state ||
+				actions[i].type == at_start_eof )
+			actionOrd[i] = pd->curActionOrd++;
+	}
+
+	/* Evaluate the factor with repetition. */
+	FsmGraph *rtnVal = factorWithRep->walk( pd );
+
+	/* Compute the remaining action orderings. The test is the exact complement of the one above. */
+	for ( int i = 0; i < actions.length(); i++ ) {
+		if ( actions[i].type != at_start && 
+				actions[i].type != at_start_gbl_error &&
+				actions[i].type != at_start_local_error &&
+				actions[i].type != at_start_to_state &&
+				actions[i].type != at_start_from_state &&
+				actions[i].type != at_start_eof )
+			actionOrd[i] = pd->curActionOrd++;
+	}
+
+	assignConditions( rtnVal );
+
+	assignActions( pd, rtnVal , actionOrd );
+
+	/* Make the array of priority orderings. Orderings are local to this walk
+	 * of the factor with augmentation. */
+	int *priorOrd = 0;
+	if ( priorityAugs.length() > 0 )
+		priorOrd = new int[priorityAugs.length()];
+	
+	/* Walk all priorities, assigning the priority ordering. */
+	for ( int i = 0; i < priorityAugs.length(); i++ )
+		priorOrd[i] = pd->curPriorOrd++;
+
+	/* If the priority descriptors have not been made, make them now.  Make
+	 * priority descriptors for each priority assignment that will be passed to
+	 * the fsm. Used to keep track of the key, value and used bit. */
+	if ( priorDescs == 0 && priorityAugs.length() > 0 ) {
+		priorDescs = new PriorDesc[priorityAugs.length()];
+		for ( int i = 0; i < priorityAugs.length(); i++ ) {
+			/* Init the prior descriptor for the priority setting. */
+			priorDescs[i].key = priorityAugs[i].priorKey;
+			priorDescs[i].priority = priorityAugs[i].priorValue;
+		}
+	}
+
+	/* Assign priorities into the machine. */
+	assignPriorities( rtnVal, priorOrd );
+
+	/* Assign epsilon transitions. One resolved link is consumed per epsilon link, resolved or not. */
+	for ( int e = 0; e < epsilonLinks.length(); e++ ) {
+		/* Get the name, which may not exist. If it doesn't then silently
+		 * ignore it because an error has already been reported. */
+		NameInst *epTarg = pd->epsilonResolvedLinks[pd->nextEpsilonResolvedLink++];
+		if ( epTarg != 0 ) {
+			/* Make the epsilon transitions. */
+			rtnVal->epsilonTrans( epTarg->id );
+
+			/* Note that we have made a link to the name. */
+			pd->localNameScope->referencedNames.append( epTarg );
+		}
+	}
+
+	/* Set entry points for labels. */
+	if ( labels.length() > 0 ) {
+		/* Pop the names. */
+		pd->resetNameScope( nameFrame );
+
+		/* Make labels that are referenced into entry points. */
+		for ( int i = 0; i < labels.length(); i++ ) {
+			pd->enterNameScope( false, 1 );
+
+			/* Will always be found. */
+			NameInst *name = pd->curNameInst;
+
+			/* If the name is referenced then set the entry point. */
+			if ( name->numRefs > 0 )
+				rtnVal->setEntry( name->id, rtnVal->startState );
+		}
+
+		pd->popNameScope( nameFrame );
+	}
+
+	if ( priorOrd != 0 )
+		delete[] priorOrd;
+	if ( actionOrd != 0 )
+		delete[] actionOrd;	
+	return rtnVal;
+}
+
+void FactorWithAug::makeNameTree( ParseData *pd )
+{
+	/* Remember the name that is current on entry. It is put back once the
+	 * labels and everything below this node have been added. */
+	NameInst *const savedNameInst = pd->curNameInst;
+
+	/* Each label makes a new scope, which then becomes the current one. */
+	for ( int lbl = 0; lbl < labels.length(); lbl++ )
+		pd->curNameInst = pd->addNameInst( labels[lbl].loc, labels[lbl].data, true );
+	factorWithRep->makeNameTree( pd );
+	pd->curNameInst = savedNameInst;
+}
+
+
+void FactorWithAug::resolveNameRefs( ParseData *pd )
+{
+	/* Resolve the epsilon link targets of this node. First enter into the name scope created by any labels. */
+	NameFrame nameFrame = pd->enterNameScope( false, labels.length() );
+
+	/* Recurse first. IMPORTANT: we must do the exact same traversal as when
+	 * the tree is constructed. */
+	factorWithRep->resolveNameRefs( pd );
+
+	/* Resolve epsilon transitions. */
+	for ( int ep = 0; ep < epsilonLinks.length(); ep++ ) {
+		/* Get the link. */
+		EpsilonLink &link = epsilonLinks[ep];
+		NameInst *resolvedName = 0;
+
+		if ( link.target.length() == 1 && strcmp( link.target.data[0], "final" ) == 0 ) {
+			/* Epsilon drawn to an implicit final state. An implicit final is
+			 * only available in join operations. */
+			resolvedName = pd->localNameScope->final;
+		}
+		else {
+			/* Do a search for the name, starting from the local name scope. */
+			NameSet resolved;
+			pd->resolveFrom( resolved, pd->localNameScope, link.target, 0 );
+			if ( resolved.length() > 0 ) {
+				/* Take the first one. */
+				resolvedName = resolved[0];
+				if ( resolved.length() > 1 ) {
+					/* Complain about the multiple references. */
+					error(link.loc) << "state reference " << link.target << 
+							" resolves to multiple entry points" << endl;
+					errorStateLabels( resolved );
+				}
+			}
+		}
+
+		/* This is tricky, we stuff resolved epsilon transitions into one long
+		 * vector in the parse data structure. Since the name resolution and
+		 * graph generation both do identical walks of the parse tree we
+		 * should always find the link resolutions in the right place.  */
+		pd->epsilonResolvedLinks.append( resolvedName );
+
+		if ( resolvedName != 0 ) {
+			/* Found the name, bump up the reference count on it. */
+			resolvedName->numRefs += 1;
+		}
+		else {
+			/* Complain, no recovery action, the epsilon op will ignore any
+			 * epsilon transitions whose names did not resolve. */
+			error(link.loc) << "could not resolve label " << link.target << endl;
+		}
+	}
+
+	if ( labels.length() > 0 )
+		pd->popNameScope( nameFrame );
+}
+
+
+/* Free the child of a factor with repetition node. The type picks the member. */
+FactorWithRep::~FactorWithRep()
+{
+	switch ( type ) {
+	case FactorWithNegType:
+		delete factorWithNeg;
+		break;
+	case StarType: case StarStarType: case OptionalType: case PlusType:
+	case ExactType: case MaxType: case MinType: case RangeType:
+		delete factorWithRep;
+		break;
+	}
+}
+
+/* Evaluate a factor with repetition node. Returns the machine of the child with the repetition operator of this node's type applied. */
+FsmGraph *FactorWithRep::walk( ParseData *pd )
+{
+	FsmGraph *retFsm = 0;
+
+	switch ( type ) {
+	case StarType: {
+		/* Evaluate the FactorWithRep. */
+		retFsm = factorWithRep->walk( pd );
+		if ( retFsm->startState->isFinState() ) {
+			warning(loc) << "applying kleene star to a machine that "
+					"accepts zero length word" << endl;
+		}
+
+		/* Shift over the start action orders then do the kleene star. */
+		pd->curActionOrd += retFsm->shiftStartActionOrder( pd->curActionOrd );
+		retFsm->starOp( );
+		afterOpMinimize( retFsm );
+		break;
+	}
+	case StarStarType: {
+		/* Evaluate the FactorWithRep. */
+		retFsm = factorWithRep->walk( pd );
+		if ( retFsm->startState->isFinState() ) {
+			warning(loc) << "applying kleene star to a machine that "
+					"accepts zero length word" << endl;
+		}
+
+		/* Set up the prior descs. All gets priority one, whereas leaving gets
+		 * priority zero. Make a unique key so that these priorities don't
+		 * interfere with any priorities set by the user. */
+		priorDescs[0].key = pd->nextPriorKey++;
+		priorDescs[0].priority = 1;
+		retFsm->allTransPrior( pd->curPriorOrd++, &priorDescs[0] );
+
+		/* Leaving gets priority 0. Use same unique key. */
+		priorDescs[1].key = priorDescs[0].key;
+		priorDescs[1].priority = 0;
+		retFsm->leaveFsmPrior( pd->curPriorOrd++, &priorDescs[1] );
+
+		/* Shift over the start action orders then do the kleene star. */
+		pd->curActionOrd += retFsm->shiftStartActionOrder( pd->curActionOrd );
+		retFsm->starOp( );
+		afterOpMinimize( retFsm );
+		break;
+	}
+	case OptionalType: {
+		/* Make the null fsm. */
+		FsmGraph *nu = new FsmGraph();
+		nu->lambdaFsm( );
+
+		/* Evaluate the FactorWithRep. */
+		retFsm = factorWithRep->walk( pd );
+
+		/* Perform the question operator: union with the null fsm. */
+		retFsm->unionOp( nu );
+		afterOpMinimize( retFsm );
+		break;
+	}
+	case PlusType: {
+		/* Evaluate the FactorWithRep. */
+		retFsm = factorWithRep->walk( pd );
+		if ( retFsm->startState->isFinState() ) {
+			warning(loc) << "applying plus operator to a machine that "
+					"accepts zero length word" << endl;
+		}
+
+		/* Need a duplicate for the star end. */
+		FsmGraph *dup = new FsmGraph( *retFsm );
+
+		/* The start func orders need to be shifted before doing the star. */
+		pd->curActionOrd += dup->shiftStartActionOrder( pd->curActionOrd );
+
+		/* Star the duplicate. */
+		dup->starOp( );
+		afterOpMinimize( dup );
+
+		retFsm->concatOp( dup );
+		afterOpMinimize( retFsm );
+		break;
+	}
+	case ExactType: {
+		/* Get an int from the repetition amount. */
+		if ( lowerRep == 0 ) {
+			/* No copies. Don't need to evaluate the factorWithRep. 
+			 * This defeats the purpose so give a warning. */
+			warning(loc) << "exactly zero repetitions results "
+					"in the null machine" << endl;
+
+			retFsm = new FsmGraph();
+			retFsm->lambdaFsm();
+		}
+		else {
+			/* Evaluate the first FactorWithRep. */
+			retFsm = factorWithRep->walk( pd );
+			if ( retFsm->startState->isFinState() ) {
+				warning(loc) << "applying repetition to a machine that "
+						"accepts zero length word" << endl;
+			}
+
+			/* The start func orders need to be shifted before doing the
+			 * repetition. */
+			pd->curActionOrd += retFsm->shiftStartActionOrder( pd->curActionOrd );
+
+			/* Do the repetition on the machine. Already guarded against n == 0 */
+			retFsm->repeatOp( lowerRep );
+			afterOpMinimize( retFsm );
+		}
+		break;
+	}
+	case MaxType: {
+		/* Get an int from the repetition amount. */
+		if ( upperRep == 0 ) {
+			/* No copies. Don't need to evaluate the factorWithRep. 
+			 * This defeats the purpose so give a warning. */
+			warning(loc) << "max zero repetitions results "
+					"in the null machine" << endl;
+
+			retFsm = new FsmGraph();
+			retFsm->lambdaFsm();
+		}
+		else {
+			/* Evaluate the first FactorWithRep. */
+			retFsm = factorWithRep->walk( pd );
+			if ( retFsm->startState->isFinState() ) {
+				warning(loc) << "applying max repetition to a machine that "
+						"accepts zero length word" << endl;
+			}
+
+			/* The start func orders need to be shifted before doing the 
+			 * repetition. */
+			pd->curActionOrd += retFsm->shiftStartActionOrder( pd->curActionOrd );
+
+			/* Do the repetition on the machine. Already guarded against n == 0 */
+			retFsm->optionalRepeatOp( upperRep );
+			afterOpMinimize( retFsm );
+		}
+		break;
+	}
+	case MinType: {
+		/* Evaluate the repeated machine. */
+		retFsm = factorWithRep->walk( pd );
+		if ( retFsm->startState->isFinState() ) {
+			warning(loc) << "applying min repetition to a machine that "
+					"accepts zero length word" << endl;
+		}
+
+		/* The start func orders need to be shifted before doing the repetition
+		 * and the kleene star. */
+		pd->curActionOrd += retFsm->shiftStartActionOrder( pd->curActionOrd );
+	
+		if ( lowerRep == 0 ) {
+			/* Acts just like a star op on the machine to return. */
+			retFsm->starOp( );
+			afterOpMinimize( retFsm );
+		}
+		else {
+			/* Take a duplicate for the plus. */
+			FsmGraph *dup = new FsmGraph( *retFsm );
+
+			/* Do repetition on the first half. */
+			retFsm->repeatOp( lowerRep );
+			afterOpMinimize( retFsm );
+
+			/* Star the duplicate. */
+			dup->starOp( );
+			afterOpMinimize( dup );
+
+			/* Tack on the kleene star. */
+			retFsm->concatOp( dup );
+			afterOpMinimize( retFsm );
+		}
+		break;
+	}
+	case RangeType: {
+		/* Check for bogus range. */
+		if ( upperRep - lowerRep < 0 ) {
+			error(loc) << "invalid range repetition" << endl;
+
+			/* Return null machine as recovery. */
+			retFsm = new FsmGraph();
+			retFsm->lambdaFsm();
+		}
+		else if ( lowerRep == 0 && upperRep == 0 ) {
+			/* No copies. Don't need to evaluate the factorWithRep.  This
+			 * defeats the purpose so give a warning. */
+			warning(loc) << "zero to zero repetitions results "
+					"in the null machine" << endl;
+
+			retFsm = new FsmGraph();
+			retFsm->lambdaFsm();
+		}
+		else {
+			/* Now need to evaluate the repeated machine. */
+			retFsm = factorWithRep->walk( pd );
+			if ( retFsm->startState->isFinState() ) {
+				warning(loc) << "applying range repetition to a machine that "
+						"accepts zero length word" << endl;
+			}
+
+			/* The start func orders need to be shifted before doing both kinds
+			 * of repetition. */
+			pd->curActionOrd += retFsm->shiftStartActionOrder( pd->curActionOrd );
+
+			if ( lowerRep == 0 ) {
+				/* Just doing max repetition. Already guarded against n == 0. */
+				retFsm->optionalRepeatOp( upperRep );
+				afterOpMinimize( retFsm );
+			}
+			else if ( lowerRep == upperRep ) {
+				/* Just doing exact repetition. Already guarded against n == 0. */
+				retFsm->repeatOp( lowerRep );
+				afterOpMinimize( retFsm );
+			}
+			else {
+				/* This is the case that 0 < lowerRep < upperRep. Take a
+				 * duplicate for the optional repeat. */
+				FsmGraph *dup = new FsmGraph( *retFsm );
+
+				/* Do repetition on the first half. */
+				retFsm->repeatOp( lowerRep );
+				afterOpMinimize( retFsm );
+
+				/* Do optional repetition on the second half. */
+				dup->optionalRepeatOp( upperRep - lowerRep );
+				afterOpMinimize( dup );
+
+				/* Tack on the duplicate machine. */
+				retFsm->concatOp( dup );
+				afterOpMinimize( retFsm );
+			}
+		}
+		break;
+	}
+	case FactorWithNegType: {
+		/* Evaluate the Factor. Pass it up. */
+		retFsm = factorWithNeg->walk( pd );
+		break;
+	}}
+	return retFsm;
+}
+
+/* Pass name tree construction down to the child of this node. */
+void FactorWithRep::makeNameTree( ParseData *pd )
+{
+	switch ( type ) {
+	case FactorWithNegType:
+		/* No repetition operator was applied. */
+		factorWithNeg->makeNameTree( pd );
+		break;
+
+	/* Each of the repetition operators wraps a factor with repetition. */
+	case StarType: case StarStarType:
+	case OptionalType: case PlusType:
+	case ExactType: case MaxType:
+	case MinType: case RangeType:
+		factorWithRep->makeNameTree( pd );
+		break;
+	}
+}
+
+/* Pass name reference resolution down to the child of this node. */
+void FactorWithRep::resolveNameRefs( ParseData *pd )
+{
+	switch ( type ) {
+	case FactorWithNegType:
+		/* No repetition operator was applied. */
+		factorWithNeg->resolveNameRefs( pd );
+		break;
+
+	/* Each of the repetition operators wraps a factor with repetition. */
+	case StarType: case StarStarType:
+	case OptionalType: case PlusType:
+	case ExactType: case MaxType:
+	case MinType: case RangeType:
+		factorWithRep->resolveNameRefs( pd );
+		break;
+	}
+}
+
+/* Destroy a factor with negation node along with the one child it holds. */
+FactorWithNeg::~FactorWithNeg()
+{
+	if ( type == FactorType ) {
+		/* Nothing negated, the child is a factor. */
+		delete factor;
+	}
+	else if ( type == NegateType || type == CharNegateType ) {
+		/* Both kinds of negation hold another factor with negation. */
+		delete factorWithNeg;
+	}
+	/* Any other type has no child to free. */
+}
+
+/* Evaluate a factor with negation node. Gives 0 for a type that is not known. */
+FsmGraph *FactorWithNeg::walk( ParseData *pd )
+{
+	if ( type == FactorType ) {
+		/* Nothing is negated. The factor's machine goes up unchanged. */
+		return factor->walk( pd );
+	}
+
+	if ( type == NegateType ) {
+		/* The operand is walked before the dot-star machine is made. */
+		FsmGraph *operand = factorWithNeg->walk( pd );
+
+		/* Negation is subtract from dot-star. */
+		FsmGraph *negated = dotStarFsm( pd );
+		negated->subtractOp( operand );
+		afterOpMinimize( negated );
+		return negated;
+	}
+
+	if ( type == CharNegateType ) {
+		/* The operand is walked before the dot machine is made. */
+		FsmGraph *operand = factorWithNeg->walk( pd );
+
+		/* Character negation is subtract from dot. */
+		FsmGraph *negated = dotFsm( pd );
+		negated->subtractOp( operand );
+		afterOpMinimize( negated );
+		return negated;
+	}
+
+	/* Not a type this node knows about. */
+	return 0;
+}
+
+/* Continue building the name tree in whichever child this node holds. */
+void FactorWithNeg::makeNameTree( ParseData *pd )
+{
+	if ( type == FactorType ) {
+		/* Plain factor, nothing negated. */
+		factor->makeNameTree( pd );
+	}
+	else if ( type == NegateType || type == CharNegateType ) {
+		/* Either form of negation holds another factor with negation. */
+		factorWithNeg->makeNameTree( pd );
+	}
+}
+
+/* Continue resolving name references in whichever child this node holds. */
+void FactorWithNeg::resolveNameRefs( ParseData *pd )
+{
+	if ( type == FactorType ) {
+		/* Plain factor, nothing negated. */
+		factor->resolveNameRefs( pd );
+	}
+	else if ( type == NegateType || type == CharNegateType ) {
+		/* Either form of negation holds another factor with negation. */
+		factorWithNeg->resolveNameRefs( pd );
+	}
+}
+
+/* Destroy a factor node. The type says which child pointer is in use, and
+ * only that child is released. */
+Factor::~Factor()
+{
+	if ( type == LiteralType ) {
+		delete literal;
+	}
+	else if ( type == RangeType ) {
+		delete range;
+	}
+	else if ( type == OrExprType ) {
+		delete reItem;
+	}
+	else if ( type == RegExprType ) {
+		delete regExp;
+	}
+	else if ( type == ParenType ) {
+		delete join;
+	}
+
+	/* Nothing is released for ReferenceType: the varDef used by such a
+	 * factor is not deleted here. */
+}
+
+/* Evaluate a factor node. The machine comes from walking the child that
+ * belongs to the factor's type. */
+FsmGraph *Factor::walk( ParseData *pd )
+{
+	switch ( type ) {
+	case LiteralType:
+		return literal->walk( pd );
+	case RangeType:
+		return range->walk( pd );
+
+	case OrExprType:
+		/* There is no root regular expression to pass down. */
+		return reItem->walk( pd, 0 );
+	case RegExprType:
+		/* Passing 0 makes the expression take itself as the root. */
+		return regExp->walk( pd, 0 );
+
+	case ReferenceType:
+		return varDef->walk( pd );
+	case ParenType:
+		return join->walk( pd );
+	}
+
+	/* A type that is not handled above gives no machine, as does a child
+	 * that returns none. */
+	return 0;
+}
+
+/* Continue building the name tree below this factor. Only two of the factor
+ * types have anything to descend into. */
+void Factor::makeNameTree( ParseData *pd )
+{
+	if ( type == ReferenceType ) {
+		/* The location of this factor is passed along with the call. */
+		varDef->makeNameTree( loc, pd );
+	}
+	else if ( type == ParenType ) {
+		/* Descend into the join. */
+		join->makeNameTree( pd );
+	}
+
+	/* Nothing is done for the other types: LiteralType, RangeType,
+	 * OrExprType and RegExprType. */
+}
+
+/* Continue resolving name references below this factor. Only two of the
+ * factor types have anything to descend into. */
+void Factor::resolveNameRefs( ParseData *pd )
+{
+	if ( type == ReferenceType ) {
+		/* Descend into the definition used by this factor. */
+		varDef->resolveNameRefs( pd );
+	}
+	else if ( type == ParenType ) {
+		/* Descend into the join. */
+		join->resolveNameRefs( pd );
+	}
+
+	/* Nothing is done for the other types: LiteralType, RangeType,
+	 * OrExprType and RegExprType. */
+}
+
+/* Clean up a range object by deleting the lower and upper literals it holds. */
+Range::~Range()
+{
+	delete lowerLit;
+	delete upperLit;
+}
+
+/* Decide whether a machine can serve as one end of a range. It has to be the
+ * machine for exactly one character. */
+bool Range::verifyRangeFsm( FsmGraph *rangeEnd )
+{
+	/* Shape of the machine: two states, a start state that is not final and
+	 * exactly one final state. */
+	bool shapeOk = rangeEnd->stateList.length() == 2 &&
+			!rangeEnd->startState->isFinState() &&
+			rangeEnd->finStateSet.length() == 1;
+	if ( !shapeOk )
+		return false;
+
+	/* Transitions: none leaving the final state and a single one leaving
+	 * the start state. */
+	bool transOk = rangeEnd->finStateSet[0]->outList.length() == 0 &&
+			rangeEnd->startState->outList.length() == 1;
+	if ( !transOk )
+		return false;
+
+	/* The single transition out of the start state must not be a range. */
+	FsmTrans *onlyTrans = rangeEnd->startState->outList.head;
+	return !( onlyTrans->lowKey != onlyTrans->highKey );
+}
+
+/* Evaluate a range: make an fsm range from the lower and upper keys, or the null machine as recovery if an end is bad. */
+FsmGraph *Range::walk( ParseData *pd )
+{
+	/* Construct and verify the suitability of the lower end of the range. */
+	FsmGraph *lowerFsm = lowerLit->walk( pd );
+	bool endsOk = verifyRangeFsm( lowerFsm );
+	if ( !endsOk )
+		error(lowerLit->loc) << "bad range lower end, must be a single character" << endl;
+
+	/* Construct and verify the upper end. */
+	FsmGraph *upperFsm = upperLit->walk( pd );
+	if ( !verifyRangeFsm( upperFsm ) ) {
+		error(upperLit->loc) << "bad range upper end, must be a single character" << endl;
+		endsOk = false;
+	}
+
+	/* Only a verified end is known to have a transition out of its start
+	 * state, so the keys are read only when both ends passed. */
+	FsmGraph *retFsm = new FsmGraph();
+	if ( !endsOk )
+		retFsm->lambdaFsm();
+	else {
+		Key lowKey = lowerFsm->startState->outList.head->lowKey;
+		Key highKey = upperFsm->startState->outList.head->lowKey;
+		if ( lowKey > highKey ) {
+			/* Recover by setting upper to lower. */
+			error(lowerLit->loc) << "lower end of range is greater then upper end" << endl;
+			highKey = lowKey;
+		}
+		retFsm->rangeFsm( lowKey, highKey );
+	}
+	delete lowerFsm;
+	delete upperFsm;
+	return retFsm;
+}
+
+/* Evaluate a literal object. A number becomes a machine made from one key, a
+ * literal string becomes a machine made from the array of its keys. */
+FsmGraph *Literal::walk( ParseData *pd )
+{
+	FsmGraph *litFsm = 0;
+
+	if ( type == Number ) {
+		/* The key is computed first, then the machine is made from
+		 * it. */
+		Key numKey = makeFsmKeyNum( literal.data, loc, pd );
+		litFsm = new FsmGraph();
+		litFsm->concatFsm( numKey );
+	}
+	else if ( type == LitString ) {
+		/* prepareLitString is handed the text buffer and the case flag
+		 * to fill in from the literal. */
+		String text;
+		bool ignoreCase;
+		prepareLitString( text, ignoreCase, literal, loc );
+
+		/* Make the array of keys from the prepared text. */
+		Key *keys = new Key[text.length()];
+		makeFsmKeyArray( keys, text.data, text.length(), pd );
+
+		/* Make the new machine, in the case insensitive form if asked. */
+		litFsm = new FsmGraph();
+		if ( ignoreCase )
+			litFsm->concatFsmCI( keys, text.length() );
+		else
+			litFsm->concatFsm( keys, text.length() );
+		delete[] keys;
+	}
+	return litFsm;
+}
+
+/* Destroy a regular expression node. */
+RegExpr::~RegExpr()
+{
+	/* An Empty node holds nothing to free. The same goes for any type
+	 * other than RecurseItem. */
+	if ( type != RecurseItem )
+		return;
+
+	/* A RecurseItem node frees the nested expression, then its own item. */
+	delete regExp;
+	delete item;
+}
+
+/* Evaluate a regular expression object. Nested empty expressions yield 0 so
+ * the parent skips them; an empty root yields the lambda machine. */
+FsmGraph *RegExpr::walk( ParseData *pd, RegExpr *rootRegex )
+{
+	/* This is the root regex, pass down a pointer to this. */
+	bool isRoot = rootRegex == 0;
+	if ( isRoot )
+		rootRegex = this;
+
+	FsmGraph *rtnVal = 0;
+	if ( type == RecurseItem ) {
+		/* Walk both items. */
+		FsmGraph *fsm1 = regExp->walk( pd, rootRegex );
+		FsmGraph *fsm2 = item->walk( pd, rootRegex );
+		if ( fsm1 == 0 )
+			rtnVal = fsm2;
+		else {
+			fsm1->concatOp( fsm2 );
+			rtnVal = fsm1;
+		}
+	}
+	else if ( isRoot ) {
+		/* Empty root. The result is passed up by Factor::walk and used as
+		 * a machine, so never hand back a null pointer. */
+		rtnVal = new FsmGraph();
+		rtnVal->lambdaFsm();
+	}
+	return rtnVal;
+}
+
+/* Destroy an item of a regular expression. Only the two or block types
+ * have anything to free. */
+ReItem::~ReItem()
+{
+	/* Both the plain and the negated or block items hold an or block
+	 * through the same member. */
+	const bool holdsOrBlock = type == OrBlock || type == NegOrBlock;
+
+	/* Data and Dot items delete nothing, nor does any type that is not
+	 * listed above. */
+	if ( holdsOrBlock )
+		delete orBlock;
+}
+
+/* Evaluate an item of a regular expression. An empty or block walks to 0, which is handled here rather than dereferenced. */
+FsmGraph *ReItem::walk( ParseData *pd, RegExpr *rootRegex )
+{
+	FsmGraph *rtnVal = 0;
+	switch ( type ) {
+		case Data: {
+			/* Move the data into an integer array and make a concat fsm. */
+			Key *arr = new Key[data.length()];
+			makeFsmKeyArray( arr, data.data, data.length(), pd );
+			rtnVal = new FsmGraph();
+			if ( rootRegex != 0 && rootRegex->caseInsensitive )
+				rtnVal->concatFsmCI( arr, data.length() );
+			else
+				rtnVal->concatFsm( arr, data.length() );
+			delete[] arr;
+			break;
+		}
+		case Dot: {
+			/* Make the dot fsm. */
+			rtnVal = dotFsm( pd );
+			break;
+		}
+		case OrBlock: {
+			/* Get the or block and minimize it. An empty block gives no machine, use lambda in its place. */
+			rtnVal = orBlock->walk( pd, rootRegex );
+			if ( rtnVal == 0 ) {
+				rtnVal = new FsmGraph();
+				rtnVal->lambdaFsm();
+			}
+			rtnVal->minimizePartition2();
+			break;
+		}
+		case NegOrBlock: {
+			/* Get the or block and minimize it, if it is not empty. */
+			FsmGraph *fsm = orBlock->walk( pd, rootRegex );
+			if ( fsm != 0 )
+				fsm->minimizePartition2();
+			/* Make a dot fsm and subtract from it. An empty block leaves nothing to subtract. */
+			rtnVal = dotFsm( pd );
+			if ( fsm != 0 )
+				rtnVal->subtractOp( fsm );
+			rtnVal->minimizePartition2();
+			break;
+		}
+	}
+
+	/* If the item is followed by a star, then apply the star op. */
+	if ( star ) {
+		if ( rtnVal->startState->isFinState() ) {
+			warning(loc) << "applying kleene star to a machine that "
+					"accepts zero length word" << endl;
+		}
+		rtnVal->starOp();
+		rtnVal->minimizePartition2();
+	}
+	return rtnVal;
+}
+
+/* Destroy an or block node of a regular expression. */
+ReOrBlock::~ReOrBlock()
+{
+	/* An Empty node holds nothing to free. The same goes for any type
+	 * other than RecurseItem. */
+	if ( type != RecurseItem )
+		return;
+
+	/* A RecurseItem node frees the nested or block, then its own item. */
+	delete orBlock;
+	delete item;
+}
+
+
+/* Evaluate an or block of a regular expression. Gives the union of the
+ * machines of the items in the block, or 0 when there are none. */
+FsmGraph *ReOrBlock::walk( ParseData *pd, RegExpr *rootRegex )
+{
+	/* An Empty node ends the recursion with no machine. Any type other
+	 * than RecurseItem comes to the same thing. */
+	if ( type != RecurseItem )
+		return 0;
+
+	/* Evaluate the nested or block first, then the item of this node. */
+	FsmGraph *blockFsm = orBlock->walk( pd, rootRegex );
+	FsmGraph *itemFsm = item->walk( pd, rootRegex );
+
+	/* With no machine from the nested block the item stands alone.
+	 * Otherwise the item is folded into the nested block's machine. */
+	FsmGraph *unionFsm = itemFsm;
+	if ( blockFsm != 0 ) {
+		blockFsm->unionOp( itemFsm );
+		unionFsm = blockFsm;
+	}
+
+	/* Either the item's machine or the union. */
+	return unionFsm;
+}
+
+/* Evaluate an or block item of a regular expression: either a set of characters or a character range. */
+FsmGraph *ReOrItem::walk( ParseData *pd, RegExpr *rootRegex )
+{
+	/* The return value. Stays 0 for a type that is neither Data nor Range. */
+	FsmGraph *rtnVal = 0;
+	switch ( type ) {
+	case Data: {
+		/* Make the or machine. */
+		rtnVal = new FsmGraph();
+
+		/* Put the or data into an array of ints. Note that we find unique
+		 * keys. Duplicates are silently ignored. The alternative would be to
+		 * issue warning or an error but since we can't with [a0-9a] or 'a' |
+		 * 'a' don't bother here. */
+		KeySet keySet;
+		makeFsmUniqueKeyArray( keySet, data.data, data.length(), 
+			rootRegex != 0 ? rootRegex->caseInsensitive : false, pd );
+
+		/* Run the or operator. */
+		rtnVal->orFsm( keySet.data, keySet.length() );
+		break;
+	}
+	case Range: {
+		/* Make the upper and lower keys. */
+		Key lowKey = makeFsmKeyChar( lower, pd );
+		Key highKey = makeFsmKeyChar( upper, pd );
+
+		/* Validate the range. */
+		if ( lowKey > highKey ) {
+			/* Recover by setting upper to lower; */
+			error(loc) << "lower end of range is greater then upper end" << endl;
+			highKey = lowKey;
+		}
+
+		/* Make the range machine. */
+		rtnVal = new FsmGraph();
+		rtnVal->rangeFsm( lowKey, highKey );
+		/* A range such as Z-b overlaps both letter cases, so the two tests below are independent, not either/or. */
+		if ( rootRegex != 0 && rootRegex->caseInsensitive ) {
+			if ( lowKey <= 'Z' && 'A' <= highKey ) {
+				Key otherLow = lowKey < 'A' ? Key('A') : lowKey;
+				Key otherHigh = 'Z' < highKey ? Key('Z') : highKey;
+
+				otherLow = 'a' + ( otherLow - 'A' );
+				otherHigh = 'a' + ( otherHigh - 'A' );
+
+				FsmGraph *otherRange = new FsmGraph();
+				otherRange->rangeFsm( otherLow, otherHigh );
+				rtnVal->unionOp( otherRange );
+				rtnVal->minimizePartition2();
+			}
+			if ( lowKey <= 'z' && 'a' <= highKey ) {
+				Key otherLow = lowKey < 'a' ? Key('a') : lowKey;
+				Key otherHigh = 'z' < highKey ? Key('z') : highKey;
+
+				otherLow = 'A' + ( otherLow - 'a' );
+				otherHigh = 'A' + ( otherHigh - 'a' );
+
+				FsmGraph *otherRange = new FsmGraph();
+				otherRange->rangeFsm( otherLow, otherHigh );
+				rtnVal->unionOp( otherRange );
+				rtnVal->minimizePartition2();
+			}
+		}
+
+		break;
+	}}
+	return rtnVal;
+}
diff --git a/colm/parsetree.h b/colm/parsetree.h
new file mode 100644
index 00000000..aceefea1
--- /dev/null
+++ b/colm/parsetree.h
@@ -0,0 +1,1605 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _PARSETREE_H
+#define _PARSETREE_H
+
+#include <iostream>
+#include <string.h>
+#include "colm.h"
+#include "avlmap.h"
+#include "bstmap.h"
+#include "bstset.h"
+#include "vector.h"
+#include "dlist.h"
+#include "astring.h"
+#include "bytecode.h"
+#include "avlbasic.h"
+
+/* Operators that are represented with single symbol characters. */
+#define OP_DoubleEql 'e'
+#define OP_NotEql 'q'
+#define OP_LessEql 'l'
+#define OP_GrtrEql 'g'
+#define OP_LogicalAnd 'a'
+#define OP_LogicalOr 'o'
+#define OP_Deref 'd'
+
+struct NameInst;
+struct FsmGraph;
+struct RedFsm;
+struct FsmTables;
+struct FsmRun;
+struct ObjectDef;
+struct ElementOf;
+struct UniqueType;
+struct ObjField;
+struct TransBlock;
+struct CodeBlock;
+
+/* Builtin machines. Expression::builtin holds one when its type is BuiltinType. */
+enum BuiltinMachine
+{
+	BT_Any,
+	BT_Ascii,
+	BT_Extend,
+	BT_Alpha,
+	BT_Digit,
+	BT_Alnum,
+	BT_Lower,
+	BT_Upper,
+	BT_Cntrl,
+	BT_Graph,
+	BT_Print,
+	BT_Punct,
+	BT_Space,
+	BT_Xdigit,
+	BT_Lambda,
+	BT_Empty
+};
+
+typedef BstSet<char> CharSet;
+
+
+struct ParseData;
+struct TypeRef;
+
+/* Leaf type. */
+struct Literal;
+
+/* Tree nodes. */
+
+struct Term;
+struct FactorWithAug;
+struct FactorWithRep;
+struct FactorWithNeg;
+struct Factor;
+struct Expression;
+struct Join;
+struct JoinOrLm;
+struct TokenRegion;
+struct Namespace;
+struct TokenDef;
+struct TokenDefList;
+struct Range;
+struct KlangEl;
+
+/* Type of augmentation. Describes locations in the machine. */
+enum AugType
+{
+	/* Transition actions/priorities. */
+	at_start,
+	at_all,
+	at_finish,
+	at_leave,
+
+	/* Global error actions. */
+	at_start_gbl_error,
+	at_all_gbl_error,
+	at_final_gbl_error,
+	at_not_start_gbl_error,
+	at_not_final_gbl_error,
+	at_middle_gbl_error,
+
+	/* Local error actions. */
+	at_start_local_error,
+	at_all_local_error,
+	at_final_local_error,
+	at_not_start_local_error,
+	at_not_final_local_error,
+	at_middle_local_error,
+	
+	/* To State Action embedding. */
+	at_start_to_state,
+	at_all_to_state,
+	at_final_to_state,
+	at_not_start_to_state,
+	at_not_final_to_state,
+	at_middle_to_state,
+
+	/* From State Action embedding. */
+	at_start_from_state,
+	at_all_from_state,
+	at_final_from_state,
+	at_not_start_from_state,
+	at_not_final_from_state,
+	at_middle_from_state,
+
+	/* EOF Action embedding. */
+	at_start_eof,
+	at_all_eof,
+	at_final_eof,
+	at_not_start_eof,
+	at_not_final_eof,
+	at_middle_eof
+};
+
+/* IMPORTANT: These must follow the same order as the state augs in AugType
+ * (start, all, final, not_start, not_final, middle) since they compose AugType. */
+enum StateAugType
+{
+	sat_start = 0,
+	sat_all,
+	sat_final,
+	sat_not_start,
+	sat_not_final,
+	sat_middle
+};
+
+struct Action;
+struct PriorDesc;
+struct RegExpr;
+struct ReItem;
+struct ReOrBlock;
+struct ReOrItem;
+struct ExplicitMachine;
+struct InlineItem;
+struct InlineList;
+
+/* Reference to a named state. */
+typedef Vector<String> NameRef;
+typedef Vector<NameRef*> NameRefList;
+typedef Vector<NameInst*> NameTargList;
+
+/* Structure for storing the location and target name of an epsilon transition. */
+struct EpsilonLink
+{
+	EpsilonLink( const InputLoc &loc, NameRef &target )
+		: loc(loc), target(target) { }
+
+	InputLoc loc;
+	NameRef target;
+};
+
+struct Label
+{
+	Label( const InputLoc &loc, const String &data, ObjField *objField )
+		: loc(loc), data(data), objField(objField) { }
+
+	InputLoc loc;
+	String data;
+	ObjField *objField;
+};
+
+/* Structure represents an action assigned to some FactorWithAug node. The
+ * factor with aug will keep an array of these. */
+struct ParserAction
+{
+	ParserAction( const InputLoc &loc, AugType type, int localErrKey, Action *action )
+		: loc(loc), type(type), localErrKey(localErrKey), action(action) { }
+
+	InputLoc loc;
+	AugType type;
+	int localErrKey;
+	Action *action;
+};
+
+struct Token
+{
+	String data;
+	InputLoc loc;
+};
+
+void prepareLitString( String &result, bool &caseInsensitive, 
+		const String &srcString, const InputLoc &loc );
+
+std::ostream &operator<<(std::ostream &out, const Token &token );
+
+typedef AvlMap< String, KlangEl*, CmpStr > LiteralDict;
+typedef AvlMapEl< String, KlangEl* > LiteralDictEl;
+
+/* Store the value and type of a priority augmentation. */
+struct PriorityAug
+{
+	PriorityAug( AugType type, int priorKey, int priorValue ) :
+		type(type), priorKey(priorKey), priorValue(priorValue) { }
+
+	AugType type;
+	int priorKey;
+	int priorValue;
+};
+
+/*
+ * A Variable Definition
+ */
+struct VarDef
+{
+	VarDef( const String &name, JoinOrLm *joinOrLm )
+		: name(name), joinOrLm(joinOrLm) { }
+	
+	/* Parse tree traversal. */
+	FsmGraph *walk( ParseData *pd );
+	void makeNameTree( const InputLoc &loc, ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	String name;
+	JoinOrLm *joinOrLm;
+};
+
+typedef Vector<String> StringVect;
+typedef CmpTable<String, CmpStr> CmpStrVect;
+
+struct NamespaceQual
+{
+	NamespaceQual( Namespace *declInNspace, TokenRegion *declInRegion ) : 
+		cachedNspaceQual(0), declInNspace(declInNspace) {}
+	/* NOTE: declInRegion is accepted but not stored; only declInNspace is kept. */
+	Namespace *cachedNspaceQual;
+	Namespace *declInNspace;
+
+	StringVect qualNames;
+
+	Namespace *searchFrom( Namespace *from, StringVect::Iter &qualPart );
+	Namespace *getQual( ParseData *pd );
+};
+
+struct TokenDef
+{
+	TokenDef( Join *join, KlangEl *token, InputLoc &semiLoc, 
+		int longestMatchId, Namespace *nspace, TokenRegion *tokenRegion ) : 
+		join(join), action(0), token(token), semiLoc(semiLoc), 
+		setActId(0), actOnLast(0), actOnNext(0), actLagBehind(0),
+		longestMatchId(longestMatchId), inLmSelect(false), 
+		nspace(nspace), tokenRegion(tokenRegion), prev(0), next(0) {}
+
+	InputLoc getLoc();
+	/* Set from the constructor arguments (action starts out null). */
+	Join *join;
+	Action *action;
+	KlangEl *token;
+	InputLoc semiLoc;
+	/* Not supplied at construction; these action pointers start out null. */
+	Action *setActId;
+	Action *actOnLast;
+	Action *actOnNext;
+	Action *actLagBehind;
+	int longestMatchId;
+	bool inLmSelect;
+	Namespace *nspace;
+	TokenRegion *tokenRegion;
+	/* List links; null until the element is placed in a list. */
+	TokenDef *prev, *next;
+};
+
+/* Declare a new type so that ptreetypes.h need not include dlist.h. */
+struct TokenDefList : DList<TokenDef> {};
+
+/* Symbol Map. */
+typedef AvlMap< String, KlangEl*, CmpStr > SymbolMap;
+typedef AvlMapEl< String, KlangEl* > SymbolMapEl;
+
+typedef Vector<TokenRegion*> RegionVect;
+
+struct TokenRegion
+{
+	/* Construct an empty region; lmActSelect and the list links start out null. */
+	TokenRegion( const InputLoc &loc, const String &name, int id, 
+			TokenRegion *parentRegion ) : 
+		loc(loc), name(name), id(id), lmActSelect(0),
+		lmSwitchHandlesError(false), regionNameInst(0),
+		parentRegion(parentRegion), defaultTokenDef(0),
+		next(0), prev(0), preEofBlock(0) { }
+
+	/* Tree traversal. */
+	FsmGraph *walk( ParseData *pd );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+	void runLongestMatch( ParseData *pd, FsmGraph *graph );
+	void transferScannerLeavingActions( FsmGraph *graph );
+	Action *newAction( ParseData *pd, const InputLoc &loc, const String &name, 
+			InlineList *inlineList );
+	void makeActions( ParseData *pd );
+	void findName( ParseData *pd );
+	void restart( FsmGraph *graph, FsmTrans *trans );
+
+	InputLoc loc;
+	TokenDefList tokenDefList;
+	String name;
+	int id;
+
+	Action *lmActSelect;
+	bool lmSwitchHandlesError;
+
+	/* This gets saved off during the name walk. Can save it off because token
+	 * regions are referenced once only. */
+	NameInst *regionNameInst;
+
+	TokenRegion *parentRegion;
+	RegionVect childRegions;
+
+	TokenDef *defaultTokenDef;
+
+	TokenRegion *next, *prev;
+
+	CodeBlock *preEofBlock;
+};
+
+typedef DList<TokenRegion> RegionList;
+typedef BstSet< TokenRegion*, CmpOrd<TokenRegion*> > RegionSet;
+
+typedef Vector<Namespace*> NamespaceVect;
+
+struct GenericType 
+	: public DListEl<GenericType>
+{
+	GenericType( const String &name, long typeId, long id, 
+			KlangEl *langEl, TypeRef *typeArg )
+	:
+		name(name), typeId(typeId), id(id), langEl(langEl),
+		typeArg(typeArg), keyTypeArg(0), 
+		utArg(0), keyUT(0),
+		objDef(0)
+	{}
+
+	const String &getKey() const 
+		{ return name; };
+
+	String name;
+	long typeId;
+	long id;
+	KlangEl *langEl;
+	TypeRef *typeArg;
+	TypeRef *keyTypeArg;
+	UniqueType *utArg;
+	UniqueType *keyUT;
+
+	ObjectDef *objDef;
+};
+
+typedef DList<GenericType> GenericList;
+
+struct UserIter;
+typedef AvlMap<String, UserIter*, CmpStr> UserIterMap;
+typedef AvlMapEl<String, UserIter*> UserIterMapEl;
+
+/* Graph dictionary. */
+struct GraphDictEl 
+:
+	public AvlTreeEl<GraphDictEl>,
+	public DListEl<GraphDictEl>
+{
+	GraphDictEl( const String &key ) 
+		: key(key), value(0), isInstance(false) { }
+	GraphDictEl( const String &key, VarDef *value ) 
+		: key(key), value(value), isInstance(false) { }
+
+	const String &getKey() { return key; }
+
+	String key;
+	VarDef *value;
+	bool isInstance;
+
+	/* Location info of graph definition. Points to variable name of assignment. */
+	InputLoc loc;
+};
+
+typedef AvlTree<GraphDictEl, String, CmpStr> GraphDict;
+typedef DList<GraphDictEl> GraphList;
+
+struct Namespace
+{
+	/* Construct an empty namespace with the given name, id and parent. */
+	Namespace( const InputLoc &loc, const String &name, int id, 
+			Namespace *parentNamespace ) : 
+		loc(loc), name(name), id(id),
+		parentNamespace(parentNamespace) { }
+
+	/* Tree traversal. */
+	Namespace *findNamespace( const String &name );
+
+	InputLoc loc;
+	String name;
+	int id;
+
+	/* Literal patterns and the dictionary mapping literals to the underlying
+	 * tokens. */
+	LiteralDict literalDict;
+
+	/* Dictionary of symbols within the namespace. */
+	SymbolMap symbolMap;
+	GenericList genericList;
+
+	/* Dictionary of graphs. Both instances and non-instances go here. */
+	GraphDict graphDict;
+
+	Namespace *parentNamespace;
+	NamespaceVect childNamespaces;
+
+	Namespace *next, *prev;
+};
+
+typedef DList<Namespace> NamespaceList;
+typedef BstSet< Namespace*, CmpOrd<Namespace*> > NamespaceSet;
+
+/* List of Expressions. */
+typedef DList<Expression> ExprList;
+
+struct JoinOrLm
+{
+	enum Type {
+		JoinType,
+		LongestMatchType
+	};
+	/* Holds either a join or a token region; the pointer not given is null. */
+	JoinOrLm( Join *join ) : 
+		join(join), tokenRegion(0), type(JoinType) {}
+	JoinOrLm( TokenRegion *tokenRegion ) :
+		join(0), tokenRegion(tokenRegion), type(LongestMatchType) {}
+
+	FsmGraph *walk( ParseData *pd );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+	
+	Join *join;
+	TokenRegion *tokenRegion;
+	Type type;
+};
+
+/*
+ * Join
+ */
+struct Join
+{
+	/* Construct with the first expression. */
+	Join( Expression *expr );
+	Join( const InputLoc &loc, Expression *expr );
+
+	/* Tree traversal. */
+	FsmGraph *walk( ParseData *pd );
+	FsmGraph *walkJoin( ParseData *pd );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	/* Data. */
+	InputLoc loc;
+	ExprList exprList;
+};
+
+/*
+ * Expression
+ */
+struct Expression
+{
+	enum Type { 
+		OrType,
+		IntersectType, 
+		SubtractType, 
+		StrongSubtractType,
+		TermType, 
+		BuiltinType
+	};
+
+	/* Construct with an expression on the left and a term on the right.
+	 * No builtin is given, so the member gets a fixed placeholder (BT_Any). */
+	Expression( Expression *expression, Term *term, Type type ) : 
+		expression(expression), term(term), 
+		builtin(BT_Any), type(type), prev(this), next(this) { }
+	/* Construct with only a term; builtin again gets the BT_Any placeholder. */
+	Expression( Term *term ) : 
+		expression(0), term(term), builtin(BT_Any), 
+		type(TermType) , prev(this), next(this) { }
+	
+	/* Construct with a builtin type. */
+	Expression( BuiltinMachine builtin ) : 
+		expression(0), term(0), builtin(builtin), 
+		type(BuiltinType), prev(this), next(this) { }
+
+	~Expression();
+
+	/* Tree traversal. */
+	FsmGraph *walk( ParseData *pd, bool lastInSeq = true );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	/* Node data. */
+	Expression *expression;
+	Term *term;
+	BuiltinMachine builtin;
+	Type type;
+
+	Expression *prev, *next;
+};
+
+/*
+ * Term
+ */
+struct Term 
+{
+	enum Type { 
+		ConcatType, 
+		RightStartType,
+		RightFinishType,
+		LeftType,
+		FactorWithAugType
+	};
+
+	Term( Term *term, FactorWithAug *factorWithAug ) :
+		term(term), factorWithAug(factorWithAug), type(ConcatType) { }
+
+	Term( Term *term, FactorWithAug *factorWithAug, Type type ) :
+		term(term), factorWithAug(factorWithAug), type(type) { }
+
+	Term( FactorWithAug *factorWithAug ) :
+		term(0), factorWithAug(factorWithAug), type(FactorWithAugType) { }
+	
+	~Term();
+
+	FsmGraph *walk( ParseData *pd, bool lastInSeq = true );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	Term *term;
+	FactorWithAug *factorWithAug;
+	Type type;
+
+	/* Priority descriptor for RightFinish type. */
+	PriorDesc priorDescs[2];
+};
+
+
+/* Third level of precedence. Augmenting nodes with actions and priorities. */
+struct FactorWithAug
+{
+	FactorWithAug( FactorWithRep *factorWithRep ) :
+		priorDescs(0), factorWithRep(factorWithRep) { }
+	~FactorWithAug();
+
+	/* Tree traversal. */
+	FsmGraph *walk( ParseData *pd );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	void assignActions( ParseData *pd, FsmGraph *graph, int *actionOrd );
+	void assignPriorities( FsmGraph *graph, int *priorOrd );
+
+	void assignConditions( FsmGraph *graph );
+
+	/* Actions and priorities assigned to the factor node. */
+	Vector<ParserAction> actions;
+	Vector<PriorityAug> priorityAugs;
+	PriorDesc *priorDescs;
+	Vector<Label> labels;
+	Vector<EpsilonLink> epsilonLinks;
+	Vector<ParserAction> conditions;
+
+	FactorWithRep *factorWithRep;
+};
+
+/* Fourth level of precedence. Trailing unary operators. Provide Kleene star,
+ * optional and plus. */
+struct FactorWithRep
+{
+	enum Type { 
+		StarType,
+		StarStarType,
+		OptionalType,
+		PlusType, 
+		ExactType,
+		MaxType,
+		MinType,
+		RangeType,
+		FactorWithNegType
+	};
+
+	FactorWithRep( const InputLoc &loc, FactorWithRep *factorWithRep, 
+			int lowerRep, int upperRep, Type type ) :
+		loc(loc), factorWithRep(factorWithRep), factorWithNeg(0),
+		lowerRep(lowerRep), upperRep(upperRep), type(type) { }
+	
+	FactorWithRep( const InputLoc &loc, FactorWithNeg *factorWithNeg )
+		: loc(loc), factorWithRep(0), factorWithNeg(factorWithNeg),
+		lowerRep(0), upperRep(0), type(FactorWithNegType) { }
+
+	~FactorWithRep();
+
+	/* Tree traversal. */
+	FsmGraph *walk( ParseData *pd );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	InputLoc loc;
+	FactorWithRep *factorWithRep;
+	FactorWithNeg *factorWithNeg;
+	int lowerRep, upperRep;
+	Type type;
+
+	/* Priority descriptor for StarStar type. */
+	PriorDesc priorDescs[2];
+};
+
+/* Fifth level of precedence. Provides Negation. */
+struct FactorWithNeg
+{
+	enum Type { 
+		NegateType, 
+		CharNegateType,
+		FactorType
+	};
+
+	FactorWithNeg( const InputLoc &loc, FactorWithNeg *factorWithNeg, Type type) :
+		loc(loc), factorWithNeg(factorWithNeg), factor(0), type(type) { }
+
+	FactorWithNeg( const InputLoc &loc, Factor *factor ) :
+		loc(loc), factorWithNeg(0), factor(factor), type(FactorType) { }
+
+	~FactorWithNeg();
+
+	/* Tree traversal. */
+	FsmGraph *walk( ParseData *pd );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	InputLoc loc;
+	FactorWithNeg *factorWithNeg;
+	Factor *factor;
+	Type type;
+};
+
+/*
+ * Factor
+ */
+struct Factor
+{
+	/* Language elements a factor node can be. */
+	enum Type {
+		LiteralType, 
+		RangeType, 
+		OrExprType,
+		RegExprType, 
+		ReferenceType,
+		ParenType
+	}; 
+
+	/* Construct with a literal fsm. Unused pointers are nulled in every constructor. */
+	Factor( Literal *literal ) : literal(literal), range(0), reItem(0),
+		regExp(0), varDef(0), join(0), lower(0), upper(0), type(LiteralType) { }
+
+	/* Construct with a range. */
+	Factor( Range *range ) : literal(0), range(range), reItem(0),
+		regExp(0), varDef(0), join(0), lower(0), upper(0), type(RangeType) { }
+	
+	/* Construct with the or part of a regular expression. */
+	Factor( ReItem *reItem ) : literal(0), range(0), reItem(reItem),
+		regExp(0), varDef(0), join(0), lower(0), upper(0), type(OrExprType) { }
+
+	/* Construct with a regular expression. */
+	Factor( RegExpr *regExp ) : literal(0), range(0), reItem(0),
+		regExp(regExp), varDef(0), join(0), lower(0), upper(0), type(RegExprType) { }
+
+	/* Construct with a reference to a var def. */
+	Factor( const InputLoc &loc, VarDef *varDef ) : loc(loc), literal(0), range(0), 
+		reItem(0), regExp(0), varDef(varDef), join(0), lower(0), upper(0), type(ReferenceType) {}
+
+	/* Construct with a parenthesized join. */
+	Factor( Join *join ) : literal(0), range(0), reItem(0),
+		regExp(0), varDef(0), join(join), lower(0), upper(0), type(ParenType) {}
+	
+	/* Cleanup. */
+	~Factor();
+
+	/* Tree traversal. */
+	FsmGraph *walk( ParseData *pd );
+	void makeNameTree( ParseData *pd );
+	void resolveNameRefs( ParseData *pd );
+
+	InputLoc loc;
+	Literal *literal;
+	Range *range;
+	ReItem *reItem;
+	RegExpr *regExp;
+	VarDef *varDef;
+	Join *join;
+	int lower, upper;
+	Type type;
+};
+
+/* A range machine. Only ever composed of two literals. */
+struct Range
+{
+	Range( Literal *lowerLit, Literal *upperLit ) 
+		: lowerLit(lowerLit), upperLit(upperLit) { }
+
+	~Range();
+	FsmGraph *walk( ParseData *pd );
+	bool verifyRangeFsm( FsmGraph *rangeEnd );
+
+	Literal *lowerLit;
+	Literal *upperLit;
+};
+
+/* Some literal machine. Can be a number or literal string. */
+struct Literal
+{
+	enum LiteralType { Number, LitString };
+
+	Literal( const InputLoc &loc, const String &literal, LiteralType type )
+		: loc(loc), literal(literal), type(type) { }
+
+	FsmGraph *walk( ParseData *pd );
+	
+	InputLoc loc;
+	String literal;
+	LiteralType type;
+};
+
+/* Regular expression. */
+struct RegExpr
+{
+	enum RegExpType { RecurseItem, Empty };
+
+	/* Constructors. The empty form has no sub-expression or item, so both are null. */
+	RegExpr() : 
+		regExp(0), item(0), type(Empty), caseInsensitive(false) { }
+	RegExpr(RegExpr *regExp, ReItem *item) : 
+		regExp(regExp), item(item), 
+		type(RecurseItem), caseInsensitive(false) { }
+
+	~RegExpr();
+	FsmGraph *walk( ParseData *pd, RegExpr *rootRegex );
+
+	RegExpr *regExp;
+	ReItem *item;
+	RegExpType type;
+	bool caseInsensitive;
+};
+
+/* An item in a regular expression. */
+struct ReItem
+{
+	enum ReItemType { Data, Dot, OrBlock, NegOrBlock };
+	/* orBlock is null unless the or-block constructor supplies one. */
+	ReItem( const InputLoc &loc, const String &data ) 
+		: loc(loc), data(data), orBlock(0), star(false), type(Data) { }
+	ReItem( const InputLoc &loc, ReItemType type )
+		: loc(loc), orBlock(0), star(false), type(type) { }
+	ReItem( const InputLoc &loc, ReOrBlock *orBlock, ReItemType type )
+		: loc(loc), orBlock(orBlock), star(false), type(type) { }
+
+	~ReItem();
+	FsmGraph *walk( ParseData *pd, RegExpr *rootRegex );
+
+	InputLoc loc;
+	String data;
+	ReOrBlock *orBlock;
+	bool star;
+	ReItemType type;
+};
+
+/* An or block item. */
+struct ReOrBlock
+{
+	enum ReOrBlockType { RecurseItem, Empty };
+
+	/* Constructors. The empty form has no nested block or item, so both are null. */
+	ReOrBlock()
+		: orBlock(0), item(0), type(Empty) { }
+	ReOrBlock(ReOrBlock *orBlock, ReOrItem *item)
+		: orBlock(orBlock), item(item), type(RecurseItem) { }
+
+	~ReOrBlock();
+	FsmGraph *walk( ParseData *pd, RegExpr *rootRegex );
+	
+	ReOrBlock *orBlock;
+	ReOrItem *item;
+	ReOrBlockType type;
+};
+
+/* An item in an or block. */
+struct ReOrItem
+{
+	enum ReOrItemType { Data, Range };
+	/* A Data item carries no range, so lower and upper are zeroed. */
+	ReOrItem( const InputLoc &loc, const String &data ) 
+		: loc(loc), data(data), lower(0), upper(0), type(Data) {}
+	ReOrItem( const InputLoc &loc, char lower, char upper )
+		: loc(loc), lower(lower), upper(upper), type(Range) { }
+
+	FsmGraph *walk( ParseData *pd, RegExpr *rootRegex );
+
+	InputLoc loc;
+	String data;
+	char lower;
+	char upper;
+	ReOrItemType type;
+};
+
+
+/*
+ * Inline code tree
+ */
+struct InlineList;
+struct InlineItem
+{
+	enum Type 
+	{
+		Text, 
+		LmSwitch, 
+		LmSetActId, 
+		LmSetTokEnd, 
+		LmOnLast, 
+		LmOnNext,
+		LmOnLagBehind, 
+		LmInitAct, 
+		LmInitTokStart, 
+		LmSetTokStart 
+	};
+
+	/* Each constructor nulls the pointer members it is not given. */
+	InlineItem( const InputLoc &loc, const String &data, Type type ) : 
+		loc(loc), data(data), nameRef(0), nameTarg(0), children(0),
+		tokenRegion(0), longestMatchPart(0), type(type) { }
+	InlineItem( const InputLoc &loc, NameRef *nameRef, Type type ) : 
+		loc(loc), nameRef(nameRef), nameTarg(0), children(0),
+		tokenRegion(0), longestMatchPart(0), type(type) { }
+	InlineItem( const InputLoc &loc, TokenRegion *tokenRegion, 
+		TokenDef *longestMatchPart, Type type ) : loc(loc),
+		nameRef(0), nameTarg(0), children(0), tokenRegion(tokenRegion),
+		longestMatchPart(longestMatchPart), type(type) { } 
+	InlineItem( const InputLoc &loc, NameInst *nameTarg, Type type ) : 
+		loc(loc), nameRef(0), nameTarg(nameTarg), children(0),
+		tokenRegion(0), longestMatchPart(0), type(type) { }
+	InlineItem( const InputLoc &loc, Type type ) : 
+		loc(loc), nameRef(0), nameTarg(0), children(0),
+		tokenRegion(0), longestMatchPart(0), type(type) { }
+	
+	InputLoc loc;
+	String data;
+	NameRef *nameRef;
+	NameInst *nameTarg;
+	InlineList *children;
+	TokenRegion *tokenRegion;
+	TokenDef *longestMatchPart;
+	Type type;
+
+	InlineItem *prev, *next;
+};
+
+/* Normally this would be a typedef, but that would entail including DList from
+ * ptreetypes, which should be just typedef forwards. */
+struct InlineList : public DList<InlineItem> { };
+
+struct PdaFactor;
+struct LangVarRef;
+struct ObjField;
+
+struct PatternItem
+{
+	enum Type { 
+		FactorType,
+		InputText
+	};
+
+	PatternItem( const String &data, Type type ) : 
+			factor(0), data(data), type(type), region(0), 
+			varRef(0), bindId(0) {}
+
+	PatternItem( PdaFactor *factor, Type type ) : 
+			factor(factor), type(type), region(0), 
+			varRef(0), bindId(0) {}
+
+	PdaFactor *factor;
+	String data;
+	Type type;
+	TokenRegion *region;
+	LangVarRef *varRef;
+	long bindId;
+
+	PatternItem *prev, *next;
+};
+
+typedef DList<PatternItem> PatternItemList;
+
+struct ReplItem
+{
+	enum Type { 
+		InputText, 
+		VarRefType,
+		FactorType
+	};
+	/* Pointers a constructor does not receive (and langEl always) start out null. */
+	ReplItem( Type type, const String &data ) : 
+		type(type), data(data), varRef(0), langEl(0), factor(0), bindId(0) {}
+
+	ReplItem( Type type, LangVarRef *varRef ) : 
+		type(type), varRef(varRef), langEl(0), factor(0), bindId(0) {}
+
+	ReplItem( Type type, PdaFactor *factor ) : 
+		type(type), varRef(0), langEl(0), factor(factor), bindId(0) {}
+
+	Type type;
+	String data;
+	LangVarRef *varRef;
+	KlangEl *langEl;
+	PdaFactor *factor;
+	long bindId;
+
+	ReplItem *prev, *next;
+};
+
+typedef DList<ReplItem> ReplItemList;
+
+struct PdaRun;
+
+struct Pattern
+{
+	Pattern( const InputLoc &loc, Namespace *nspace, TokenRegion *region, 
+			PatternItemList *list, int patRepId ) : 
+		loc(loc), nspace(nspace), region(region), list(list), patRepId(patRepId), 
+		langEl(0), pdaRun(0), nextBindId(1) {}
+	
+	InputLoc loc;
+	Namespace *nspace;
+	TokenRegion *region;
+	PatternItemList *list;
+	long patRepId;
+	KlangEl *langEl;
+	PdaRun *pdaRun;
+	long nextBindId;
+
+	Pattern *prev, *next;
+};
+
+typedef DList<Pattern> PatternList;
+
+struct Replacement
+{
+	Replacement( Namespace *nspace, TokenRegion *region, 
+			ReplItemList *list, int patRepId ) :
+		nspace(nspace), region(region), list(list), patRepId(patRepId), langEl(0),
+		pdaRun(0), nextBindId(1) {}
+
+	Namespace *nspace;
+	TokenRegion *region;
+	ReplItemList *list;
+	int patRepId;
+	KlangEl *langEl;
+	PdaRun *pdaRun;
+	long nextBindId;
+
+	Replacement *prev, *next;
+};
+
+typedef DList<Replacement> ReplList;
+
+struct UserIter;
+struct Function;
+
+struct IterDef
+{
+	enum Type { Tree, Child, RevChild, User };
+
+	IterDef( Type type, Function *func );
+	IterDef( Type type );
+
+	Type type;
+
+	Function *func;
+	bool useFuncId;
+	bool useSearchUT;
+
+	Code inCreate;
+	Code inDestroy;
+	Code inAdvance;
+
+	Code inGetCurR;
+	Code inGetCurWC;
+	Code inSetCurWC;
+
+	Code inRefFromCur;
+};
+
+struct CmpIterDef
+{
+	/* Three-way ordering of iterator definitions: by type first and, when
+	 * both are User iterators, additionally by their func pointer.
+	 * Yields -1, 0 or 1. */
+	static int compare( const IterDef &id1, const IterDef &id2 )
+	{
+		/* Differing types decide the order on their own. */
+		if ( id1.type != id2.type )
+			return id1.type < id2.type ? -1 : 1;
+
+		/* Only User iterators are told apart by their function. */
+		if ( id1.type == IterDef::User && id1.func != id2.func )
+			return id1.func < id2.func ? -1 : 1;
+
+		return 0;
+	}
+};
+
+typedef AvlSet<IterDef, CmpIterDef> IterDefSet;
+typedef AvlSetEl<IterDef> IterDefSetEl;
+
+
+/*
+ * Language features.
+ */
+
+struct UniqueType : public AvlTreeEl<UniqueType>
+{
+	UniqueType( int typeId ) :
+		typeId(typeId), 
+		langEl(0), 
+		iterDef(0) {}
+
+	UniqueType( int typeId, KlangEl *langEl ) :
+		typeId(typeId),
+		langEl(langEl),
+		iterDef(0) {}
+	/* Iterator form: no language element is given, so langEl is null. */
+	UniqueType( int typeId, IterDef *iterDef ) :
+		typeId(typeId),
+		langEl(0),
+		iterDef(iterDef) {}
+
+	int typeId;
+	KlangEl *langEl;
+	IterDef *iterDef;
+};
+
+struct CmpUniqueType
+{
+	static int compare( const UniqueType &ut1, const UniqueType &ut2 );
+};
+
+
+typedef AvlBasic< UniqueType, CmpUniqueType > UniqueTypeMap;
+
+typedef AvlMap< StringVect, int, CmpStrVect > VectorTypeIdMap;
+typedef AvlMapEl< StringVect, int > VectorTypeIdMapEl;
+
+typedef Vector<TypeRef*> TypeRefVect;
+
+struct TypeRef
+{
+	/* Qualification and a type name. These require lookup. */
+	TypeRef( const InputLoc &loc, NamespaceQual *nspaceQual, String typeName ) :
+		loc(loc), nspaceQual(nspaceQual), typeName(typeName), iterDef(0),
+		searchTypeRef(0), factor(0),
+		isPtr(false), isRef(false), isRepeat(false), isOpt(false),
+		uniqueType(0) {}
+
+	/* Iterator definition. No qualification is given, so nspaceQual is null. */
+	TypeRef( const InputLoc &loc, IterDef *iterDef, TypeRef *searchTypeRef ) :
+		loc(loc), nspaceQual(0), iterDef(iterDef), searchTypeRef(searchTypeRef),
+		factor(0), isPtr(false), isRef(false), isRepeat(false), isOpt(false),
+		uniqueType(0) {}
+
+	/* Unique type is given directly. */
+	TypeRef( const InputLoc &loc, UniqueType *uniqueType ) :
+		loc(loc), nspaceQual(0), iterDef(0), searchTypeRef(0), factor(0),
+		isPtr(false), isRef(false), isRepeat(false), isOpt(false), 
+		uniqueType(uniqueType) {}
+
+	/* A factor in a pattern. In the case of matches we need a type ref at
+	 * parse time, but factors have not been resolved yet, so this allows us
+	 * to do it on demand. */
+	TypeRef( const InputLoc &loc, PdaFactor *factor ) :
+		loc(loc), nspaceQual(0), iterDef(0), searchTypeRef(0), factor(factor),
+		isPtr(false), isRef(false), isRepeat(false), isOpt(false), 
+		uniqueType(0) {}
+
+
+	UniqueType *lookupType( ParseData *pd );
+
+	InputLoc loc;
+	NamespaceQual *nspaceQual;
+	String typeName;
+	IterDef *iterDef;
+	TypeRef *searchTypeRef;
+	PdaFactor *factor;
+	bool isPtr;
+	bool isRef;
+	bool isRepeat;
+	bool isOpt;
+
+private:
+	UniqueType *lookupTypePart( ParseData *pd, NamespaceQual *nspaceQual, 
+			const String &name );
+	UniqueType *uniqueType;
+};
+
+typedef DList<ObjField> ParameterList; 
+
+struct ObjMethod
+{
+	ObjMethod( UniqueType *returnUT, String name, 
+			int opcodeWC, int opcodeWV, int numParams, 
+			UniqueType **types, ParameterList *paramList, bool isConst )
+		: 
+			returnUT(returnUT), returnTypeId(0), name(name), 
+			opcodeWC(opcodeWC), opcodeWV(opcodeWV), 
+			numParams(numParams), paramUTs(0), paramList(paramList), 
+			isConst(isConst), funcId(0), useFuncId(false), 
+			useCallObj(true), func(0), iterDef(0)
+	{
+		/* Keep a private copy of types; skip memcpy when there is nothing to copy. */
+		this->paramUTs = new UniqueType*[numParams];
+		if ( numParams > 0 )
+			memcpy( this->paramUTs, types, sizeof(UniqueType*)*numParams );
+	}
+
+	UniqueType *returnUT;
+	long returnTypeId;
+	String name;
+	long opcodeWC;
+	long opcodeWV;
+	long numParams;
+	UniqueType **paramUTs;
+	ParameterList *paramList;
+	bool isConst;
+	long funcId;
+	bool useFuncId;
+	bool useCallObj;
+	Function *func;
+	IterDef *iterDef;
+};
+
+typedef AvlMap<String, ObjMethod*, CmpStr> ObjMethodMap;
+typedef AvlMapEl<String, ObjMethod*> ObjMethodMapEl;
+
+struct ObjField
+{
+	ObjField( const InputLoc &loc, TypeRef *typeRef, const String &name ) : 
+		loc(loc), typeRef(typeRef), name(name), pos(0), offset(0),
+		beenReferenced(false),
+		beenInitialized(false),
+		useOffset(true),
+		isConst(false), 
+		isLhsEl(false), isRhsEl(false), 
+		refActive(false),
+		inGetR( IN_HALT ),
+		inGetWC( IN_HALT ),
+		inGetWV( IN_HALT ),
+		inSetWC( IN_HALT ),
+		inSetWV( IN_HALT )
+		{}
+	
+	InputLoc loc;
+	TypeRef *typeRef;
+	String name;
+	long pos;
+	long offset;
+	bool beenReferenced;
+	bool beenInitialized;
+	bool useOffset;
+	bool isConst;
+	bool isLhsEl;
+	bool isRhsEl;
+	bool refActive;
+
+	Code inGetR;
+	Code inGetWC;
+	Code inGetWV;
+	Code inSetWC;
+	Code inSetWV;
+
+	ObjField *prev, *next;
+};
+
+typedef AvlMap<String, ObjField*, CmpStr> ObjFieldMap;
+typedef AvlMapEl<String, ObjField*> ObjFieldMapEl;
+
+typedef DList<ObjField> ParameterList; 
+
+struct TemplateType;
+
+struct ObjectDef
+{
+	enum Type {
+		UserType,
+		FrameType,
+		IterType,
+		BuiltinType
+	};
+
+	ObjectDef( Type type, String name, 
+			ObjFieldMap *objFieldMap, ObjMethodMap *objMethodMap, int id ) :
+		type(type), name(name), objFieldMap(objFieldMap), 
+		objMethodMap(objMethodMap), id(id), nextOffset(0),
+		firstNonTree(0), prev(0), next(0) {}
+
+	Type type;
+	String name;
+	ObjFieldMap *objFieldMap;	
+	ObjMethodMap *objMethodMap;	
+
+	long id;
+	long nextOffset;
+	long firstNonTree;
+
+	void referenceField( ParseData *pd, ObjField *field );
+	void initField( ParseData *pd, ObjField *field );
+	void createCode( ParseData *pd, CodeVect &code );
+	ObjMethod *findMethod( String name );
+	ObjField *findField( String name );
+	/* Both sizes read counters that start at zero in the constructor. */
+	long size() { return nextOffset; }
+	long sizeTrees() { return firstNonTree; }
+
+	ObjectDef *prev, *next;
+};
+
+struct LangExpr;
+typedef Vector<LangExpr*> ExprVect;
+typedef Vector<String> StringVect;
+
+struct FieldInit
+{
+	FieldInit( const InputLoc &loc, String name, LangExpr *expr )
+		: loc(loc), name(name), expr(expr), exprUT(0) {}
+
+	InputLoc loc;
+	String name;
+	LangExpr *expr;
+	/* Not supplied at construction; starts out null. */
+	UniqueType *exprUT;
+};
+
+typedef Vector<FieldInit*> FieldInitVect;
+
+struct VarRefLookup
+{
+	VarRefLookup( int lastPtrInQual, int firstConstPart, ObjectDef *inObject ) :
+		lastPtrInQual(lastPtrInQual), 
+		firstConstPart(firstConstPart),
+		inObject(inObject),
+		objField(0), 
+		objMethod(0), 
+		uniqueType(0),
+		iterSearchUT(0)
+	{}
+
+	int lastPtrInQual;
+	int firstConstPart;
+	ObjectDef *inObject;
+	ObjField *objField;
+	ObjMethod *objMethod;
+	UniqueType *uniqueType;
+	UniqueType *iterSearchUT;
+};
+
+struct QualItem
+{
+	enum Type { Dot, Arrow };
+
+	QualItem( const InputLoc &loc, const String &data, Type type )
+		: loc(loc), data(data), type(type) {}
+
+	InputLoc loc;
+	String data;
+	Type type;
+};
+
+typedef Vector<QualItem> QualItemVect;
+/* A variable reference: a name, a pointer to its vector of QualItems and a source location. */
+struct LangVarRef
+{
+	LangVarRef( const InputLoc &loc, QualItemVect *qual, String name )
+		: loc(loc), qual(qual), name(name) {}
+	/* Everything below is declared only; the definitions are not in this part of the file. */
+	UniqueType *loadFieldInstr( ParseData *pd, CodeVect &code, ObjectDef *inObject,
+			ObjField *el, bool forWriting, bool revert );
+	void setFieldInstr( ParseData *pd, CodeVect &code, ObjectDef *inObject, 
+			ObjField *el, UniqueType *exprUT, bool revert );
+
+	VarRefLookup lookupMethod( ParseData *pd );
+	VarRefLookup lookupField( ParseData *pd );
+
+	VarRefLookup lookupQualification( ParseData *pd, ObjectDef *rootDef ) const;
+	VarRefLookup lookupObj( ParseData *pd );
+
+	bool isLocalRef( ParseData *pd );
+	void loadQualification( ParseData *pd, CodeVect &code, ObjectDef *rootObj, 
+			int lastPtrInQual, bool forWriting, bool revert );
+	void loadLocalObj( ParseData *pd, CodeVect &code, 
+			int lastPtrInQual, bool forWriting );
+	void loadGlobalObj( ParseData *pd, CodeVect &code, 
+			int lastPtrInQual, bool forWriting );
+	void loadObj( ParseData *pd, CodeVect &code, int lastPtrInQual, bool forWriting );
+
+	void setFieldIter( ParseData *pd, CodeVect &code, 
+			ObjectDef *inObject, UniqueType *objUT, UniqueType *exprType, bool revert );
+	void setFieldSearch( ParseData *pd, CodeVect &code, 
+			ObjectDef *inObject, UniqueType *exprType );
+	void setField( ParseData *pd, CodeVect &code, 
+			ObjectDef *inObject, UniqueType *type, bool revert );
+
+	void assignValue( ParseData *pd, CodeVect &code, UniqueType *exprUT );
+	ObjField **evaluateArgs( ParseData *pd, CodeVect &code, 
+			VarRefLookup &lookup, ExprVect *args );
+	void callOperation( ParseData *pd, CodeVect &code, VarRefLookup &lookup );
+	UniqueType *evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args );
+	UniqueType *evaluate( ParseData *pd, CodeVect &code, bool forWriting = false );
+	ObjField *evaluateRef( ParseData *pd, CodeVect &code );
+	void resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs );
+	/* qual is stored exactly as passed in (the vector is not copied); name is held by value. */
+	InputLoc loc;
+	QualItemVect *qual;
+	String name;
+};
+/* A term in the language tree, tagged by Type; each constructor fills in a different subset of members. */
+struct LangTerm
+{
+	enum Type {
+		VarRefType,
+		MethodCallType,
+		NumberType,
+		StringType,
+		MatchType,
+		NewType,
+		ConstructType,
+		TypeIdType,
+		SearchType,
+		NilType,
+		TrueType,
+		FalseType,
+		ParseType,
+		ParseStopType,
+		MakeTreeType,
+		MakeTokenType
+	};
+	/* NOTE(review): a constructor sets only the members it names; the other pointers are left uninitialized. */
+	LangTerm( Type type, LangVarRef *varRef )
+		: type(type), varRef(varRef) {}
+
+	LangTerm( LangVarRef *varRef, ExprVect *args )
+		: type(MethodCallType), varRef(varRef), args(args) {} /* always tagged as a method call */
+
+	LangTerm( const InputLoc &loc, Type type, ExprVect *args )
+		: loc(loc), type(type), args(args) {}
+
+	LangTerm( Type type, String data )
+		: type(type), varRef(0), data(data) {}
+
+	LangTerm( Type type, NamespaceQual *nspaceQual, const String &data )
+		: type(type), varRef(0), nspaceQual(nspaceQual), data(data) {}
+
+	LangTerm( const InputLoc &loc, Type type )
+		: loc(loc), type(type), varRef(0), typeRef(0) {}
+
+	LangTerm( const InputLoc &loc, Type type, TypeRef *typeRef )
+		: loc(loc), type(type), varRef(0), typeRef(typeRef) {}
+
+	LangTerm( const InputLoc &loc, Type type, LangVarRef *varRef )
+		: loc(loc), type(type), varRef(varRef) {}
+
+	LangTerm( Type type, LangVarRef *varRef, Pattern *pattern )
+		: type(type), varRef(varRef), pattern(pattern) {}
+
+	LangTerm( const InputLoc &loc, Type type, TypeRef *typeRef, LangVarRef *varRef )
+		: loc(loc), type(type), varRef(varRef), typeRef(typeRef) {}
+
+	LangTerm( const InputLoc &loc, Type type, TypeRef *typeRef, FieldInitVect *fieldInitArgs, 
+			Replacement *replacement )
+		: loc(loc), type(type), typeRef(typeRef), fieldInitArgs(fieldInitArgs), 
+		replacement(replacement) {}
+
+	LangTerm( Type type, LangExpr *expr )
+		: type(type), expr(expr) {}
+	/* Declarations only; the bodies are not in this part of the file. */
+	UniqueType *evaluateParse( ParseData *pd, CodeVect &code, bool stop );
+	UniqueType *evaluateNew( ParseData *pd, CodeVect &code );
+	UniqueType *evaluateConstruct( ParseData *pd, CodeVect &code );
+	UniqueType *evaluateTreeConstruct( ParseData *pd, CodeVect &code );
+	UniqueType *evaluateTermConstruct( ParseData *pd, CodeVect &code );
+	bool constructTermFromString( ParseData *pd );
+	UniqueType *evaluateMatch( ParseData *pd, CodeVect &code );
+	UniqueType *evaluate( ParseData *pd, CodeVect &code );
+	void assignFieldArgs( ParseData *pd, CodeVect &code, UniqueType *replUT );
+	UniqueType *evaluateMakeToken( ParseData *pd, CodeVect &code );
+	UniqueType *evaluateMakeTree( ParseData *pd, CodeVect &code );
+
+	InputLoc loc;
+	Type type;
+	LangVarRef *varRef;
+	ExprVect *args;
+	NamespaceQual *nspaceQual;
+	String data;
+	TypeRef *typeRef;
+	Pattern *pattern;
+	FieldInitVect *fieldInitArgs;
+	Replacement *replacement;
+	LangExpr *expr;
+};
+
+/* A node of an expression tree: a binary operation, a unary operation or
+ * a leaf wrapping a LangTerm. Every constructor initializes all members,
+ * so the ones a given kind does not use read as null/zero. */
+struct LangExpr
+{
+	enum Type { BinaryType, UnaryType, TermType };
+
+	LangExpr( const InputLoc &loc, LangExpr *left, char op, LangExpr *right )
+		: loc(loc), type(BinaryType), left(left), op(op), right(right), term(0) {}
+
+	LangExpr( const InputLoc &loc, char op, LangExpr *right )
+		: loc(loc), type(UnaryType), left(0), op(op), right(right), term(0) {}
+
+	/* Leaf node: no location is supplied, so loc is value-initialized. */
+	LangExpr( LangTerm *term )
+		: loc(), type(TermType), left(0), op(0), right(0), term(term) {}
+
+	UniqueType *evaluate( ParseData *pd, CodeVect &code );
+
+	InputLoc loc;
+	Type type;
+	LangExpr *left;
+	char op;
+	LangExpr *right;
+	LangTerm *term;
+};
+
+struct LangStmt;
+typedef DList<LangStmt> StmtList;
+/* One statement, tagged by Type; each constructor fills in the members that its statement form carries. */
+struct LangStmt
+{
+	enum Type {
+		AssignType,
+		PrintType,
+		PrintXMLType,
+		ExprType,
+		IfType,
+		RejectType,
+		WhileType,
+		ReturnType,
+		YieldType,
+		ForIterType,
+		BreakType
+	};
+	/* NOTE(review): every constructor sets next(0); members it does not name, and prev, stay uninitialized. */
+	LangStmt( const InputLoc &loc, Type type, FieldInitVect *fieldInitVect ) : 
+		loc(loc), type(type), varRef(0), expr(0), fieldInitVect(fieldInitVect), next(0) {}
+
+	LangStmt( const InputLoc &loc, Type type, ExprVect *exprPtrVect ) : 
+		loc(loc), type(type), varRef(0), expr(0), exprPtrVect(exprPtrVect), next(0) {}
+	
+	LangStmt( const InputLoc &loc, Type type, LangExpr *expr ) : 
+		loc(loc), type(type), varRef(0), expr(expr), exprPtrVect(0), next(0) {}
+
+	LangStmt( Type type, LangVarRef *varRef ) : 
+		type(type), varRef(varRef), expr(0), exprPtrVect(0), next(0) {}
+
+	LangStmt( const InputLoc &loc, Type type, ObjField *objField ) :
+		loc(loc), type(type), varRef(0), objField(objField), expr(0), 
+		exprPtrVect(0), next(0) {}
+	
+	LangStmt( const InputLoc &loc, Type type, LangVarRef *varRef, LangExpr *expr ) : 
+		loc(loc), type(type), varRef(varRef), expr(expr), exprPtrVect(0), next(0) {}
+	
+	LangStmt( Type type, LangExpr *expr, StmtList *stmtList ) : 
+		type(type), expr(expr), stmtList(stmtList), next(0) {}
+
+	LangStmt( Type type, LangExpr *expr, StmtList *stmtList, StmtList *elsePart ) : 
+		type(type), expr(expr), stmtList(stmtList), elsePart(elsePart), next(0) {}
+
+	LangStmt( const InputLoc &loc, Type type ) : 
+		loc(loc), type(type), next(0) {}
+
+	LangStmt( Type type, LangVarRef *varRef, Replacement *replacement ) : 
+		type(type), varRef(varRef), expr(0), replacement(replacement), 
+		exprPtrVect(0), next(0) {}
+
+	LangStmt( const InputLoc &loc, Type type, const String &varName, 
+			TypeRef *typeRef, LangTerm *langTerm, StmtList *stmtList ) : 
+		loc(loc), type(type), langTerm(langTerm), typeRef(typeRef), 
+		stmtList(stmtList), name(varName), next(0) {}
+
+	LangStmt( Type type ) : 
+		type(type), next(0) {}
+	/* Declarations only; the bodies are not in this part of the file. */
+	LangTerm *chooseDefaultIter( ParseData *pd );
+	void compileWhile( ParseData *pd, CodeVect &code );
+	void unscopeIterVariable( ParseData *pd, ObjField *iterObjField );
+	ObjField *createIterVariable( ParseData *pd, TypeRef *iterTypeRef );
+	void compileForIterBody( ParseData *pd, CodeVect &code, 
+			ObjField *iterObjField, LangVarRef *iterVarRef, UniqueType *iterUT );
+	void compileForIter( ParseData *pd, CodeVect &code );
+	void compile( ParseData *pd, CodeVect &code );
+
+	InputLoc loc;
+	Type type;
+	LangVarRef *varRef;
+	LangTerm *langTerm;
+	ObjField *objField;
+	TypeRef *typeRef;
+	LangExpr *expr;
+	Replacement *replacement;
+	ExprVect *exprPtrVect;
+	FieldInitVect *fieldInitVect;
+	StmtList *stmtList;
+	StmtList *elsePart;
+	String name;
+
+	/* Normally you don't need to initialize double list pointers, however, we
+	 * make use of the next pointer for returning a pair of statements using
+	 * one pointer to a LangStmt, so we need to initialize it above. */
+	LangStmt *prev, *next;
+};
+/* A statement list together with its localFrame, code vector, frameId and the `trees` set. */
+struct CodeBlock
+{
+	CodeBlock( StmtList *stmtList ) 
+		: stmtList(stmtList), localFrame(0), frameId(-1) {} /* no frame yet; frameId starts at -1 */
+
+	void compile( ParseData *pd, CodeVect &code ); /* declared only; defined outside this part of the file */
+
+	StmtList *stmtList;
+	ObjectDef *localFrame;
+	CodeVect code;
+	long frameId;
+	CharSet trees;
+};
+
+/* Record for one function: its type reference, name, parameter list, code
+ * block and id. Pointers that are not supplied to the constructor start out
+ * null instead of holding indeterminate values. */
+struct Function
+{
+	Function( TypeRef *typeRef, const String &name, ParameterList *paramList,
+			CodeBlock *codeBlock, int funcId, bool isUserIter )
+	:
+		transBlock(0), typeRef(typeRef), name(name),
+		paramList(paramList), codeBlock(codeBlock), localFrame(0),
+		funcId(funcId), isUserIter(isUserIter),
+		paramListSize(0), paramUTs(0)
+	{}
+
+	TransBlock *transBlock;
+	TypeRef *typeRef;
+	String name;
+	ParameterList *paramList;
+	CodeBlock *codeBlock;
+	ObjectDef *localFrame;
+	long funcId;
+	bool isUserIter;
+	long paramListSize;
+	UniqueType **paramUTs;
+
+	/* Links for the doubly linked FunctionList declared below; they are
+	 * not set by the constructor. */
+	Function *prev, *next;
+};
+
+typedef DList<Function> FunctionList;
+
+#endif /* _PARSETREE_H */
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
new file mode 100644
index 00000000..7d01deca
--- /dev/null
+++ b/colm/pdabuild.cpp
@@ -0,0 +1,1698 @@
+/*
+ *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <iomanip>
+#include <errno.h>
+#include <stdlib.h>
+
+/* Parsing. */
+#include "colm.h"
+#include "parsedata.h"
+#include "pdacodegen.h"
+#include "pdarun.h"
+#include "redfsm.h"
+#include "fsmcodegen.h"
+#include "redbuild.h"
+#include "fsmrun.h"
+
+/* Dumping the fsm. */
+#include "mergesort.h"
+
+using namespace std;
+
+char startDefName[] = "start"; /* mutable global array holding the text "start" */
+
+/* Count the transitions in the fsm: walk the state list from its head
+ * and add up the number of entries in each state's transition map. */
+int countTransitions( PdaGraph *fsm )
+{
+	int total = 0;
+	for ( PdaState *st = fsm->stateList.head; st != 0; st = st->next ) {
+		total += st->transMap.length();
+	}
+
+	return total;
+}
+/* Create a language element in nspace; lit starts out equal to name and the other listed members get fixed defaults. */
+KlangEl::KlangEl( Namespace *nspace, const String &name, Type type )
+:
+	nspace(nspace),
+	name(name),
+	lit(name), /* same text as the name */
+	type(type),
+	id(-1), /* negative until ParseData::makeKlangElIds assigns a real id */
+	isUserTerm(false),
+	isContext(false),
+	displayString(0),
+	numAppearances(0),
+	commit(false),
+	ignore(false),
+	reduceFirst(false),
+	isLiteral(false),
+	isRepeat(false),
+	isOpt(false),
+	parseStop(false),
+	tokenDef(0),
+	rootDef(0),
+	termDup(0), /* linked up in ParseData::makeKlangElIds when a terminal duplicate is made */
+	pdaGraph(0),
+	pdaTables(0),
+	transBlock(0),
+	objectDef(0),
+	thisSize(0),
+	ofiOffset(0),
+	generic(0),
+	parserId(-1)
+{
+}
+ 
+PdaGraph *ProdElList::walk( ParseData *pd )
+{
+	/* The machine is a plain chain: one shift transition per production
+	 * element, keyed on that element's language element id. */
+	PdaGraph *graph = new PdaGraph();
+	PdaState *tail = graph->addState();
+	graph->setStartState( tail );
+
+	int pos = 0;
+	for ( Iter el = first(); el.lte(); el++, pos++ ) {
+		long key = el->langEl->id;
+		/* Extend the chain by one state, joined to the tail by a shift. */
+		PdaState *fresh = graph->addState();
+		PdaTrans *shift = graph->appendNewTrans( tail, fresh, key, key );
+		shift->isShift = true;
+		shift->shiftPrior = el->priorVal;
+
+		if ( el->commit ) {
+			/* Tag every transition leaving the tail with a commit at
+			 * this element's position in the production. */
+			TransMap::Iter out = tail->transMap;
+			while ( out.lte() ) {
+				out->value->commits.insert( pos );
+				out++;
+			}
+		}
+
+		tail = fresh;
+	}
+
+	/* The end of the chain becomes a final state. */
+	graph->setFinState( tail );
+	return graph;
+}
+
+
+KlangEl *getKlangEl( ParseData *pd, Namespace *nspace,
+		const String &data, KlangEl::Type defType )
+{
+	/* An element already registered under this name wins; defType is then unused. */
+	SymbolMapEl *entry = nspace->symbolMap.find( data );
+	if ( entry != 0 )
+		return entry->value;
+
+	/* Otherwise create one, register it in the namespace and list it in pd. */
+	KlangEl *created = new KlangEl( nspace, data, defType );
+	entry = nspace->symbolMap.insert( created->name, created );
+	pd->langEls.append( created );
+	return entry->value;
+}
+
+ProdElList *makeProdElList( KlangEl *langEl )
+{
+	ProdElList *single = new ProdElList();
+	single->append( new PdaFactor( InputLoc(), langEl ) );
+	single->tail->langEl = langEl; /* tail is the factor appended just above */
+	return single;
+}
+
+void ParseData::makeDefinitionNames()
+{
+	/* Name each definition "<element name>-<n>", n counting from 1 per element. */
+	for ( LelList::Iter el = langEls; el.lte(); el++ ) {
+		int ordinal = 0;
+		for ( LelDefList::Iter d = el->defList; d.lte(); d++ ) {
+			d->data.setAs( el->name.length() + 32, "%s-%i", el->name.data, ++ordinal );
+		}
+	}
+}
+
+/* Report every language element still of unknown type. This happens when an
+ * id appears on the rhs of a definition but is never defined as anything. */
+void ParseData::noUndefindKlangEls()
+{
+	for ( LelList::Iter el = langEls; el.lte(); el++ ) {
+		if ( el->type != KlangEl::Unknown )
+			continue;
+		error() << "'" << el->name << "' was not defined as anything" << endp;
+	}
+}
+
+void ParseData::makeKlangElIds()
+{
+	/* Creates the built-in language elements, adds a terminal duplicate for
+	 * each nonterminal, then numbers every element: user terminals first,
+	 * then eof, then error (if there is one), then everything else. */
+
+	/* Make the "stream" language element */
+	streamKlangEl = new KlangEl( rootNamespace, "stream", KlangEl::Term );
+	langEls.prepend( streamKlangEl );
+	SymbolMapEl *streamMapEl = rootNamespace->symbolMap.insert( streamKlangEl->name, streamKlangEl );
+	assert( streamMapEl != 0 );
+
+	/* Make the "str" language element */
+	strKlangEl = new KlangEl( rootNamespace, "str", KlangEl::Term );
+	langEls.prepend( strKlangEl );
+	SymbolMapEl *stringMapEl = rootNamespace->symbolMap.insert( strKlangEl->name, strKlangEl );
+	assert( stringMapEl != 0 );
+
+	/* Make the "int" language element */
+	intKlangEl = new KlangEl( rootNamespace, "int", KlangEl::Term );
+	langEls.prepend( intKlangEl );
+	SymbolMapEl *integerMapEl = rootNamespace->symbolMap.insert( intKlangEl->name, intKlangEl );
+	assert( integerMapEl != 0 );
+
+	/* Make the "bool" language element */
+	boolKlangEl = new KlangEl( rootNamespace, "bool", KlangEl::Term );
+	langEls.prepend( boolKlangEl );
+	SymbolMapEl *boolMapEl = rootNamespace->symbolMap.insert( boolKlangEl->name, boolKlangEl );
+	assert( boolMapEl != 0 );
+
+	/* Make the "ptr" language element */
+	ptrKlangEl = new KlangEl( rootNamespace, "ptr", KlangEl::Term );
+	langEls.prepend( ptrKlangEl );
+	SymbolMapEl *ptrMapEl = rootNamespace->symbolMap.insert( ptrKlangEl->name, ptrKlangEl );
+	assert( ptrMapEl != 0 );
+
+	/* Make the EOF language element. */
+	eofKlangEl = new KlangEl( rootNamespace, "_eof", KlangEl::Term );
+	langEls.prepend( eofKlangEl );
+	SymbolMapEl *eofMapEl = rootNamespace->symbolMap.insert( eofKlangEl->name, eofKlangEl );
+	assert( eofMapEl != 0 );
+
+	/* Make the "any" language element */
+	anyKlangEl = new KlangEl( rootNamespace, "any", KlangEl::NonTerm );
+	langEls.prepend( anyKlangEl );
+	SymbolMapEl *anyMapEl = rootNamespace->symbolMap.insert( anyKlangEl->name, anyKlangEl );
+	assert( anyMapEl != 0 );
+
+	/* Make a translate token language element. */
+
+	/* Make terminal language elements corresponding to each nonterminal in
+	 * the grammar. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->type == KlangEl::NonTerm ) {
+			String name( lel->name.length() + 5, "_T_%s", lel->name.data );
+			KlangEl *termDup = new KlangEl( lel->nspace, name, KlangEl::Term );
+
+			/* Give the dup the attributes of the nonterminal. This ensures
+			 * that the attributes are allocated when patterns and
+			 * constructors are parsed. */
+			termDup->objectDef = lel->objectDef;
+
+			langEls.append( termDup );
+			lel->termDup = termDup;
+			termDup->termDup = lel;
+		}
+	}
+
+	/* The first id 0 is reserved for the stack sentinel. A negative id means
+	 * error to the parsing function, inducing backtracking. */
+	nextSymbolId = 1;
+
+	/* First pass assigns to the user terminals. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		/* Must be a term, and not any of the special reserved terminals.
+		 * Remember that the terminal is a user terminal. */
+		if ( lel->type == KlangEl::Term && lel != eofKlangEl && lel != errorKlangEl ) {
+			lel->isUserTerm = true;
+			lel->id = nextSymbolId++;
+		}
+	}
+
+	/* Next assign to the eof token, which we always create. */
+	eofKlangEl->id = nextSymbolId++;
+
+	/* Sanity check: no terminal should still be without an id at this point. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->id < 0 ) {
+			/* The first pass already covered every terminal except eof and
+			 * error, so reaching the body of this test is a bug. */
+			if ( lel->type == KlangEl::Term && lel != eofKlangEl && lel != errorKlangEl ) {
+				assert( false );
+				lel->isUserTerm = true;
+				lel->id = nextSymbolId++;
+			}
+		}
+	}
+
+	/* Possibly assign to the error language element. */
+	if ( errorKlangEl != 0 )
+		errorKlangEl->id = nextSymbolId++;
+
+	/* Save this for the code generation. */
+	firstNonTermId = nextSymbolId;
+
+	/* A third and final pass assigns to everything else. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		/* Anything else not yet assigned gets assigned now. */
+		if ( lel->id < 0 )
+			lel->id = nextSymbolId++;
+	}
+
+	/* The built-in types must have received the ids fixed by the LEL_ID_* constants. */
+	assert( ptrKlangEl->id == LEL_ID_PTR );
+	assert( boolKlangEl->id == LEL_ID_BOOL );
+	assert( intKlangEl->id == LEL_ID_INT );
+	assert( strKlangEl->id == LEL_ID_STR );
+	assert( streamKlangEl->id == LEL_ID_STREAM );
+}
+
+void ParseData::makeKlangElNames()
+{
+	/* Compute the namespace-qualified forms of every element's name and
+	 * literal. Enclosing namespace names are prefixed innermost first,
+	 * joined with "_" for fullName and with "::" for fullLit. */
+
+	for ( LelList::Iter el = langEls; el.lte(); el++ ) {
+		/* Start from the unqualified forms. */
+		el->fullName = el->name;
+		el->fullLit = el->lit;
+
+		Namespace *ns = el->nspace;
+		for ( ; ns != 0; ns = ns->parentNamespace ) {
+			/* The default and root namespaces, and anything above them,
+			 * contribute nothing. */
+			if ( ns == defaultNamespace || ns == rootNamespace )
+				break;
+
+			el->fullName = ns->name + "_" + el->fullName;
+			el->fullLit = ns->name + "::" + el->fullLit;
+		}
+	}
+}
+
+/* Build the per-production FSMs, then set up dot item ranges, state dot sets, pending commits and prodIdIndex. */
+void ParseData::makeProdFsms()
+{
+	/* There are two items in the index for each production (high and low). */
+	int indexLen = prodList.length() * 2;
+	dotItemIndex.setAsNew( indexLen );
+	int dsiLow = 0, indexPos = 0; /* first dot item index / index slot of the current production */
+
+	/* Build FSMs for all production language elements. */
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ )
+		prod->fsm = prod->prodElList->walk( this );
+
+	makeNonTermFirstSets();
+	makeFirstSets();
+
+	/* Second pass over the productions: lengths, dot item ranges and commits. */
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		if ( addUniqueEmptyProductions ) {
+			/* This must be re-implemented. */
+			assert( false );
+			//if ( !prod->isLeftRec && prod->uniqueEmptyLeader != 0 ) {
+			//	PdaGraph *emptyLeader = prod->uniqueEmptyLeader->walk( this );
+			//	emptyLeader->concatOp( prod->fsm );
+			//	prod->fsm = emptyLeader;
+			//}
+		}
+
+		/* Compute the machine's length. */
+		prod->fsmLength = prod->fsm->fsmLength( );
+
+		/* Productions have a unique production id for each final state.
+		 * This lets us use a production length specific to each final state.
+		 * Start states are always isolated therefore if the start state is
+		 * final then reductions from it will always have a fixed production
+		 * length. This is a simple method for determining the length
+		 * of zero-length derivations when reducing. */
+
+		/* Number of dot items needed for the production is elements + 1
+		 * because the dot can be before the first and after the last element. */
+		int numForProd = prod->fsm->stateList.length() + 1;
+		/* NOTE(review): only stateList.length() indices are handed out below; the extra one looks unused. */
+		/* Set up the low and high values in the index for this production. */
+		dotItemIndex.data[indexPos].key = dsiLow;
+		dotItemIndex.data[indexPos].value = prod;
+		dotItemIndex.data[indexPos+1].key = dsiLow + numForProd - 1;
+		dotItemIndex.data[indexPos+1].value = prod;
+
+		int dsi = dsiLow;
+		for ( PdaStateList::Iter state = prod->fsm->stateList; state.lte(); state++, dsi++ ) {
+			/* All transitions are shifts. */
+			for ( TransMap::Iter out = state->transMap; out.lte(); out++ )
+				assert( out->value->isShift );
+
+			state->dotSet.insert( dsi ); /* one dot item index per state, in state list order */
+		}
+
+		/* Move over the production. */
+		dsiLow += numForProd;
+		indexPos += 2;
+
+		if ( prod->prodCommit ) {
+			for ( PdaStateSet::Iter fin = prod->fsm->finStateSet; fin.lte(); fin++ ) {
+				int length = prod->fsmLength;
+				//cerr << "PENDING COMMIT IN FINAL STATE of " << prod->prodId <<
+				//		" with len: " << length << endl;
+				(*fin)->pendingCommits.insert( ProdIdPair( prod->prodId, length ) );
+			}
+		}
+	}
+
+	/* Make the final state specific prod id to prod id mapping. */
+	prodIdIndex = new Definition*[prodList.length()]; /* indexed by prodId below */
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ )
+		prodIdIndex[prod->prodId] = prod;
+}
+
+/* Collect into result the keys that can come next after overSrc. Uses the
+ * first sets of the next item; if those contain epsilon, steps over the item
+ * in both overSrc and overTab and recurses. At the end of the production, takes
+ * the table keys on which parentDef is reduced. */
+void ParseData::findFollow( AlphSet &result, PdaState *overTab, 
+		PdaState *overSrc, Definition *parentDef )
+{
+	if ( overSrc->isFinState() ) {
+		assert( overSrc->transMap.length() == 0 );
+
+		/* At the end of the production. Turn to the table. */
+		long redCode = makeReduceCode( parentDef->prodId, false );
+		for ( TransMap::Iter tabTrans = overTab->transMap; tabTrans.lte(); tabTrans++ ) {
+			for ( ActDataList::Iter adl = tabTrans->value->actions; adl.lte(); adl++ ) {
+				if ( *adl == redCode )
+					result.insert( tabTrans->key );
+			}
+		}
+	}
+	else {
+		/* Get the first set of the item. If the first set contains epsilon
+		 * then move over overSrc and overTab and recurse. */
+		assert( overSrc->transMap.length() == 1 );
+		TransMap::Iter pastTrans = overSrc->transMap;
+
+		KlangEl *langEl = langElIndex[pastTrans->key];
+		if ( langEl != 0 && langEl->type == KlangEl::NonTerm ) {
+			bool hasEpsilon = false;
+			for ( LelDefList::Iter def = langEl->defList; def.lte(); def++ ) {
+				result.insert( def->firstSet );
+				/* A -1 entry in a first set is what marks epsilon here. */
+				if ( def->firstSet.find( -1 ) )
+					hasEpsilon = true;
+			}
+
+			/* Find the equivalent state in the parser. NOTE(review): the findTrans result is not checked. */
+			if ( hasEpsilon ) {
+				PdaTrans *tabTrans = overTab->findTrans( pastTrans->key );
+				findFollow( result, tabTrans->toState, 
+						pastTrans->value->toState, parentDef );
+			}
+
+			/* Now possibly the dup. */
+			if ( langEl->termDup != 0 )
+				result.insert( langEl->termDup->id );
+		}
+		else {
+			result.insert( pastTrans->key ); /* not a nonterminal: the key itself is what comes next */
+		}
+	}
+}
+
+PdaState *ParseData::followProd( PdaState *tabState, PdaState *prodState )
+{
+	/* Step the table along with the production while it has exactly one way on. */
+	while ( prodState->transMap.length() == 1 ) {
+		TransMap::Iter step = prodState->transMap;
+		tabState = tabState->findTrans( step->key )->toState;
+		prodState = step->value->toState;
+	}
+	return tabState;
+}
+
+void ParseData::trySetTime( PdaTrans *trans, long code, long &time )
+{
+	/* Only the first action equal to code is considered. Its ordering
+	 * slot is stamped with the current time, and time advanced, unless
+	 * the slot already holds a nonzero ordering. */
+	for ( ActDataList::Iter act = trans->actions; act.lte(); act++ ) {
+		if ( *act != code )
+			continue;
+
+		/* Zero means no ordering has been assigned yet. */
+		if ( trans->actOrds[act.pos()] == 0 ) {
+			trans->actOrds[act.pos()] = time++;
+		}
+		return;
+	}
+}
+
+/* Order the reduce action of `definition` on each key that may follow it, and record those keys' token regions. */
+void ParseData::pdaOrderFollow( KlangEl *rootEl, PdaState *tabState, 
+		PdaTrans *tabTrans, PdaTrans *srcTrans, Definition *parentDef, 
+		Definition *definition, long &time )
+{
+	/* We need the follow from tabState/srcState over the definition we are
+	 * currently processing. */
+	PdaState *overTab = tabTrans->toState;
+	PdaState *overSrc = srcTrans->toState;
+
+	AlphSet alphSet;
+	if ( parentDef == rootEl->rootDef )
+		alphSet.insert( eofKlangEl->id ); /* under the root definition only eof is used as follow */
+	else
+		findFollow( alphSet, overTab, overSrc, parentDef );		
+
+	/* Now follow the production to find out where it expands to. */
+	PdaState *expandToState = followProd( tabState, definition->fsm->startState );
+
+	/* Find the reduce item. */
+	long redCode = makeReduceCode( definition->prodId, false );
+
+	for ( TransMap::Iter tt = expandToState->transMap; tt.lte(); tt++ ) {
+		if ( alphSet.find( tt->key ) ) {
+			trySetTime( tt->value, redCode, time );
+	
+			/* If the items token region is not recorded in the state, do it now. */
+			addRegion( expandToState, tt->key );
+		}
+	}
+}
+
+bool regionVectHas( RegionVect &regVect, TokenRegion *region )
+{
+	/* Linear scan; entries are compared by pointer. */
+	RegionVect::Iter it = regVect;
+	while ( it.lte() && *it != region )
+		it++;
+	return it.lte();
+}
+
+void ParseData::addRegion( PdaState *tabState, long pdaKey )
+{
+	/* Only terminals that carry a token definition contribute a region,
+	 * and eof is excluded even if it has one. */
+	KlangEl *el = langElIndex[pdaKey];
+	if ( el == 0 || el->type != KlangEl::Term )
+		return;
+	if ( el == eofKlangEl || el->tokenDef == 0 )
+		return;
+
+	/* Record the region at most once per state. */
+	TokenRegion *region = el->tokenDef->tokenRegion;
+	if ( region != 0 && !regionVectHas( tabState->regions, region ) )
+		tabState->regions.append( region );
+}
+
+#if 0
+    orderState( tabState, prodState, time ):
+        if not tabState.dotSet.find( prodState.dotID )
+            tabState.dotSet.insert( prodState.dotID )
+            tabTrans = tabState.findMatchingTransition( prodState.getTransition() )
+
+            if tabTrans is NonTerminal:
+                for production in tabTrans.nonTerm.prodList:
+                    orderState( tabState, production.startState, time )
+
+                    for all expandToState in tabTrans.expandToStates:
+                        for all followTrans in expandToState.transList 
+                            reduceAction = findAction( production.reduction )
+                            if reduceAction.time is unset:
+                                reduceAction.time = time++
+                            end
+                        end
+                    end
+                end
+            end
+
+            shiftAction = tabTrans.findAction( shift )
+            if shiftAction.time is unset:
+                shiftAction.time = time++
+            end
+
+            orderState( tabTrans.toState, prodTrans.toState, time )
+        end
+    end
+
+    orderState( parseTable.startState, startProduction.startState, 1 )
+#endif
+/* Recursively assign action orderings along one production, stepping the production FSM and the table together. */
+void ParseData::pdaOrderProd( KlangEl *rootEl, PdaState *tabState, 
+	PdaState *srcState, Definition *parentDef, long &time )
+{
+	assert( srcState->dotSet.length() == 1 );
+	if ( tabState->dotSet2.find( srcState->dotSet[0] ) )
+		return; /* this dot item was already handled for this table state */
+	tabState->dotSet2.insert( srcState->dotSet[0] );
+	
+	assert( srcState->transMap.length() == 0 || srcState->transMap.length() == 1 );
+
+	if ( srcState->transMap.length() == 1 ) { 
+		TransMap::Iter srcTrans = srcState->transMap;
+
+		/* Find the equivalent state in the parser. */
+		PdaTrans *tabTrans = tabState->findTrans( srcTrans->key );
+
+		/* Recurse into the transition if it is a non-terminal. */
+		KlangEl *langEl = langElIndex[srcTrans->key];
+		if ( langEl != 0 ) {
+			if ( langEl->reduceFirst ) {
+				/* Use a shortest match ordering for the contents of this
+				 * nonterminal. Does follows for all productions first, then
+				 * goes down the productions. */
+				for ( LelDefList::Iter expDef = langEl->defList; expDef.lte(); expDef++ ) {
+					pdaOrderFollow( rootEl, tabState, tabTrans, srcTrans->value, 
+							parentDef, expDef, time );
+				}
+				for ( LelDefList::Iter expDef = langEl->defList; expDef.lte(); expDef++ )
+					pdaOrderProd( rootEl, tabState, expDef->fsm->startState, expDef, time );
+				
+			}
+			else {
+				/* The default action ordering. For each prod, goes down the
+				 * prod then sets the follow before going to the next prod. */
+				for ( LelDefList::Iter expDef = langEl->defList; expDef.lte(); expDef++ ) {
+					pdaOrderProd( rootEl, tabState, expDef->fsm->startState, expDef, time );
+
+					pdaOrderFollow( rootEl, tabState, tabTrans, srcTrans->value, 
+							parentDef, expDef, time );
+				}
+			}
+		}
+
+		trySetTime( tabTrans, SHIFT_CODE, time ); /* the shift is ordered after everything done above */
+
+		/* Now possibly for the dup. */
+		if ( langEl != 0 && langEl->termDup != 0 ) {
+			PdaTrans *dupTrans = tabState->findTrans( langEl->termDup->id );
+			trySetTime( dupTrans, SHIFT_CODE, time );
+		}
+
+		/* If the items token region is not recorded in the state, do it now. */
+		addRegion( tabState, srcTrans->key );
+
+		/* Go over one in the production. */
+		pdaOrderProd( rootEl, tabTrans->toState, 
+				srcTrans->value->toState, parentDef, time );
+	}
+}
+/* Give every action in pdaGraph an ordering, starting from rootEl's root definition; add the eof region where needed. */
+void ParseData::pdaActionOrder( PdaGraph *pdaGraph, KlangEl *rootEl )
+{
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		assert( (state->stateBits & SB_ISMARKED) == 0 );
+
+		/* Check that the transition keys are strictly increasing. */
+		long last = 0;
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			if ( ! trans.first() )
+				assert( last < trans->key );
+			last = trans->key;
+		}
+	}
+
+	/* Compute the action orderings, record the max value. */
+	long time = 1;
+	PdaState *startState = rootEl->rootDef->fsm->startState;
+	pdaOrderProd( rootEl, pdaGraph->startState, startState, rootEl->rootDef, time );
+
+	/* Walk over the start lang el and set the time for shift of
+	 * the eof action that completes the parse. */
+	PdaTrans *overStart = pdaGraph->startState->findTrans( rootEl->id );
+	PdaTrans *eofTrans = overStart->toState->findTrans( eofKlangEl->id );
+	eofTrans->actOrds[0] = time++; /* NOTE(review): overStart and eofTrans are used unchecked */
+
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		if ( state->regions.length() == 0 ) {
+			for ( TransMap::Iter tel = state->transMap; tel.lte(); tel++ ) {
+				/* There are no regions and EOF leaves the state. Add the eof
+				 * token region. */
+				PdaTrans *trans = tel->value;
+				if ( trans->lowKey == eofKlangEl->id )
+					state->regions.append( eofTokenRegion );
+			}
+		}
+	}
+
+	#ifdef COLM_LOG_COMPILE
+	/* Warn about states with empty token region lists. */
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		if ( state->regions.length() == 0 ) {
+			warning() << "state has an empty token region, state: " << 
+				state->stateNum << endl;
+		}
+	}
+	#endif
+
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		assert( CmpDotSet::compare( state->dotSet, state->dotSet2 ) == 0 );
+		for ( TransMap::Iter tel = state->transMap; tel.lte(); tel++ ) {
+			PdaTrans *trans = tel->value;
+			/* Check every action has an ordering; unset ones are reported and given the next time value. */
+			for ( ActDataList::Iter adl = trans->actOrds; adl.lte(); adl++ ) {
+				if ( *adl == 0 ) {
+					warning() << "action ordering for " << 
+						trans->actions[adl.pos()] << " is unset, state: " << 
+						state->stateNum << ", trans: ";
+
+					KlangEl *lel = langElIndex[trans->lowKey];
+					if ( lel == 0 )
+						cerr << (char)trans->lowKey << endl;
+					else
+						cerr << lel->name << endl;
+					*adl = time++;
+				}
+			}
+		}
+	}
+}
+/* Fold a state's single reduction into the shifts that enter it, when nothing else happens there; then prune. */
+void ParseData::advanceReductions( PdaGraph *pdaGraph )
+{
+	/* Loop all states. */
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		bool outHasShift = false;
+		ReductionMap outReds;
+		LongSet outCommits;
+		for ( TransMap::Iter out = state->transMap; out.lte(); out++ ) {
+			/* Get the transition from the trans el. */
+			if ( out->value->isShift )
+				outHasShift = true;
+			outReds.insert( out->value->reductions );
+			outCommits.insert( out->value->commits );
+		}
+
+		bool inHasShift = false;
+		ReductionMap inReds;
+		for ( PdaTransInList::Iter in = state->inRange; in.lte(); in++ ) {
+			/* Get the transition from the trans el. */
+			if ( in->isShift )
+				inHasShift = true;
+			inReds.insert( in->reductions );
+		}
+		/* Applies only if: no shift out, one distinct reduction out, a shift in, and no reductions in. */
+		if ( !outHasShift && outReds.length() == 1 && 
+				inHasShift && inReds.length() == 0 )
+		{
+			//cerr << "moving reduction to shift" << endl;
+
+			/* Move the reduction to all in transitions. */
+			for ( PdaTransInList::Iter in = state->inRange; in.lte(); in++ ) {
+				assert( in->actions.length() == 1 );
+				assert( in->actions[0] == SHIFT_CODE );
+				in->actions[0] = makeReduceCode( outReds[0].key, true );
+				in->afterShiftCommits.insert( outCommits );
+			}
+
+			/* 
+			 * Remove all transitions out of the state.
+			 */
+
+			/* Detach out range transitions. */
+			for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+				pdaGraph->detachTrans( state, trans->value->toState, trans->value );
+				delete trans->value;
+			}
+			state->transMap.empty(); /* the map entries are dropped only after every transition is deleted */
+
+			/* Redirect all the in transitions to the actionDestState. */
+			pdaGraph->inTransMove( actionDestState, state );
+		}
+	}
+
+	pdaGraph->removeUnreachableStates();
+}
+
+void ParseData::sortActions( PdaGraph *pdaGraph )
+{
+	/* Reorder every transition's actions: highest actPrior first, ties broken by the lowest actOrd. */
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		assert( CmpDotSet::compare( state->dotSet, state->dotSet2 ) == 0 );
+		for ( TransMap::Iter tel = state->transMap; tel.lte(); tel++ ) {
+			PdaTrans *trans = tel->value;
+
+			/* Selection sort: copy the three parallel lists, empty the originals, then refill them best-first. */
+			ActDataList actions( trans->actions );
+			ActDataList actOrds( trans->actOrds );
+			ActDataList actPriors( trans->actPriors );
+			trans->actions.empty();
+			trans->actOrds.empty();
+			trans->actPriors.empty();
+			while ( actOrds.length() > 0 ) {
+				int min = 0;	/* index of the best remaining entry */
+				for ( int i = 1; i < actOrds.length(); i++ ) {
+					if ( actPriors[i] > actPriors[min] ||
+							(actPriors[i] == actPriors[min] &&
+							actOrds[i] < actOrds[min] ) )
+					{
+						min = i;
+					}
+				}
+				trans->actions.append( actions[min] );
+				trans->actOrds.append( actOrds[min] );
+				trans->actPriors.append( actPriors[min] );
+				actions.remove(min);
+				actOrds.remove(min);
+				actPriors.remove(min);
+			}
+
+			if ( branchPointInfo && trans->actions.length() > 1 ) {	/* optional report of transitions holding several actions */
+				cerr << "info: branch point"
+						<< " state: " << state->stateNum
+						<< " trans: ";
+				KlangEl *lel = langElIndex[trans->lowKey];
+				if ( lel == 0 )
+					cerr << (char)trans->lowKey << endl;
+				else
+					cerr << lel->lit << endl;
+
+				for ( ActDataList::Iter act = trans->actions; act.lte(); act++ ) {
+					switch ( *act & 0x3 ) {	/* the low two bits select the action kind */
+					case 1: 
+						cerr << "    shift" << endl;
+						break;
+					case 2: 
+						cerr << "    reduce " << 
+								prodIdIndex[(*act >> 2)]->data << endl;
+						break;
+					case 3:
+						cerr << "    shift-reduce" << endl;
+						break;
+					}
+				}
+			}
+
+			/* Verify that shifts of nonterminals don't have any branch
+			 * points or commits. */
+			if ( trans->lowKey >= firstNonTermId ) {
+				if ( trans->actions.length() != 1 || 
+					(trans->actions[0] & 0x3) != 1 )
+				{
+					error() << "TRANS ON NONTERMINAL is something "
+						"other than a shift" << endl;
+				}
+				if ( trans->commits.length() > 0 )
+					error() << "TRANS ON NONTERMINAL has a commit" << endl;
+			}
+
+			/* TODO: Shift-reduces are optimizations. Verify that
+			 * shift-reduces exist only if they don't entail a conflict. */
+		}
+	}
+}
+
+void ParseData::reduceActions( PdaGraph *pdaGraph )
+{
+	/* Insert every transition's (target state, actions, commit length)
+	 * into the graph's action set and keep the resulting element. */
+	for ( PdaStateList::Iter st = pdaGraph->stateList; st.lte(); st++ ) {
+		for ( TransMap::Iter el = st->transMap; el.lte(); el++ ) {
+			PdaTrans *trans = el->value;
+
+			/* The last commit entry, or zero when there is none. */
+			int commitLen = 0;
+			if ( trans->commits.length() > 0 )
+				commitLen = trans->commits[trans->commits.length()-1];
+
+			if ( trans->afterShiftCommits.length() == 0 ) {
+				/* No after-shift commit: the length is stored negated. */
+				commitLen = -commitLen;
+			}
+			else {
+				int afterShift = trans->afterShiftCommits[
+					trans->afterShiftCommits.length()-1];
+				/* Use commitLen+1 only when it is set and the larger one. */
+				if ( commitLen <= 0 || commitLen+1 <= afterShift )
+					commitLen = afterShift;
+				else
+					commitLen = commitLen + 1;
+			}
+
+			PdaActionSetEl *inSet;
+			pdaGraph->actionSet.insert( ActionData( trans->toState->stateNum,
+					trans->actions, commitLen ), &inSet );
+			trans->actionSetEl = inSet;
+		}
+	}
+}
+
+void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangEl *rootEl )
+{	/* Builds every transition's action list, orders/sorts/compacts the actions, then asserts invariants. */
+	pdaGraph->maxState = pdaGraph->stateList.length() - 1;
+	pdaGraph->maxLelId = nextSymbolId - 1;
+	pdaGraph->maxOffset = pdaGraph->stateList.length() * pdaGraph->maxLelId;
+
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			if ( trans->value->isShift ) {	/* a shift contributes SHIFT_CODE with the shift priority */
+				trans->value->actions.append( SHIFT_CODE );
+				trans->value->actPriors.append( trans->value->shiftPrior );
+			}
+			for ( ReductionMap::Iter red = trans->value->reductions; red.lte(); red++ ) {	/* one reduce code per reduction; the map value is its priority */
+				trans->value->actions.append( makeReduceCode( red->key, false ) );
+				trans->value->actPriors.append( red->value );
+			}
+			trans->value->actOrds.appendDup( 0, trans->value->actions.length() );	/* presumably one zero ord per action; verify appendDup */
+		}
+	}
+
+	pdaActionOrder( pdaGraph, rootEl );
+	sortActions( pdaGraph );
+	advanceReductions( pdaGraph );
+	pdaGraph->setStateNumbers();
+	reduceActions( pdaGraph );
+
+	/* Set the action ids. */
+	int actionSetId = 0;
+	for ( PdaActionSet::Iter asi = pdaGraph->actionSet; asi.lte(); asi++ )
+		asi->key.id = actionSetId++;
+	
+	/* Get the max index. */
+	pdaGraph->maxIndex = actionSetId - 1;
+
+	/* Compute the max prod length. */
+	pdaGraph->maxProdLen = 0;
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		if ( (unsigned)prod->fsmLength > pdaGraph->maxProdLen )
+			pdaGraph->maxProdLen = prod->fsmLength;
+	}
+
+	/* Asserts that any transition with a nonterminal has a single action
+	 * which is either a shift or a shift-reduce. */
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			KlangEl *langEl = langElIndex[trans->value->lowKey];
+			if ( langEl != 0 && langEl->type == KlangEl::NonTerm ) {
+				assert( trans->value->actions.length() == 1 );
+				assert( trans->value->actions[0] == SHIFT_CODE ||
+					(trans->value->actions[0] & 0x3) == SHIFT_REDUCE_CODE );
+			}
+		}
+	}
+
+	/* Assert that shift reduces always appear on their own. */
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			for ( ActDataList::Iter act = trans->value->actions; act.lte(); act++ ) {
+				if ( (*act & 0x3) == SHIFT_REDUCE_CODE )
+					assert( trans->value->actions.length() == 1 );
+			}
+		}
+	}
+}
+
+void ParseData::wrapNonTerminals()
+{
+	/* Create the "_root" nonterminal. Every language element gets one
+	 * production under it so that a parser can be rooted at any element,
+	 * the start symbol included. */
+	KlangEl *root = new KlangEl( rootNamespace, "_root", KlangEl::NonTerm );
+	rootKlangEl = root;
+	langEls.append( root );
+	SymbolMapEl *rootMapEl = rootNamespace->symbolMap.insert( root->name, root );
+	assert( rootMapEl != 0 );
+
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		/* The single production used when this element is the root. */
+		ProdElList *elems = makeProdElList( lel );
+		Definition *rootDef = new Definition( InputLoc(), root, elems,
+				false, 0, prodList.length(), Definition::Production );
+		lel->rootDef = rootDef;
+		prodList.append( rootDef );
+		root->defList.append( rootDef );
+	}
+}
+
+bool ParseData::makeNonTermFirstSetProd( Definition *prod, PdaState *state )
+{	/* Grows prod->nonTermFirstSet from state's nonterminal transitions; returns true when anything was added. */
+	bool modified = false;
+	for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+		if ( trans->key >= firstNonTermId ) {	/* only keys at or above firstNonTermId are considered here */
+			long *inserted = prod->nonTermFirstSet.insert( trans->key );
+			if ( inserted != 0 )	/* presumably non-null only for a newly added key; verify insert */
+				modified = true;
+
+			bool hasEpsilon = false;
+			KlangEl *lel = langElIndex[trans->key];
+			for ( LelDefList::Iter ldef = lel->defList; ldef.lte(); ldef++ ) {	/* merge in the sets of this element's own productions */
+				for ( ProdIdSet::Iter pid = ldef->nonTermFirstSet; 
+						pid.lte(); pid++ )
+				{
+					if ( *pid == -1 )	/* -1 is the epsilon marker; it is not copied directly */
+						hasEpsilon = true;
+					else {
+						long *inserted = prod->nonTermFirstSet.insert( *pid );
+						if ( inserted != 0 )
+							modified = true;
+					}
+				}
+			}
+
+			if ( hasEpsilon ) {	/* the element may be empty, so continue from the state behind it */
+				if ( trans->value->toState->isFinState() ) {
+					long *inserted = prod->nonTermFirstSet.insert( -1 );
+					if ( inserted != 0 )
+						modified = true;
+				}
+
+				bool lmod = makeNonTermFirstSetProd( prod, trans->value->toState );
+				if ( lmod )
+					modified = true;
+			}
+		}
+	}
+	return modified;
+}
+
+
+void ParseData::makeNonTermFirstSets()
+{
+	/* Iterate to a fixed point: repeat until a full pass over the
+	 * productions adds nothing to any nonTermFirstSet. */
+	bool changed;
+	do {
+		changed = false;
+		for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+			/* A final start state puts the epsilon marker (-1) in the set. */
+			if ( prod->fsm->startState->isFinState() &&
+					prod->nonTermFirstSet.insert( -1 ) != 0 )
+				changed = true;
+			if ( makeNonTermFirstSetProd( prod, prod->fsm->startState ) )
+				changed = true;
+		}
+	} while ( changed );
+
+	/* A production whose set holds its own left-hand side id is left recursive. */
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		if ( prod->nonTermFirstSet.find( prod->prodName->id ) )
+			prod->isLeftRec = true;
+	}
+}
+
+void ParseData::printNonTermFirstSets()
+{
+	/* Debug dump to cerr: one line per production listing its set. */
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		cerr << prod->data << ": ";
+		for ( ProdIdSet::Iter pid = prod->nonTermFirstSet; pid.lte(); pid++ ) {
+			/* Negative ids are printed as epsilon. */
+			if ( *pid >= 0 )
+				cerr << " " << langElIndex[*pid]->name;
+			else
+				cerr << " <EPSILON>";
+		}
+		cerr << endl;
+
+		/* Flag the productions marked left recursive. */
+		if ( prod->isLeftRec )
+			cerr << "PROD IS LEFT REC: " << prod->data << endl;
+	}
+}
+
+bool ParseData::makeFirstSetProd( Definition *prod, PdaState *state )
+{	/* Grows prod->firstSet from the transitions leaving state; returns true when anything was added. */
+	bool modified = false;
+	for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+		if ( trans->key < firstNonTermId ) {	/* keys below firstNonTermId: just record the key */
+			long *inserted = prod->firstSet.insert( trans->key );
+			if ( inserted != 0 )
+				modified = true;
+		}
+		else {
+			long *inserted = prod->firstSet.insert( trans->key );
+			if ( inserted != 0 )
+				modified = true;
+
+			KlangEl *klangEl = langElIndex[trans->key];
+			if ( klangEl != 0 && klangEl->termDup != 0 ) {	/* also record the id of the element's termDup, when it has one */
+				long *inserted2 = prod->firstSet.insert( klangEl->termDup->id );
+				if ( inserted2 != 0 )
+					modified = true;
+			}
+
+			bool hasEpsilon = false;
+			KlangEl *lel = langElIndex[trans->key];	/* NOTE(review): same lookup as klangEl above, dereferenced here without the null check */
+			for ( LelDefList::Iter ldef = lel->defList; ldef.lte(); ldef++ ) {
+				for ( ProdIdSet::Iter pid = ldef->firstSet; 
+						pid.lte(); pid++ )
+				{
+					if ( *pid == -1 )	/* -1 is the epsilon marker; it is not copied directly */
+						hasEpsilon = true;
+					else {
+						long *inserted = prod->firstSet.insert( *pid );
+						if ( inserted != 0 )
+							modified = true;
+					}
+				}
+			}
+
+			if ( hasEpsilon ) {	/* the element may be empty, so continue from the state behind it */
+				if ( trans->value->toState->isFinState() ) {
+					long *inserted = prod->firstSet.insert( -1 );
+					if ( inserted != 0 )
+						modified = true;
+				}
+
+				bool lmod = makeFirstSetProd( prod, trans->value->toState );
+				if ( lmod )
+					modified = true;
+			}
+		}
+	}
+	return modified;
+}
+
+
+void ParseData::makeFirstSets()
+{
+	/* Fixed-point iteration: stop once a whole pass over the productions
+	 * leaves every firstSet unchanged. */
+	bool changed;
+	do {
+		changed = false;
+		for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+			/* A final start state puts the epsilon marker (-1) in the set. */
+			if ( prod->fsm->startState->isFinState() &&
+					prod->firstSet.insert( -1 ) != 0 )
+				changed = true;
+
+			if ( makeFirstSetProd( prod, prod->fsm->startState ) )
+				changed = true;
+		}
+	} while ( changed );
+}
+
+void ParseData::printFirstSets()
+{
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		cerr << prod->data << ": ";
+		for ( ProdIdSet::Iter pid = prod->firstSet; pid.lte(); pid++ ) {
+			if ( *pid < 0 ) {
+				cerr << " <EPSILON>";
+				continue;
+			}
+			/* One indented line per id: the element's name, or the raw id when no element is indexed. */
+			cerr << endl << "    ";
+			if ( langElIndex[*pid] != 0 )
+				cerr << langElIndex[*pid]->name;
+			else
+				cerr << *pid;
+		}
+		cerr << endl;
+	}
+}
+
+void ParseData::insertUniqueEmptyProductions()
+{	/* Appends one fresh nonterminal "U<n>" with a single definition per existing production and links it as uniqueEmptyLeader. */
+	int limit = prodList.length();
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		if ( prod->prodId == limit )	/* presumably the first production appended below: stop there */
+			break;
+
+		/* Name the new element. snprintf keeps the write inside the buffer, which now fits "U" plus any long. */
+		char name[32];
+		snprintf( name, sizeof(name), "U%li", prodList.length() );
+		KlangEl *prodName = getKlangEl( this, rootNamespace,
+				name, KlangEl::NonTerm );
+		Definition *newDef = new Definition( InputLoc(), prodName, 
+				0 /* FIXME new VarDef( name, 0 )*/, 
+				false, 0, prodList.length(), Definition::Production );
+		prodName->defList.append( newDef );
+		prodList.append( newDef );
+
+		prod->uniqueEmptyLeader = prodName;
+	}
+}
+
+void ParseData::makeRuntimeData()
+{
+	long count = 0;
+
+	/*
+	 * Fill in the RuntimeData object: frame, production, region, language
+	 * element, function, generic and literal tables, the parser list and
+	 * a few special ids. The pattern/replacement info is allocated and
+	 * zeroed here and filled in later. Code and tree pointers refer to
+	 * the code blocks' own buffers; nothing is copied.
+	 */
+
+	runtimeData->frameInfo = new FrameInfo[nextFrameId];
+	runtimeData->numFrames = nextFrameId;
+	memset( runtimeData->frameInfo, 0, sizeof(FrameInfo) * nextFrameId );
+
+	/*
+	 * Init code block.
+	 */
+	if ( rootCodeBlock == 0 ) {
+		runtimeData->rootCode = 0;
+		runtimeData->rootCodeLen = 0;
+	}
+	else {
+		/* The frame entry is only written when a root block exists. */
+		runtimeData->rootCode = rootCodeBlock->code.data;
+		runtimeData->rootCodeLen = rootCodeBlock->code.length();
+		runtimeData->frameInfo[rootCodeBlock->frameId].code = 0;
+		runtimeData->frameInfo[rootCodeBlock->frameId].codeLen = 0;
+		runtimeData->frameInfo[rootCodeBlock->frameId].trees = rootCodeBlock->trees.data;
+		runtimeData->frameInfo[rootCodeBlock->frameId].treesLen = rootCodeBlock->trees.length();
+	}
+
+	/*
+	 * prodInfo
+	 */
+	count = prodList.length();
+	runtimeData->prodInfo = new ProdInfo[count];
+	runtimeData->numProds = count;
+
+	count = 0;
+	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		runtimeData->prodInfo[count].length = prod->fsmLength;
+		runtimeData->prodInfo[count].lhsId = prod->prodName->id;
+		runtimeData->prodInfo[count].name = prod->data;
+		runtimeData->prodInfo[count].frameId = -1;
+
+		CodeBlock *block = prod->redBlock;
+		if ( block != 0 ) {
+			runtimeData->prodInfo[count].frameId = block->frameId;
+			runtimeData->frameInfo[block->frameId].code = block->code.data;
+			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+			runtimeData->frameInfo[block->frameId].trees = block->trees.data;
+			runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
+		}
+
+		runtimeData->prodInfo[count].lhsUpref = true;
+		count += 1;
+	}
+
+	/*
+	 * regionInfo
+	 */
+	runtimeData->numRegions = regionList.length()+1;
+	runtimeData->regionInfo = new RegionInfo[runtimeData->numRegions];
+	runtimeData->regionInfo[0].name = "___EMPTY";
+	runtimeData->regionInfo[0].defaultToken = -1;
+	runtimeData->regionInfo[0].eofFrameId = -1;
+	for ( RegionList::Iter reg = regionList; reg.lte(); reg++ ) {
+		long regId = reg->id+1;
+		runtimeData->regionInfo[regId].name = reg->name;
+		runtimeData->regionInfo[regId].defaultToken =
+			reg->defaultTokenDef == 0 ? -1 : reg->defaultTokenDef->token->id;
+		runtimeData->regionInfo[regId].eofFrameId = -1;
+
+		CodeBlock *block = reg->preEofBlock;
+		if ( block != 0 ) {
+			runtimeData->regionInfo[regId].eofFrameId = block->frameId;
+			runtimeData->frameInfo[block->frameId].code = block->code.data;
+			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+			runtimeData->frameInfo[block->frameId].trees = block->trees.data;
+			runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
+		}
+	}
+
+	/*
+	 * lelInfo
+	 */
+
+	count = nextSymbolId;
+	runtimeData->lelInfo = new LangElInfo[count];
+	runtimeData->numLangEls = count;
+
+	for ( int i = 0; i < nextSymbolId; i++ ) {
+		KlangEl *lel = langElIndex[i];
+		if ( lel != 0 ) {
+			runtimeData->lelInfo[i].name = lel->fullLit;
+			runtimeData->lelInfo[i].repeat = lel->isRepeat;
+			runtimeData->lelInfo[i].literal = lel->isLiteral;
+			runtimeData->lelInfo[i].ignore = lel->ignore;
+			runtimeData->lelInfo[i].frameId = -1;
+
+			CodeBlock *block = lel->transBlock;
+			if ( block != 0 ) {
+				runtimeData->lelInfo[i].frameId = block->frameId;
+				runtimeData->frameInfo[block->frameId].code = block->code.data;
+				runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+				runtimeData->frameInfo[block->frameId].trees = block->trees.data;
+				runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
+			}
+
+			runtimeData->lelInfo[i].objectTypeId = 
+					lel->objectDef == 0 ? 0 : lel->objectDef->id;
+			runtimeData->lelInfo[i].ofiOffset = lel->ofiOffset;
+			runtimeData->lelInfo[i].objectLength = 
+					( lel->objectDef == 0 || lel->objectDef == tokenObj ) ? 0 : 
+					lel->objectDef->size();
+			runtimeData->lelInfo[i].termDupId = lel->termDup == 0 ? 0 : lel->termDup->id;
+			runtimeData->lelInfo[i].genericId = lel->generic == 0 ? 0 : lel->generic->id;
+		}
+		else {
+			memset(&runtimeData->lelInfo[i], 0, sizeof(LangElInfo) );
+			runtimeData->lelInfo[i].name = "__UNUSED";
+			runtimeData->lelInfo[i].frameId = -1;
+		}
+	}
+
+	/*
+	 * FunctionInfo
+	 */
+	count = functionList.length();
+
+	runtimeData->functionInfo = new FunctionInfo[count];
+	runtimeData->numFunctions = count;
+	for ( FunctionList::Iter func = functionList; func.lte(); func++ ) {
+		runtimeData->functionInfo[func->funcId].name = func->name;
+		runtimeData->functionInfo[func->funcId].frameId = -1;
+
+		CodeBlock *block = func->codeBlock;
+		if ( block != 0 ) {
+			runtimeData->functionInfo[func->funcId].frameId = block->frameId;
+			runtimeData->frameInfo[block->frameId].code = block->code.data;
+			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+			runtimeData->frameInfo[block->frameId].trees = block->trees.data;
+			runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
+		}
+
+		runtimeData->functionInfo[func->funcId].argSize = func->paramListSize;
+		runtimeData->functionInfo[func->funcId].ntrees = func->localFrame->sizeTrees();
+		runtimeData->functionInfo[func->funcId].frameSize = func->localFrame->size();
+	}
+
+	/*
+	 * PatReplInfo
+	 */
+
+	/* Filled in later after patterns are parsed. */
+	runtimeData->patReplInfo = new PatReplInfo[nextPatReplId];
+	memset( runtimeData->patReplInfo, 0, sizeof(PatReplInfo) * nextPatReplId );
+	runtimeData->numPatterns = nextPatReplId;
+	runtimeData->patReplNodes = 0;
+	runtimeData->numPatternNodes = 0;
+
+	/*
+	 * GenericInfo
+	 */
+	count = 1;
+	for ( NamespaceList::Iter nspace = namespaceList; nspace.lte(); nspace++ )
+		count += nspace->genericList.length();
+	assert( count == nextGenericId );
+
+	runtimeData->genericInfo = new GenericInfo[count];
+	runtimeData->numGenerics = count;
+	memset( &runtimeData->genericInfo[0], 0, sizeof(GenericInfo) );
+	for ( NamespaceList::Iter nspace = namespaceList; nspace.lte(); nspace++ ) {
+		for ( GenericList::Iter gen = nspace->genericList; gen.lte(); gen++ ) {
+			runtimeData->genericInfo[gen->id].type = gen->typeId;
+			runtimeData->genericInfo[gen->id].typeArg = gen->utArg->typeId;
+			runtimeData->genericInfo[gen->id].keyType = gen->keyUT != 0 ? 
+					gen->keyUT->typeId : 0;
+			runtimeData->genericInfo[gen->id].keyOffset = 0;
+			runtimeData->genericInfo[gen->id].langElId = gen->langEl->id;
+		}
+	}
+
+	/*
+	 * Literals
+	 */
+	runtimeData->numLiterals = literalStrings.length();
+	runtimeData->litdata = new const char *[literalStrings.length()];
+	runtimeData->litlen = new long [literalStrings.length()];
+	runtimeData->literals = 0;
+	for ( StringMap::Iter el = literalStrings; el.lte(); el++ ) {
+		/* Data. */
+		char *data = new char[el->key.length()+1];
+		memcpy( data, el->key.data, el->key.length() );
+		data[el->key.length()] = 0;
+		runtimeData->litdata[el->value] = data;
+
+		/* Length. */
+		runtimeData->litlen[el->value] = el->key.length();
+	}
+
+	runtimeData->fsmTables = fsmTables;
+
+	runtimeData->parsers = new PdaTables*[nextParserId];
+	runtimeData->numParsers = nextParserId;
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->parserId >= 0 )
+			runtimeData->parsers[lel->parserId] = lel->pdaTables;
+	}
+		
+
+	runtimeData->globalSize = globalObjectDef->size();
+
+	/*
+	 * firstNonTermId
+	 */
+	runtimeData->firstNonTermId = firstNonTermId;
+
+	/* Special trees. */
+	runtimeData->integerId = intKlangEl->id;
+	runtimeData->stringId = strKlangEl->id;
+	runtimeData->anyId = anyKlangEl->id;
+	runtimeData->eofId = eofKlangEl->id;
+}
+
+/* Number the nodes of a tree in pre-order, storing each node's index in the
+ * borrowed alg->state field and reserving one slot per ignore token. */
+void mapNodes( Program *prg, int &count, Kid *kid )
+{
+	if ( kid == 0 )
+		return;
+
+	kid->tree->alg->state = count++;
+	for ( Kid *ign = tree_ignore( prg, kid->tree ); tree_is_ignore( prg, ign ); ign = ign->next )
+		count += 1;
+
+	/* Children first, then the siblings that follow. */
+	mapNodes( prg, count, tree_child( prg, kid->tree ) );
+	mapNodes( prg, count, kid->next );
+}
+
+/* Fill the flat PatReplNode array from the tree at kid, using the indices
+ * that mapNodes stored in alg->state. bindId is the next binding to match;
+ * it is advanced through the reference as bindings are found. */
+void fillNodes( Program *prg, Bindings &bindings, long &bindId, 
+		PatReplNode *nodes, Kid *kid )
+{
+	if ( kid != 0 ) {
+		long ind = kid->tree->alg->state;
+		PatReplNode &node = nodes[ind++];
+
+		Kid *child = tree_child( prg, kid->tree );
+
+		/* Set up the fields. */
+		node.id = kid->tree->id;
+		node.child = child == 0 ? -1 : child->tree->alg->state;
+		node.next = kid->next == 0 ? -1 : kid->next->tree->alg->state;
+		node.length = string_length( kid->tree->tokdata );
+		node.data = string_data( kid->tree->tokdata );
+
+		Kid *ignore = tree_ignore( prg, kid->tree );
+		node.ignore = ignore == 0 ? -1 : ind;
+
+		while ( ignore != 0 ) {	/* NOTE(review): mapNodes counts with tree_is_ignore(); confirm both walk the same list */
+			PatReplNode &ignNode = nodes[ind++];
+
+			memset( &ignNode, 0, sizeof(PatReplNode) );
+			ignNode.id = ignore->tree->id;
+			ignNode.next = ignore->next == 0 ? -1 : ind;
+			
+			ignNode.length = string_length( ignore->tree->tokdata );
+			ignNode.data = string_data( ignore->tree->tokdata );
+
+			ignore = ignore->next;
+		}
+
+		node.stop = kid->tree->alg->flags & AF_GENERATED;
+
+		/* Recurse. */
+		fillNodes( prg, bindings, bindId, nodes, child );
+
+		/* Bindings come in bottom-up order, so check after recursing. Once all
+		 * are matched bindId equals the length: never read past the end. */
+		node.bindId = 0;
+		if ( bindId < bindings.length() && bindings.data[bindId] == kid->tree ) {
+			/* Remember that binding ids are indexed from one. */
+			node.bindId = bindId++;
+		}
+
+		/* Move to the next child. */
+		fillNodes( prg, bindings, bindId, nodes, kid->next );
+	}
+}
+
+void ParseData::fillInPatterns( Program *prg )
+{
+	/*
+	 * patReplNodes: one flat node array shared by all patterns and replacements.
+	 */
+
+	/* mapNodes numbers the nodes of every pattern, then every replacement; count ends as the total. */
+	int count = 0;
+	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ )
+		mapNodes( prg, count, pat->pdaRun->stackTop );
+
+	for ( ReplList::Iter repl = replList; repl.lte(); repl++ )
+		mapNodes( prg, count, repl->pdaRun->stackTop );
+	
+	runtimeData->patReplNodes = new PatReplNode[count];
+	runtimeData->numPatternNodes = count;
+
+	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
+		runtimeData->patReplInfo[pat->patRepId].offset = 	/* index given to the node after stackTop */
+				pat->pdaRun->stackTop->next->tree->alg->state;
+
+		/* BindIds are indexed base one. */
+		runtimeData->patReplInfo[pat->patRepId].numBindings = 
+				pat->pdaRun->bindings.length() - 1;
+
+		/* Matching starts with binding one; fillNodes advances the id. */
+		long bindId = 1;
+		fillNodes( prg, pat->pdaRun->bindings, bindId,
+			runtimeData->patReplNodes, pat->pdaRun->stackTop );
+	}
+
+	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
+		runtimeData->patReplInfo[repl->patRepId].offset = 	/* index given to the node after stackTop */
+				repl->pdaRun->stackTop->next->tree->alg->state;
+
+		/* BindIds are indexed base one. */
+		runtimeData->patReplInfo[repl->patRepId].numBindings = 
+				repl->pdaRun->bindings.length() - 1;
+
+		long bindId = 1;
+		fillNodes( prg, repl->pdaRun->bindings, bindId,
+				runtimeData->patReplNodes, repl->pdaRun->stackTop );
+	}
+}
+
+
+PdaTables *ParseData::makePdaTables( PdaGraph *pdaGraph )
+{	/* Flattens pdaGraph into a newly allocated PdaTables of plain arrays and returns it. */
+	int count, curOffset, pos;
+	PdaTables *pdaTables = new PdaTables;
+
+	pdaTables->startState = pdaGraph->startState->stateNum;
+
+	/*
+	 * Indicies: per state, one action-set id for every key from its first to its last transition key; -1 fills the gaps.
+	 */
+	count = 0;
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			count++;
+			if ( ! trans.last() ) {
+				TransMap::Iter next = trans.next();
+				for ( long key = trans->key+1; key < next->key; key++ )
+					count++;
+			}
+		}
+	}
+	pdaTables->indicies = new int[count];
+	pdaTables->numIndicies = count;
+
+	count = 0;
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			pdaTables->indicies[count++] = trans->value->actionSetEl->key.id;
+
+			if ( ! trans.last() ) {
+				TransMap::Iter next = trans.next();
+				for ( long key = trans->key+1; key < next->key; key++ )
+					pdaTables->indicies[count++] = -1;
+			}
+		}
+	}
+
+	/*
+	 * Keys: two entries per state, its lowest and highest transition key (0 and 0 when it has no transitions).
+	 */
+	count = pdaGraph->stateList.length() * 2;;
+	pdaTables->keys = new int[count];
+	pdaTables->numKeys = count;
+
+	count = 0;
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		if ( state->transMap.length() == 0 ) {
+			pdaTables->keys[count+0] = 0;
+			pdaTables->keys[count+1] = 0;
+		}
+		else {
+			TransMap::Iter first = state->transMap.first();
+			TransMap::Iter last = state->transMap.last();
+			pdaTables->keys[count+0] = first->key;
+			pdaTables->keys[count+1] = last->key;
+		}
+		count += 2;
+	}
+
+	/*
+	 * Offsets: where each state's key span starts in indicies.
+	 */
+	count = pdaGraph->stateList.length(); 
+	pdaTables->offsets = new unsigned int[count];
+	pdaTables->numStates = count;
+
+	count = 0;
+	curOffset = 0;
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		pdaTables->offsets[count++] = curOffset;
+
+		/* Advance by the width of this state's key span (last key - first key + 1). */
+		if ( state->transMap.length() > 0 ) {
+			TransMap::Iter first = state->transMap.first();
+			TransMap::Iter last = state->transMap.last();
+			curOffset += last->key - first->key + 1;
+		}
+	}
+
+	/*
+	 * Targs: the targ field of each action set element, in set order.
+	 */
+	count = pdaGraph->actionSet.length();
+	pdaTables->targs = new unsigned int[count];
+	pdaTables->numTargs = count;
+
+	count = 0;
+	for ( PdaActionSet::Iter asi = pdaGraph->actionSet; asi.lte(); asi++ )
+		pdaTables->targs[count++] = asi->key.targ;
+
+	/* 
+	 * ActInds: start position of each action set element's run in the actions table.
+	 */
+	count = pdaGraph->actionSet.length();
+	pdaTables->actInds = new unsigned int[count];
+	pdaTables->numActInds = count;
+
+	count = pos = 0;
+	for ( PdaActionSet::Iter asi = pdaGraph->actionSet; asi.lte(); asi++ ) {
+		pdaTables->actInds[count++] = pos;
+		pos += asi->key.actions.length() + 1;
+	}
+
+	/*
+	 * Actions: each element's actions followed by a 0 terminator.
+	 */
+	count = 0;
+	for ( PdaActionSet::Iter asi = pdaGraph->actionSet; asi.lte(); asi++ )
+		count += asi->key.actions.length() + 1;
+
+	pdaTables->actions = new unsigned int[count];
+	pdaTables->numActions = count;
+
+	count = 0;
+	for ( PdaActionSet::Iter asi = pdaGraph->actionSet; asi.lte(); asi++ ) {
+		for ( ActDataList::Iter ali = asi->key.actions; ali.lte(); ali++ )
+			pdaTables->actions[count++] = *ali;
+
+		pdaTables->actions[count++] = 0;
+	}
+
+	/*
+	 * CommitLen: the commitLen of each action set element, in set order.
+	 */
+	count = pdaGraph->actionSet.length();
+	pdaTables->commitLen = new int[count];
+	pdaTables->numCommitLen = count;
+
+	count = 0;
+	for ( PdaActionSet::Iter asi = pdaGraph->actionSet; asi.lte(); asi++ )
+		pdaTables->commitLen[count++] = asi->key.commitLen;
+	
+	/*
+	 * tokenRegionInds: start position of each state's run in tokenRegions.
+	 */
+	count = pos = 0;
+	pdaTables->tokenRegionInds = new int[pdaTables->numStates];
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		pdaTables->tokenRegionInds[count++] = pos;
+		pos += state->regions.length() + 1;
+	}
+
+	/*
+	 * tokenRegions: each state's region ids plus one, followed by a 0 terminator.
+	 */
+
+	count = 0;
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ )
+		count += state->regions.length() + 1;
+
+	pdaTables->numRegionItems = count;
+	pdaTables->tokenRegions = new int[pdaTables->numRegionItems];
+
+	count = 0;
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		for ( RegionVect::Iter reg = state->regions; reg.lte(); reg++ )
+			pdaTables->tokenRegions[count++] = (*reg)->id + 1;
+
+		pdaTables->tokenRegions[count++] = 0;
+	}
+
+	/* Get a pointer to the (yet unfilled) global runtime data. */
+	pdaTables->gbl = runtimeData;
+
+	return pdaTables;
+}
+
+void ParseData::prepGrammar()
+{
+	wrapNonTerminals();
+	makeKlangElIds();
+	makeKlangElNames();
+	makeDefinitionNames();
+	noUndefindKlangEls();
+
+	/* Index the language elements by id; slots without an element stay null. */
+	langElIndex = new KlangEl*[nextSymbolId+1];
+	for ( long slot = 0; slot <= nextSymbolId; slot++ )
+		langElIndex[slot] = 0;
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ )
+		langElIndex[lel->id] = lel;
+
+	makeProdFsms();
+
+	/* Allocate the runtime data now: every PdaTables built later points at
+	 * it, although it is only filled in once all the tables exist. */
+	runtimeData = new RuntimeData;
+}
+
+PdaGraph *ParseData::makePdaGraph( KlangEl *rootEl )
+{
+	/* Generate the parser for rootEl into a freshly allocated graph
+	 * (via lalr1GenerateParser). */
+	PdaGraph *graph = new PdaGraph();
+	lalr1GenerateParser( graph, rootEl );
+
+	/* Number the states, then build and check the action lists. */
+	graph->setStateNumbers();
+	analyzeMachine( graph, rootEl );
+
+	/* The caller receives the new graph. */
+	return graph;
+}
+
+void ParseData::makeParser( KlangEl *rootEl )
+{
+	if ( rootEl->pdaTables != 0 )
+		return;		/* tables already exist for this root */
+	rootEl->pdaGraph = makePdaGraph( rootEl );
+	rootEl->pdaTables = makePdaTables( rootEl->pdaGraph );
+}
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
new file mode 100644
index 00000000..fee17754
--- /dev/null
+++ b/colm/pdacodegen.cpp
@@ -0,0 +1,536 @@
+/*
+ *  Copyright 2003-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <stdlib.h>
+#include <ctype.h>
+#include <limits.h>
+#include "colm.h"
+#include "parsedata.h"
+#include "avlmap.h"
+#include "avlbasic.h"
+#include "avlset.h"
+#include "mergesort.h"
+#include "pdacodegen.h"
+
+using std::cerr;
+using std::endl;
+
+#define FRESH_BLOCK 8128
+#define act_sb "0x1"
+#define act_rb "0x2"
+#define lower "0x0000ffff"
+#define upper "0xffff0000"
+
+void escapeLiteralString( std::ostream &out, const char *path, int length )
+{	/* Write `length` chars of `path` to `out`, escaped for a C string literal (quotes not included). */
+	for ( const char *pc = path, *end = path+length; pc != end; pc++ ) {
+		switch ( *pc ) {
+			case '\\': out << "\\\\"; break;
+			case '"':  out << "\\\""; break;
+			case '\a': out << "\\a"; break;
+			case '\b': out << "\\b"; break;
+			case '\t': out << "\\t"; break;
+			case '\n': out << "\\n"; break;
+			case '\v': out << "\\v"; break;
+			case '\f': out << "\\f"; break;
+			case '\r': out << "\\r"; break;
+			default:   out << *pc; break;	/* Anything else is copied through as is. */
+		}
+	}
+}
+
+void escapeLiteralString( std::ostream &out, const char *path )
+{	/* Overload for NUL-terminated strings; the length comes from strlen, so path must not be null. */
+	escapeLiteralString( out, path, strlen(path) );
+}
+
+void PdaCodeGen::writeTokenIds()
+{	/* Emit one comment block listing every language element as "name id", or the id alone. */
+	out << "/*\n";
+	for ( LelList::Iter lel = pd->langEls; lel.lte(); lel++ ) {
+		if ( lel->name != 0 )
+			out << "	" << lel->name << " " << lel->id << endl;
+		else
+			out << "	" << lel->id << endl;	/* Unnamed element. */
+	}
+	out << "*/\n\n";
+}
+
+
+void PdaCodeGen::writeFirst()
+{	/* Emit the prologue of the generated file: banner, runtime includes, extern declaration. */
+	out << 
+		"/*\n"
+		" * This code is generated\n"
+		"*/\n"
+		"\n"
+		"#include \"pdarun.h\"\n"
+		"#include \"fsmrun.h\"\n"
+		"\n"
+		"extern RuntimeData main_runtimeData;\n";	/* Defined later by writeRuntimeData. */
+
+	out <<
+		"\n";
+}
+
+void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
+{	/* Emit every table of runtimeData as an array definition, then the main_runtimeData aggregate. */
+	/*
+	 * Per-frame tables: code_<i> and trees_<i>, each emitted only when non-empty.
+	 */
+	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
+		if ( runtimeData->frameInfo[i].codeLen > 0 ) {
+			out << "Code code_" << i << "[] = {\n\t";
+
+			Code *block = runtimeData->frameInfo[i].code;
+			for ( int j = 0; j < runtimeData->frameInfo[i].codeLen; j++ ) {
+				out << (unsigned long) block[j];
+
+				if ( j < runtimeData->frameInfo[i].codeLen-1 ) {
+					out << ", ";
+					if ( (j+1) % 8 == 0 )	/* Eight values per output line. */
+						out << "\n\t";
+				}
+			}
+			out << "\n};\n\n";
+		}
+
+		if ( runtimeData->frameInfo[i].treesLen > 0 ) {
+			out << "char trees_" << i << "[] = {\n\t";
+
+			char *block = runtimeData->frameInfo[i].trees;
+			for ( int j = 0; j < runtimeData->frameInfo[i].treesLen; j++ ) {
+				out << (long) block[j];
+
+				if ( j < runtimeData->frameInfo[i].treesLen-1 ) {
+					out << ", ";
+					if ( (j+1) % 8 == 0 )
+						out << "\n\t";
+				}
+			}
+			out << "\n};\n\n";
+		}
+	}
+
+	/*
+	 * Root (init) code. Unlike the frame blocks it is emitted even when empty.
+	 */
+	out << "Code " << rootCode() << "[] = {\n\t";
+	Code *block = runtimeData->rootCode ;
+	for ( int j = 0; j < runtimeData->rootCodeLen; j++ ) {
+		out << (unsigned int) block[j];
+
+		if ( j < runtimeData->rootCodeLen-1 ) {
+			out << ", ";
+			if ( (j+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	/*
+	 * lelInfo: one initializer per language element.
+	 */
+	out << "LangElInfo " << lelInfo() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numLangEls; i++ ) {
+		out << "\t{ \"";
+
+		/* Name, escaped. It is measured with strlen, so it must not be null. */
+		escapeLiteralString( out, runtimeData->lelInfo[i].name );
+		out << "\"";
+		
+		/* Repeat, literal, ignore flags. */
+		out << ", " << runtimeData->lelInfo[i].repeat << ", " << 
+				runtimeData->lelInfo[i].literal << ", " <<
+				runtimeData->lelInfo[i].ignore << ", ";
+
+		out << runtimeData->lelInfo[i].frameId << ", ";
+
+		out << runtimeData->lelInfo[i].objectTypeId << ", ";
+
+		out << runtimeData->lelInfo[i].ofiOffset << ", ";
+
+		out << runtimeData->lelInfo[i].objectLength << ", ";
+
+		out << runtimeData->lelInfo[i].termDupId << ", ";
+
+		out << runtimeData->lelInfo[i].genericId;
+
+		out << " }";
+
+		if ( i < runtimeData->numLangEls-1 )
+			out << ",\n";
+	}
+	out << "\n};\n\n";
+
+	/*
+	 * frameInfo: refers to the code_<i> and trees_<i> arrays above, or 0 when empty.
+	 */
+	out << "FrameInfo " << frameInfo() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
+		out << "\t{ ";
+
+		if ( runtimeData->frameInfo[i].codeLen > 0 )
+			out << "code_" << i << ", ";
+		else
+			out << "0, ";
+
+		out << runtimeData->frameInfo[i].codeLen << ", ";
+
+		if ( runtimeData->frameInfo[i].treesLen > 0 )
+			out << "trees_" << i << ", ";
+		else
+			out << "0, ";
+
+		out << runtimeData->frameInfo[i].treesLen << ", ";
+
+		out << " }";
+
+		if ( i < runtimeData->numFrames-1 )
+			out << ",\n";
+	}
+	out << "\n};\n\n";
+
+
+	/*
+	 * prodInfo: note that the production name is written without escaping.
+	 */
+	out << "ProdInfo " << prodInfo() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numProds; i++ ) {
+		out << "\t{ ";
+
+		out << runtimeData->prodInfo[i].length << ", ";
+		out << runtimeData->prodInfo[i].lhsId << ", ";
+		out << '"' << runtimeData->prodInfo[i].name << "\", ";
+		out << runtimeData->prodInfo[i].frameId << ", ";
+		out << runtimeData->prodInfo[i].lhsUpref;
+
+		out << " }";
+
+		if ( i < runtimeData->numProds-1 )
+			out << ",\n";
+	}
+	out << "\n};\n\n";
+
+	/*
+	 * patReplInfo: every entry, including the last, ends with a comma.
+	 */
+	out << "PatReplInfo " << patReplInfo() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numPatterns; i++ ) {
+		out << "	{ " << runtimeData->patReplInfo[i].offset << ", " <<
+				runtimeData->patReplInfo[i].numBindings << " },\n";
+	}
+	out << "};\n\n";
+
+	/*
+	 * patReplNodes: node data is escaped using node.length; null data becomes 0.
+	 */
+	out << "PatReplNode " << patReplNodes() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numPatternNodes; i++ ) {
+		PatReplNode &node = runtimeData->patReplNodes[i];
+		out << "	{ " << node.id << ", " << node.next << ", " << 
+				node.child << ", " << node.bindId << ", ";
+		if ( node.data == 0 )
+			out << "0";
+		else {
+			out << '\"';
+			escapeLiteralString( out, node.data, node.length );
+			out << '\"';
+		}
+		out << ", " << node.length << ", ";
+
+		out << node.ignore << ", ";
+
+		out << node.stop << " },\n";
+	}
+	out << "};\n\n";
+
+	/*
+	 * functionInfo: note that the function name is written without escaping.
+	 */
+	out << "FunctionInfo " << functionInfo() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numFunctions; i++ ) {
+		out << "\t{ " <<
+				"\"" << runtimeData->functionInfo[i].name << "\", " <<
+				runtimeData->functionInfo[i].frameId << ", " <<
+				runtimeData->functionInfo[i].argSize << ", " <<
+				runtimeData->functionInfo[i].ntrees << ", " <<
+				runtimeData->functionInfo[i].frameSize;
+		out << " }";
+
+		if ( i < runtimeData->numFunctions-1 )
+			out << ",\n";
+	}
+	out << "\n};\n\n";
+
+	/*
+	 * regionInfo: escaped name, default token and eof frame id per region.
+	 */
+	out << "RegionInfo " << regionInfo() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numRegions; i++ ) {
+		out << "\t{ \"";
+		/* Name. */
+		escapeLiteralString( out, runtimeData->regionInfo[i].name );
+		out << "\", " << runtimeData->regionInfo[i].defaultToken <<
+			", " << runtimeData->regionInfo[i].eofFrameId <<
+			" }";
+
+		if ( i < runtimeData->numRegions-1 )
+			out << ",\n";
+	}
+	out << "\n};\n\n";
+
+	/*
+	 * genericInfo: every entry, including the last, ends with a comma.
+	 */
+	out << "GenericInfo " << genericInfo() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numGenerics; i++ ) {
+		out << "\t{ " << 
+				runtimeData->genericInfo[i].type << ", " <<
+				runtimeData->genericInfo[i].typeArg << ", " <<
+				runtimeData->genericInfo[i].keyOffset << ", " <<
+				runtimeData->genericInfo[i].keyType << ", " << 
+				runtimeData->genericInfo[i].langElId << " },\n";
+	}
+	out << "};\n\n";
+
+	/*
+	 * literals: the text (measured with strlen), the lengths, and a Head* table of zeros.
+	 */
+	out << "const char *" << litdata() << "[] = {\n";
+	for ( int i = 0; i < runtimeData->numLiterals; i++ ) {
+		out << "\t\"";
+		escapeLiteralString( out, runtimeData->litdata[i] );
+		out << "\",\n";
+	}
+	out << "};\n\n";
+
+	out << "long " << litlen() << "[] = {\n\t";
+	for ( int i = 0; i < runtimeData->numLiterals; i++ )
+		out << runtimeData->litlen[i] << ", ";
+	out << "};\n\n";
+
+	out << "Head *" << literals() << "[] = {\n\t";
+	for ( int i = 0; i < runtimeData->numLiterals; i++ )
+		out << "0, ";
+	out << "};\n\n";
+
+	/* Parsers: addresses of the pid_<i>_pdaTables objects that writeParserData emits. */
+	out << "PdaTables *parsers[] = {\n\t";
+	for ( long i = 0; i < runtimeData->numParsers; i++ ) {
+		out << "&pid_" << i << "_pdaTables,\n";
+	}
+	out << "};\n\n";
+
+	out <<	/* Positional initializer: NOTE(review) order presumably mirrors the RuntimeData declaration -- confirm. */
+		"RuntimeData main_runtimeData = \n"
+		"{\n"
+		"	" << lelInfo() << ",\n"
+		"	" << runtimeData->numLangEls << ",\n"
+		"\n"
+		"	" << prodInfo() << ",\n"
+		"	" << runtimeData->numProds << ",\n"
+		"\n"
+		"	" << regionInfo() << ",\n"
+		"	" << runtimeData->numRegions << ",\n"
+		"\n"
+		"	" << rootCode() << ",\n"
+		"	" << runtimeData->rootCodeLen << ",\n"
+		"\n"
+		"	" << frameInfo() << ",\n"
+		"	" << runtimeData->numFrames << ",\n"
+		"\n"
+		"	" << functionInfo() << ",\n"
+		"	" << runtimeData->numFunctions << ",\n"
+		"\n"
+		"	" << patReplInfo() << ",\n"
+		"	" << runtimeData->numPatterns << ",\n"
+		"\n"
+		"	" << patReplNodes() << ",\n"
+		"	" << runtimeData->numPatternNodes << ",\n"
+		"\n"
+		"	" << genericInfo() << ",\n"
+		"	" << runtimeData->numGenerics << ",\n"
+		"\n"
+		"	" << litdata() << ",\n"
+		"	" << litlen() << ",\n"
+		"	" << literals() << ",\n"
+		"	" << runtimeData->numLiterals << ",\n"
+		"\n"
+		"	&fsmTables_start,\n"
+		"	parsers, " << runtimeData->numParsers << ",\n"
+		"\n"
+		"	" << runtimeData->globalSize << ",\n"
+		"\n"
+		"	" << runtimeData->firstNonTermId << ",\n"
+		"	" << runtimeData->integerId << ",\n"
+		"	" << runtimeData->stringId << ",\n"
+		"	" << runtimeData->anyId << ",\n"
+		"	" << runtimeData->eofId << "\n"
+		"};\n"
+		"\n";
+}
+
+void PdaCodeGen::writeParserData( long id, PdaTables *tables )
+{	/* Emit the tables of parser `id` as pid_<id>_parser_* arrays, then the pid_<id>_pdaTables aggregate. */
+	String prefix = "pid_" + String(0, "%ld", id) + "_";
+	out << "unsigned int " << prefix << startState() << " = " <<
+		tables->startState << ";\n\n";
+
+	out << "int " << prefix << indicies() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numIndicies; i++ ) {
+		out << tables->indicies[i];
+
+		if ( i < tables->numIndicies-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )	/* Eight values per output line, here and below. */
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "int " << prefix << keys() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numKeys; i++ ) {
+		out << tables->keys[i];
+
+		if ( i < tables->numKeys-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "unsigned int " << prefix << offsets() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numStates; i++ ) {	/* One entry per state. */
+		out << tables->offsets[i];
+
+		if ( i < tables->numStates-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "unsigned int " << prefix << targs() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numTargs; i++ ) {
+		out << tables->targs[i];
+
+		if ( i < tables->numTargs-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "unsigned int " << prefix << actInds() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numActInds; i++ ) {
+		out << tables->actInds[i];
+
+		if ( i < tables->numActInds-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "unsigned int " << prefix << actions() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numActions; i++ ) {
+		out << tables->actions[i];
+
+		if ( i < tables->numActions-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "int " << prefix << commitLen() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numCommitLen; i++ ) {
+		out << tables->commitLen[i];
+
+		if ( i < tables->numCommitLen-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "int " << prefix << tokenRegionInds() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numStates; i++ ) {	/* One entry per state. */
+		out << tables->tokenRegionInds[i];
+
+		if ( i < tables->numStates-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << "int " << prefix << tokenRegions() << "[] = {\n\t";
+	for ( int i = 0; i < tables->numRegionItems; i++ ) {
+		out << tables->tokenRegions[i];
+
+		if ( i < tables->numRegionItems-1 ) {
+			out << ", ";
+			if ( (i+1) % 8 == 0 )
+				out << "\n\t";
+		}
+	}
+	out << "\n};\n\n";
+
+	out << 
+		"PdaTables " << prefix << "pdaTables =\n"
+		"{\n"
+		"	" << prefix << startState() << ",\n"
+		"	" << prefix << indicies() << ",\n"
+		"	" << prefix << keys() << ",\n"
+		"	" << prefix << offsets() << ",\n"
+		"	" << prefix << targs() << ",\n"
+		"	" << prefix << actInds() << ",\n"
+		"	" << prefix << actions() << ",\n"
+		"	" << prefix << commitLen() << ",\n"
+
+		"	" << prefix << tokenRegionInds() << ",\n"
+		"	" << prefix << tokenRegions() << ",\n"
+		"\n"
+		"	" << tables->numIndicies << ",\n"
+		"	" << tables->numKeys << ",\n"
+		"	" << tables->numStates << ",\n"
+		"	" << tables->numTargs << ",\n"
+		"	" << tables->numActInds << ",\n"
+		"	" << tables->numActions << ",\n"
+		"	" << tables->numCommitLen << ",\n"
+		"	" << tables->numRegionItems << ",\n"
+		"\n"
+		"\n"
+		"	&main_runtimeData\n"	/* The shared runtime data emitted by writeRuntimeData. */
+		"};\n"
+		"\n";
+}
+
diff --git a/colm/pdacodegen.h b/colm/pdacodegen.h
new file mode 100644
index 00000000..79e6677c
--- /dev/null
+++ b/colm/pdacodegen.h
@@ -0,0 +1,105 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+
+#ifndef _PDACODEGEN_H
+#define _PDACODEGEN_H
+
+struct ParseData;
+
+struct PdaCodeGen
+{	/* Writes parser tables and runtime data as generated source text to `out`. */
+	PdaCodeGen( const char *fileName, const char *parserName, ParseData *pd, ostream &out )
+	:
+		fileName(fileName),
+		parserName(parserName),
+		pd(pd),
+		out(out)
+	{}
+
+	/*
+	 * Code Generation. pdacodegen.cpp defines only the four write* functions listed with writeFirst below, plus writeTokenIds.
+	 */
+	void startCodeGen();
+	void endCodeGen( int endLine );
+
+	void writeTokenIds();
+	void writeLangEls();
+
+	void writeReference( Definition *prod, char *data );
+	void writeUndoReference( Definition *prod, char *data );
+	void writeFinalReference( Definition *prod, char *data );
+	void writeFirstLocate( Definition *prod );
+	void writeRhsLocate( Definition *prod );
+
+	void writeFirst();
+	void writeRuntimeData( RuntimeData *runtimeData );
+	void writeParserData( long id, PdaTables *tables );
+
+	String PARSER() { return "parser_"; }	/* Common prefix of every generated identifier below. */
+
+	String startState() { return PARSER() + "startState"; }
+	String indicies() { return PARSER() + "indicies"; }
+	String keys() { return PARSER() + "keys"; }
+	String offsets() { return PARSER() + "offsets"; }
+	String targs() { return PARSER() + "targs"; }
+	String actInds() { return PARSER() + "actInds"; }
+	String actions() { return PARSER() + "actions"; }
+	String commitLen() { return PARSER() + "commitLen"; }
+	String fssProdIdIndex() { return PARSER() + "fssProdIdIndex"; }
+	String prodLengths() { return PARSER() + "prodLengths"; }
+	String prodLhsIds() { return PARSER() + "prodLhsIds"; }
+	String prodNames() { return PARSER() + "prodNames"; }
+	String lelInfo() { return PARSER() + "lelInfo"; }
+	String prodInfo() { return PARSER() + "prodInfo"; }
+	String tokenRegionInds() { return PARSER() + "tokenRegionInds"; }
+	String tokenRegionsDirect() { return PARSER() + "tokenRegionsDirect"; }
+	String tokenRegions() { return PARSER() + "tokenRegions"; }
+	String prodCodeBlocks() { return PARSER() + "prodCodeBlocks"; }
+	String prodCodeBlockLens() { return PARSER() + "prodCodeBlockLens"; }
+	String rootCode() { return PARSER() + "rootCode"; }
+	String frameInfo() { return PARSER() + "frameInfo"; }
+	String functionInfo() { return PARSER() + "functionInfo"; }
+	String objFieldInfo() { return PARSER() + "objFieldInfo"; }
+	String patReplInfo() { return PARSER() + "patReplInfo"; }
+	String patReplNodes() { return PARSER() + "patReplNodes"; }
+	String regionInfo() { return PARSER() + "regionInfo"; }
+	String genericInfo() { return PARSER() + "genericInfo"; }
+	String litdata() { return PARSER() + "litdata"; }
+	String litlen() { return PARSER() + "litlen"; }
+	String literals() { return PARSER() + "literals"; }
+	String fsmTables() { return PARSER() + "fsmTables"; }
+
+	/* 
+	 * Graphviz Generation
+	 */
+	void writeTransList( PdaState *state );
+	void writeDotFile( PdaGraph *graph );
+	void writeDotFile( );
+	
+
+	const char *fileName;	/* Stored as given; the string is not copied. */
+	const char *parserName;	/* Stored as given; the string is not copied. */
+	ParseData *pd;
+	ostream &out;	/* Destination of all generated text; held by reference. */
+};
+
+#endif
diff --git a/colm/pdagraph.cpp b/colm/pdagraph.cpp
new file mode 100644
index 00000000..22c77dcc
--- /dev/null
+++ b/colm/pdagraph.cpp
@@ -0,0 +1,518 @@
+/*
+ *  Copyright 2001, 2002, 2005 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <string.h>
+#include <iostream>
+#include <string.h>
+#include <assert.h>
+#include "colm.h"
+#include "pdagraph.h"
+#include "mergesort.h"
+
+using std::cerr;
+using std::endl;
+
+/* Create a new state. It starts with no in transitions, no pending commits,
+ * no state bits and every marker flag cleared. No state number is set here. */
+PdaState::PdaState()
+:
+	/* No in transitions. */
+	inRange(),
+
+	/* No pending commits. */
+	pendingCommits(),
+
+	stateSet(0),
+
+	/* Only used during merging. Normally null. */
+	stateDictEl(0),
+
+	/* No state identification bits. */
+	stateBits(0),
+
+	onClosureQueue(false),
+	inClosedMap(false),
+	followMarked(false)
+{
+}
+
+/* Copy the state data and duplicate the out transitions. The duplicates keep
+ * pointing at the original targets until the PdaGraph copy constructor runs. */
+PdaState::PdaState(const PdaState &other)
+:
+	inRange(),
+
+	/* Duplicate the pending commits. NOTE(review): presumably these hold plain
+	 * values rather than state pointers and so need no fixing -- confirm. */
+	pendingCommits(other.pendingCommits),
+
+	stateSet(0),
+
+	/* This is only used during merging. Normally null. */
+	stateDictEl(0),
+
+	/* Fsm state data. */
+	stateBits(other.stateBits),
+
+	dotSet(other.dotSet),
+	onClosureQueue(false),
+	inClosedMap(false),
+	followMarked(false),
+
+	transMap()
+{
+	/* Duplicate all the transitions. */
+	for ( TransMap::Iter trans = other.transMap; trans.lte(); trans++ ) {
+		/* Duplicate and store the original target in the transition. This will
+		 * be corrected once all the states have been created. */
+		PdaTrans *newTrans = new PdaTrans(*trans->value);
+		newTrans->toState = trans->value->toState;
+		transMap.append( TransMapEl( newTrans->lowKey, newTrans ) );
+	}
+}
+
+/* Release the state dict element, if there is one. Everything else is left
+ * up to the PdaGraph destructor. */
+PdaState::~PdaState()
+{
+	/* Deleting a null pointer has no effect, so no guard is needed. */
+	delete stateDictEl;
+}
+
+/* Graph constructor. The new graph has no start state. */
+PdaGraph::PdaGraph()
+:
+	/* No start state. */
+	startState(0)
+{
+}
+
+/* Copy all graph data including transitions. Overwrites stateMap in every state of the source graph. */
+PdaGraph::PdaGraph( const PdaGraph &graph )
+:
+	/* Lists start empty. Will be filled by copy. */
+	stateList(),
+	misfitList(),
+
+	/* Copy in the start state. It still points into the source graph;
+	 * the pointer is resolved below. */
+	startState(graph.startState),
+
+	/* Will be filled by copy. */
+	finStateSet()
+{
+	/* Create the states and record their map in the original state. */
+	PdaStateList::Iter origState = graph.stateList;
+	for ( ; origState.lte(); origState++ ) {
+		/* Make the new state. */
+		PdaState *newState = new PdaState( *origState );
+
+		/* Add the state to the list.  */
+		stateList.append( newState );
+
+		/* Record the duplicate in the stateMap field of the old state. */
+		origState->stateMap = newState;
+	}
+	
+	/* Dereference all the state maps. */
+	for ( PdaStateList::Iter state = stateList; state.lte(); state++ ) {
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+			/* The transition points to the original in the source graph. The
+			 * target's duplicate is in its stateMap. */
+			PdaState *toState = trans->value->toState != 0 ? 
+					trans->value->toState->stateMap : 0;
+
+			/* Attach the transition to the duplicate. */
+			trans->value->toState = 0;
+			attachTrans( state, toState, trans->value );
+		}
+	}
+
+	/* Fix the start state pointer. A source graph with no start state (the
+	 * default-constructed case) has nothing to map, so it stays null. */
+	startState = startState != 0 ? startState->stateMap : 0;
+
+	/* Build the final state set. */
+	PdaStateSet::Iter st = graph.finStateSet; 
+	for ( ; st.lte(); st++ ) 
+		finStateSet.insert((*st)->stateMap);
+}
+
+/* Deletes every transition found in the states' transMaps, then empties the state list. */
+PdaGraph::~PdaGraph()
+{
+	/* Delete all the transitions. */
+	PdaStateList::Iter state = stateList;
+	for ( ; state.lte(); state++ ) {
+		for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ )
+			delete trans->value;
+	}
+
+	/* Delete all the states. */
+	stateList.empty();
+}
+
+/* Set a state final. The state gets its SB_ISFINAL bit set and is added to
+ * the finStateSet. Does nothing if the state is already final. */
+void PdaGraph::setFinState( PdaState *state )
+{
+	/* Is it already a fin state. */
+	if ( state->stateBits & SB_ISFINAL )
+		return;
+	
+	state->stateBits |= SB_ISFINAL;
+	finStateSet.insert( state );
+}
+
+void PdaGraph::unsetAllFinStates( )
+{
+	/* Clear the final bit on every member, then drop the whole set. */
+	PdaStateSet::Iter fin = finStateSet;
+	for ( ; fin.lte(); fin++ )
+		(*fin)->stateBits &= ~ SB_ISFINAL;
+	finStateSet.empty();
+}
+
+/* Set the start state. There must not already be a start state (asserted). */
+void PdaGraph::setStartState( PdaState *state )
+{
+	/* Should change from unset to set. */
+	assert( startState == 0 );
+	startState = state;
+}
+
+/* Mark all states reachable from state with SB_ISMARKED. Traverses transitions
+ * forward, recursively. Used for removing states that have no path into them. */
+void PdaGraph::markReachableFromHere( PdaState *state )
+{
+	/* Base case: already visited. */
+	if ( state->stateBits & SB_ISMARKED )
+		return;
+	
+	/* Set this state as processed. We are going to visit all states that this
+	 * state has a transition to. */
+	state->stateBits |= SB_ISMARKED;
+
+	/* Recurse on all out transitions that have a target. */
+	for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+		if ( trans->value->toState != 0 )
+			markReachableFromHere( trans->value->toState );
+	}
+}
+
+void PdaGraph::setStateNumbers()
+{
+	/* Number the states consecutively from zero, in list order. */
+	int nextNum = 0;
+	for ( PdaStateList::Iter st = stateList; st.lte(); st++, nextNum++ )
+		st->stateNum = nextNum;
+}
+
+/* Insert a transition at the front of an inlist. The head must be supplied. */
+void PdaGraph::attachToInList( PdaState *from, PdaState *to, 
+		PdaTrans *&head, PdaTrans *trans )
+{
+	trans->ilnext = head;
+	trans->ilprev = 0;
+
+	/* If in trans list is not empty, set the head->prev to trans. */
+	if ( head != 0 )
+		head->ilprev = trans;
+
+	/* Now insert ourselves at the front of the list. */
+	head = trans;
+}
+
+/* Detach a transition from an inlist. The head of the inlist must be supplied. */
+void PdaGraph::detachFromInList( PdaState *from, PdaState *to, 
+		PdaTrans *&head, PdaTrans *trans )
+{
+	/* Unlink from the predecessor (or the head). trans keeps its old links. */
+	if ( trans->ilprev == 0 ) 
+		head = trans->ilnext; 
+	else
+		trans->ilprev->ilnext = trans->ilnext; 
+
+	if ( trans->ilnext != 0 )
+		trans->ilnext->ilprev = trans->ilprev; 
+}
+
+/* Make a new transition from `from` to `to` on lowKey, append it to the end
+ * of from's transMap and link it into to's inRange list. NOTE(review): append
+ * presumably requires that lowKey sorts after every key already in the map --
+ * confirm against the callers. The last (unnamed) parameter is unused. */
+PdaTrans *PdaGraph::appendNewTrans( PdaState *from, PdaState *to, long lowKey, long )
+{
+	/* Make the new transition. */
+	PdaTrans *retVal = new PdaTrans();
+
+	/* The transition is now attached. Remember the parties involved. */
+	retVal->fromState = from;
+	retVal->toState = to;
+
+	/* Make the entry in the out list for the transitions. */
+	from->transMap.append( TransMapEl( lowKey, retVal ) );
+
+	/* Set the key of the new trans. */
+	retVal->lowKey = lowKey;
+
+	/* Attach using inRange as the head pointer. */
+	attachToInList( from, to, to->inRange.head, retVal );
+
+	return retVal;
+}
+
+PdaTrans *PdaGraph::insertNewTrans( PdaState *from, PdaState *to, long lowKey, long )
+{	/* Same as appendNewTrans, except the map entry is made with transMap.insert. Last parameter unused. */
+	/* Make the new transition. */
+	PdaTrans *retVal = new PdaTrans();
+
+	/* The transition is now attached. Remember the parties involved. */
+	retVal->fromState = from;
+	retVal->toState = to;
+
+	/* Make the entry in the out list. NOTE(review): the result of insert is not checked. */
+	from->transMap.insert( lowKey, retVal );
+
+	/* Set the key of the new trans. */
+	retVal->lowKey = lowKey;
+
+	/* Attach using inRange as the head pointer. */
+	attachToInList( from, to, to->inRange.head, retVal );
+
+	return retVal;
+}
+
+/* Attach a transition that is already allocated to its source and target
+ * states. The transition must currently be detached, which is asserted. It
+ * is linked into the target's inRange list only; adding it to the source's
+ * transMap is left to the caller. */
+void PdaGraph::attachTrans( PdaState *from, PdaState *to, PdaTrans *trans )
+{
+	assert( trans->fromState == 0 && trans->toState == 0 );
+	trans->fromState = from;
+	trans->toState = to;
+
+	/* Attach using the inRange pointer as the head pointer. */
+	attachToInList( from, to, to->inRange.head, trans );
+}
+
+/* Detach a transition from its source and target states. Unlinks it from the
+ * target's inRange list and clears its state pointers; transMap is untouched. */
+void PdaGraph::detachTrans( PdaState *from, PdaState *to, PdaTrans *trans )
+{
+	assert( trans->fromState == from && trans->toState == to );
+	trans->fromState = 0;
+	trans->toState = 0;
+
+	/* Detach using to's inRange pointer as the head. */
+	detachFromInList( from, to, to->inRange.head, trans );
+}
+
+
+/* Detach a state from the graph. Detaches and deletes the transitions in and
+ * out of the state and removes it from the final state set. The state stays
+ * on the state list; unlinking and deleting it is left to the caller. */
+void PdaGraph::detachState( PdaState *state )
+{
+	/* Detach the in transitions from the inRange list of transitions. */
+	while ( state->inRange.head != 0 ) {
+		/* Get pointers to the trans and the state. */
+		PdaTrans *trans = state->inRange.head;
+		PdaState *fromState = trans->fromState;
+
+		/* Detach the transitions from the source state. */
+		detachTrans( fromState, state, trans );
+
+		/* Remove the source's map entry first, then delete the transition. */
+		fromState->transMap.remove( trans->lowKey );
+		delete trans;
+	}
+
+	/* Detach out range transitions. */
+	for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
+		detachTrans( state, trans->value->toState, trans->value );
+		delete trans->value;
+	}
+
+	/* Drop the map entries, which now point at deleted transitions. */
+	state->transMap.empty();
+
+	/* Unset final stateness before detaching from graph. */
+	if ( state->stateBits & SB_ISFINAL )
+		finStateSet.remove( state );
+}
+
+/* Move all the transitions that go into src so that they go into dest.  */
+void PdaGraph::inTransMove( PdaState *dest, PdaState *src )
+{
+	/* Do not try to move in trans to and from the same state. */
+	assert( dest != src );
+
+	/* The start state pointer is not updated here, so src must not be it. */
+	assert( src != startState );
+
+	/* Move the transitions in inRange. */
+	while ( src->inRange.head != 0 ) {
+		/* Get trans and from state. */
+		PdaTrans *trans = src->inRange.head;
+		PdaState *fromState = trans->fromState;
+
+		/* Detach from src, reattach to dest. */
+		detachTrans( fromState, src, trans );
+		attachTrans( fromState, dest, trans );
+	}
+}
+
+void PdaGraph::addInReduction( PdaTrans *dest, long prodId, long prior )
+{
+	/* Look for the reduction on prodId. If it is not there insert it with
+	 * prior, otherwise keep the larger of the two priorities. */
+	ReductionMapEl *redMapEl = dest->reductions.find( prodId );
+	if ( redMapEl == 0 )
+		dest->reductions.insert( prodId, prior );
+	else if ( prior > redMapEl->value )
+		redMapEl->value = prior;
+}
+
+/* Callback invoked when another trans (or possibly this one) is added into
+ * destTrans during the merging process. Draws the properties of srcTrans
+ * into destTrans: the shift flag and priority, the reductions and the commit
+ * points. It is called when a new transition is made that will be a duplicate
+ * of another transition or a combination of several others, once for each
+ * transition that the new transition is to represent. */
+void PdaGraph::addInTrans( PdaTrans *destTrans, PdaTrans *srcTrans )
+{
+	/* Protect against adding in from ourselves. */
+	if ( srcTrans != destTrans ) {
+
+		/* Add in the shift priority. */
+		if ( destTrans->isShift && srcTrans->isShift ) {
+			/* Both shifts are set. We want the max of the two. */
+			if ( srcTrans->shiftPrior > destTrans->shiftPrior )
+				destTrans->shiftPrior = srcTrans->shiftPrior;
+		}
+		else if ( srcTrans->isShift ) {
+			/* Just the source is set, copy the source prior over. */
+			destTrans->shiftPrior = srcTrans->shiftPrior;
+		}
+
+		/* If either is a shift, dest is a shift. */
+		destTrans->isShift = destTrans->isShift || srcTrans->isShift;
+
+		/* Add in the reductions. */
+		for ( ReductionMap::Iter red = srcTrans->reductions; red.lte(); red++ )
+			addInReduction( destTrans, red->key, red->value );
+
+		/* Add in the commit points. */
+		destTrans->commits.insert( srcTrans->commits );
+	}
+}
+
+void PdaGraph::addInState( PdaState *destState, PdaState *srcState )
+{
+	/* Draw in any properties of srcState into destState. */
+	if ( srcState != destState ) {
+		/* Draw in the pending commits, reporting on cerr when there are any. */
+		destState->pendingCommits.insert( srcState->pendingCommits );
+		if ( srcState->pendingCommits.length() > 0 )
+			cerr << "THERE ARE PENDING COMMITS DRAWN IN" << endl;
+
+		/* Parser generation data. */
+		destState->dotSet.insert( srcState->dotSet );
+
+		if ( srcState->onClosureQueue && !destState->onClosureQueue ) {	/* Queue dest once if src was queued. */
+			stateClosureQueue.append( destState );
+			destState->onClosureQueue = true;
+		}
+	}
+}
+
+/* Make a new state and put it at the end of the graph's list of states.
+ * The new state is default constructed, so it has no state bits set. */
+PdaState *PdaGraph::addState()
+{
+	/* Make the new state to return. */
+	PdaState *state = new PdaState();
+
+	/* Put it on the state list. */
+	stateList.append( state );
+
+	return state;
+}
+
+
+/* Starting at from, take the keys that lead srcFsm from its start state to a final state. */
+PdaState *PdaGraph::followFsm( PdaState *from, PdaGraph *srcFsm )
+{
+	PdaState *followSrc = srcFsm->startState;
+
+	while ( ! followSrc->isFinState() ) {
+		assert( followSrc->transMap.length() == 1 );	/* srcFsm must not branch. */
+		PdaTrans *followTrans = followSrc->transMap[0].value;
+
+		PdaTrans *inTrans = from->findTrans( followTrans->lowKey );
+		assert( inTrans != 0 );	/* The same key must exist in this graph. */
+
+		from = inTrans->toState;
+		followSrc = followTrans->toState;
+	}
+
+	return from;
+}
+
+int PdaGraph::fsmLength( )
+{	/* Count the transitions from the start state to the first final state, taking transMap[0] at each step. */
+	int length = 0;
+	for ( PdaState *state = startState; ! state->isFinState(); length++ ) {
+		/* A non-final state with no transition out cannot be followed. */
+		assert( state->transMap.length() > 0 );
+		state = state->transMap[0].value->toState;
+	}
+	return length;
+}
+
+/* Remove states that have no path to them from the start state. Recursively
+ * traverses the graph marking states that have paths into them. Then removes
+ * all states that did not get marked. */
+void PdaGraph::removeUnreachableStates()
+{
+	/* Mark all the states that can be reached from the start state. */
+	/* NOTE: startState is used without a null check. */
+	markReachableFromHere( startState );
+
+	/* Delete all states that are not marked
+	 * and unmark the ones that are marked. */
+	PdaState *state = stateList.head;
+	while ( state ) {
+		PdaState *next = state->next;	/* Saved first: state may be deleted below. */
+
+		if ( state->stateBits & SB_ISMARKED )
+			state->stateBits &= ~ SB_ISMARKED;
+		else {
+			detachState( state );
+			stateList.detach( state );
+			delete state;
+		}
+
+		state = next;
+	}
+}
diff --git a/colm/pdagraph.h b/colm/pdagraph.h
new file mode 100644
index 00000000..8442ac10
--- /dev/null
+++ b/colm/pdagraph.h
@@ -0,0 +1,504 @@
+/*
+ *  Copyright 2001-2005 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _PDAGRAPH_H
+#define _PDAGRAPH_H
+
+#include <assert.h>
+#include "vector.h"
+#include "bstset.h"
+#include "compare.h"
+#include "avltree.h"
+#include "dlist.h"
+#include "bstmap.h"
+#include "sbstmap.h"
+#include "sbstset.h"
+#include "sbsttable.h"
+#include "avlset.h"
+#include "dlistmel.h"
+#include "avltree.h"
+
+/* Flags for states. These are bits in PdaState::stateBits. */
+#define SB_ISFINAL    0x04 /* Tested by PdaState::isFinState(). */
+#define SB_ISMARKED   0x08 /* Scratch mark, see removeUnreachableStates(). */
+#define SB_ISSTART    0x10
+
+/* Flags for transitions. */
+#define TB_ISMARKED   0x01
+
+struct PdaTrans;
+struct PdaState;
+struct PdaGraph;
+struct TokenDef;
+struct Definition;
+struct KlangEl;
+struct TokenRegion;
+
+typedef Vector<TokenRegion*> RegionVect;
+
+typedef Vector<long> ActDataList;
+
+struct ActionData /* Element type stored in PdaActionSet. */
+{
+	ActionData( int targ, ActDataList &actions, int commitLen )
+		: targ(targ), commitLen(commitLen), id(0), actions(actions) { }
+
+	int targ;
+	int commitLen;
+	int id; /* Not a constructor argument, always starts out as 0. */
+
+	ActDataList actions; /* Own copy of the list passed to the constructor. */
+};
+
+
+struct CmpActionData
+{
+	/* Three-way ordering of ActionData. Fields are compared in the order
+	 * targ, commitLen, id. When all three agree the action lists break
+	 * the tie. */
+	static int compare( const ActionData &ap1, const ActionData &ap2 )
+	{
+		if ( ap1.targ != ap2.targ )
+			return ap1.targ < ap2.targ ? -1 : 1;
+
+		if ( ap1.commitLen != ap2.commitLen )
+			return ap1.commitLen < ap2.commitLen ? -1 : 1;
+
+		if ( ap1.id != ap2.id )
+			return ap1.id < ap2.id ? -1 : 1;
+
+		/* All scalar fields agree, let the table compare decide. */
+		return CmpTable< long, CmpOrd<long> >::
+			compare( ap1.actions, ap2.actions );
+	}
+};
+
+typedef AvlSet<ActionData, CmpActionData> PdaActionSet;
+typedef AvlSetEl<ActionData> PdaActionSetEl;
+
+/* List pointers for the closure queue. PdaState inherits from this. */
+struct ClosureQueueListEl { PdaState *prev, *next; };
+
+/* Queues of states and of transitions to be closed. */
+typedef DListMel< PdaState, ClosureQueueListEl > StateClosureQueue;
+typedef DList<PdaTrans> TransClosureQueue;
+
+typedef BstSet< Definition*, CmpOrd<Definition*> > DefSet;
+typedef CmpTable< Definition*, CmpOrd<Definition*> > CmpDefSet;
+typedef BstSet< DefSet, CmpDefSet > DefSetSet;
+
+typedef Vector< Definition* > DefVect;
+typedef BstSet< long, CmpOrd<long> > AlphSet;
+
+struct ExpandToEl /* Element type of ExpandToSet: a state and a prodId. */
+{
+	ExpandToEl( PdaState *state, int prodId )
+		: state(state), prodId(prodId) { }
+
+	PdaState *state; /* Major sort key in CmpExpandToEl (by address). */
+	int prodId; /* Minor sort key in CmpExpandToEl. */
+};
+
+struct CmpExpandToEl
+{
+	/* Three-way compare, state pointer is the major key, prodId the minor. */
+	static inline int compare( const ExpandToEl &etel1, const ExpandToEl &etel2 )
+	{
+		/* Different state pointers decide the order outright. */
+		if ( etel1.state != etel2.state )
+			return etel1.state < etel2.state ? -1 : 1;
+
+		/* Same state, order by production id. */
+		if ( etel1.prodId != etel2.prodId )
+			return etel1.prodId < etel2.prodId ? -1 : 1;
+
+		return 0;
+	}
+};
+
+typedef BstSet<ExpandToEl, CmpExpandToEl> ExpandToSet;
+typedef BstSet< int, CmpOrd<int> > IntSet;
+typedef CmpTable< int, CmpOrd<int> > CmpIntSet;
+
+typedef BstSet< long, CmpOrd<long> > LongSet;
+typedef CmpTable< long, CmpOrd<long> > CmpLongSet;
+
+typedef BstMap< long, long, CmpOrd<long> > LongMap;
+typedef BstMapEl< long, long > LongMapEl;
+
+typedef LongSet ProdIdSet;
+typedef CmpLongSet CmpProdIdSet;
+
+/* Set of states, list of states. */
+typedef BstSet<PdaState*> PdaStateSet;
+typedef Vector<PdaState*> StateVect;
+typedef DList<PdaState> PdaStateList;
+
+typedef LongMap FollowToAdd;
+typedef LongMap ReductionMap;
+typedef LongMapEl ReductionMapEl;
+
+struct ProdIdPair /* Element type of ProdIdPairSet. */
+{
+	ProdIdPair( int onReduce, int length )
+		: onReduce(onReduce), length(length) {}
+
+	int onReduce; /* Major sort key in CmpProdIdPair. */
+	int length; /* Minor sort key in CmpProdIdPair. */
+};
+
+struct CmpProdIdPair
+{
+	/* Three-way compare, onReduce is the major key and length the minor. */
+	static inline int compare( const ProdIdPair &pair1, const ProdIdPair &pair2 )
+	{
+		/* Different onReduce values decide the order outright. */
+		if ( pair1.onReduce != pair2.onReduce )
+			return pair1.onReduce < pair2.onReduce ? -1 : 1;
+
+		/* Same onReduce, order by length. */
+		if ( pair1.length != pair2.length )
+			return pair1.length < pair2.length ? -1 : 1;
+
+		return 0;
+	}
+};
+
+typedef BstSet< ProdIdPair, CmpProdIdPair > ProdIdPairSet;
+
+/* Transition class that implements actions and priorities. */
+struct PdaTrans 
+{
+	/* Every scalar and pointer member starts out zeroed. */
+	PdaTrans() : 
+		lowKey(0), fromState(0), toState(0), 
+		prev(0), next(0), ilprev(0), ilnext(0),
+		isShift(false), isShiftReduce(false),
+		shiftPrior(0), actionSetEl(0)
+	{ }
+
+	/* Copies the key, shift data, reductions and commits only. The copy is
+	 * not attached to any state or list and has no action set element. */
+	PdaTrans( const PdaTrans &other ) :
+		lowKey(other.lowKey), fromState(0), toState(0),
+		prev(0), next(0), ilprev(0), ilnext(0),
+		isShift(other.isShift), isShiftReduce(other.isShiftReduce),
+		shiftPrior(other.shiftPrior), reductions(other.reductions),
+		actionSetEl(0), commits(other.commits)
+	{ }
+
+	long lowKey;
+	PdaState *fromState;
+	PdaState *toState;
+
+	/* Pointers for outlist. */
+	PdaTrans *prev, *next;
+
+	/* Pointers for in-list. */
+	PdaTrans *ilprev, *ilnext;
+
+	long maxPrior();
+
+	/* Parse Table construction data. */
+	bool isShift, isShiftReduce;
+	int shiftPrior;
+	ReductionMap reductions;
+	ActDataList actions;
+	ActDataList actOrds;
+	ActDataList actPriors;
+
+	ExpandToSet expandTo;
+
+	PdaActionSetEl *actionSetEl;
+
+	LongSet commits;
+	LongSet afterShiftCommits;
+};
+
+/* In transition list. Like DList except it only has a head pointer, which is
+ * all that is required. Insertion and deletion are handled by the graph. This
+ * class provides the iterator of a single list, linked by ilprev and ilnext. */
+struct PdaTransInList
+{
+	PdaTransInList() : head(0) { }
+
+	PdaTrans *head;
+
+	struct Iter
+	{
+		/* Default construct at the end position (null pointer). */
+		Iter() : ptr(0) { }
+
+		/* Construct, assign from a list. Both start at the list head. */
+		Iter( const PdaTransInList &il )  : ptr(il.head) { }
+		Iter &operator=( const PdaTransInList &dl ) { ptr = dl.head; return *this; }
+
+		/* Still on an element (lte), or run off the end (end). */
+		bool lte() const    { return ptr != 0; }
+		bool end() const    { return ptr == 0; }
+
+		/* At the first, last element. Both are false when at the end. */
+		bool first() const { return ptr && ptr->ilprev == 0; }
+		bool last() const  { return ptr && ptr->ilnext == 0; }
+
+		/* Cast, dereference, arrow ops. */
+		operator PdaTrans*() const   { return ptr; }
+		PdaTrans &operator *() const { return *ptr; }
+		PdaTrans *operator->() const { return ptr; }
+
+		/* Postfix increment, decrement. Not valid when at the end. */
+		inline void operator++(int)   { ptr = ptr->ilnext; }
+		inline void operator--(int)   { ptr = ptr->ilprev; }
+
+		/* The iterator is simply a pointer. */
+		PdaTrans *ptr;
+	};
+};
+
+typedef DList<PdaTrans> PdaTransList;
+
+/* An element in a state dict: maps a set of states to a target state. */
+struct PdaStateDictEl 
+:
+	public AvlTreeEl<PdaStateDictEl>
+{
+	PdaStateDictEl(const PdaStateSet &stateSet) 
+		: stateSet(stateSet), targState(0) { }
+
+	const PdaStateSet &getKey() { return stateSet; } /* Key for the dict. */
+	PdaStateSet stateSet;
+	PdaState *targState; /* Null until the owner assigns a target. */
+};
+
+/* Dictionary mapping a set of states to a target state. */
+typedef AvlTree< PdaStateDictEl, PdaStateSet, CmpTable<PdaState*> > PdaStateDict;
+
+/* What items does a particular state encompass. */
+typedef BstSet< long, CmpOrd<long> > DotSet;
+typedef CmpTable< long, CmpOrd<long> > CmpDotSet;
+
+/* Map of dot sets to states. */
+typedef AvlTree< PdaState, DotSet, CmpDotSet > DotSetMap;
+typedef PdaState DotSetMapEl;
+
+typedef BstMap< long, PdaTrans* > TransMap;
+typedef BstMapEl< long, PdaTrans* > TransMapEl;
+
+/* State class. Also a closure queue element and a DotSetMap tree element. */
+struct PdaState 
+: 
+	public ClosureQueueListEl,
+	public AvlTreeEl< PdaState >
+{
+	PdaState();
+	PdaState(const PdaState &other);
+	~PdaState();
+
+	/* Is the state final? True when SB_ISFINAL is set in stateBits. */
+	bool isFinState() { return stateBits & SB_ISFINAL; }
+
+	PdaTrans *findTrans( long key ) /* Null when transMap has no such key. */
+	{
+		TransMapEl *transMapEl = transMap.find( key );
+		if ( transMapEl == 0 )
+			return 0;
+		return transMapEl->value;
+	}
+
+	/* In transition list. */
+	PdaTransInList inRange;
+
+	ProdIdPairSet pendingCommits;
+
+	/* When duplicating the fsm we need to map each 
+	 * state to the new state representing it. */
+	PdaState *stateMap;
+
+	/* When merging states (state machine operations) this next pointer is
+	 * used for the list of states that need to be filled in. */
+	PdaState *alg_next;
+
+	PdaStateSet *stateSet;
+
+	/* Identification for printing and stable minimization. */
+	int stateNum;
+
+	/* A pointer to a dict element that contains the set of states this state
+	 * represents. This cannot go into alg, because alg.next is used during
+	 * the merging process. */
+	PdaStateDictEl *stateDictEl;
+
+	/* State flags, a combination of the SB_* bits. */
+	int stateBits;
+
+	/* State list elements. These hide the closure queue prev/next. */
+	PdaState *next, *prev;
+
+	/* Key accessor for the dot set map: states are keyed on dotSet. */
+	DotSet &getKey() { return dotSet; }
+
+	/* Closure management. */
+	DotSet dotSet;
+	DotSet dotSet2;
+	bool onClosureQueue;
+	bool inClosedMap;
+	bool followMarked;
+	bool onStateList;
+
+	TransMap transMap; /* Out transitions keyed by long, see findTrans. */
+
+	RegionVect regions;
+};
+
+/* Compare lists of epsilon transitions. Entries are name ids of targets. */
+typedef CmpTable< int, CmpOrd<int> > CmpEpsilonTrans;
+
+/* Compare sets of context values. */
+typedef CmpTable< int, CmpOrd<int> > CmpContextSets;
+
+/* Graph class that implements actions and priorities. */
+struct PdaGraph 
+{
+	/* Constructors/Destructors. */
+	PdaGraph();
+	PdaGraph( const PdaGraph &graph );
+	~PdaGraph();
+
+	/* The list of states, and the misfit list (see removeMisfits). */
+	PdaStateList stateList;
+	PdaStateList misfitList;
+
+	/* The start state. */
+	PdaState *startState;
+
+	/* The set of final states. */
+	PdaStateSet finStateSet;
+
+	/* Closure queues and maps. */
+	DotSetMap closedMap;
+	StateClosureQueue stateClosureQueue;
+	StateClosureQueue stateClosedList;
+
+	TransClosureQueue transClosureQueue;
+	PdaState *stateClosureHead;
+
+	KlangEl **langElIndex;
+
+	void setStartState( PdaState *state );
+	void unsetStartState( );
+	
+	/*
+	 * Basic attaching and detaching.
+	 */
+
+	/* Common to attaching/detaching list and default. */
+	void attachToInList( PdaState *from, PdaState *to, PdaTrans *&head, PdaTrans *trans );
+	void detachFromInList( PdaState *from, PdaState *to, PdaTrans *&head, PdaTrans *trans );
+
+	/* Attach with a new transition. The last parameter is unnamed here. */
+	PdaTrans *appendNewTrans( PdaState *from, PdaState *to, long onChar1, long );
+	PdaTrans *insertNewTrans( PdaState *from, PdaState *to, long lowKey, long );
+
+	/* Attach with an existing transition that is already in an out list. */
+	void attachTrans( PdaState *from, PdaState *to, PdaTrans *trans );
+	
+	/* Detach a transition from a target state. */
+	void detachTrans( PdaState *from, PdaState *to, PdaTrans *trans );
+
+	/* Detach a state from the graph. */
+	void detachState( PdaState *state );
+
+	/*
+	 * Callbacks.
+	 */
+
+	/* Add the properties of the source into the destination. */
+	void addInReduction( PdaTrans *dest, long prodId, long prior );
+	void addInTrans( PdaTrans *destTrans, PdaTrans *srcTrans );
+	void addInState( PdaState *destState, PdaState *srcState );
+
+	/*
+	 * Allocation.
+	 */
+
+	/* Allocate a new state and append it to stateList. */
+	PdaState *addState();
+
+	/*
+	 * Fsm operators.
+	 */
+
+	/* Follow to the fin state of src fsm. */
+	PdaState *followFsm( PdaState *from, PdaGraph *srcFsm );
+
+	/*
+	 * Final states
+	 */
+
+	/* Set and Unset a state as final. */
+	void setFinState( PdaState *state );
+	void unsetFinState( PdaState *state );
+	void unsetAllFinStates( );
+
+	/* Set State numbers starting at 0. */
+	void setStateNumbers();
+
+	/*
+	 * Path pruning
+	 */
+
+	/* Mark all states reachable from state. */
+	void markReachableFromHere( PdaState *state );
+
+	/* Removes states that cannot be reached by any path in the fsm and are
+	 * thus wasted silicon. */
+	void removeUnreachableStates();
+
+	/* Remove error actions from states on which the error transition will
+	 * never be taken. NOTE(review): does this describe outListCovers? */
+	bool outListCovers( PdaState *state );
+
+	/* Remove states that are on the misfit list. */
+	void removeMisfits();
+
+
+	/*
+	 * Other
+	 */
+
+	/* Move the in transitions of src over to dest. */
+	void inTransMove(PdaState *dest, PdaState *src);
+
+	int fsmLength( ); /* Transitions from the start to a final state. */
+
+	/* Collected machine information. */
+	unsigned long long maxState;
+	unsigned long long maxAction;
+	unsigned long long maxLelId;
+	unsigned long long maxOffset;
+	unsigned long long maxIndex;
+	unsigned long long maxProdLen;
+
+	PdaActionSet actionSet;
+};
+
+
+#endif /* _PDAGRAPH_H */
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
new file mode 100644
index 00000000..35a60446
--- /dev/null
+++ b/colm/pdarun.cpp
@@ -0,0 +1,646 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <errno.h>
+#include <stdio.h>
+#include <fstream>
+#include <string>
+
+#include "config.h"
+#include "pdarun.h"
+#include "fsmrun.h"
+
+using std::ostream;
+using std::cout;
+using std::cerr;
+using std::endl;
+
+#define act_sb 0x1 /* Action bit tested in parseToken to shift. */
+#define act_rb 0x2 /* Action bit tested in parseToken to reduce. */
+#define lower 0x0000ffff /* Mask of the low 16 bits. */
+#define upper 0xffff0000 /* Mask of the high 16 bits. */
+#define reject() induceReject = 1 /* Expects an induceReject in scope. */
+
+Tree *PdaRun::getParsedRoot( bool stop )
+{	/* With stop the root is the top of the stack, otherwise one below. */
+	return ( stop ? stackTop : stackTop->next )->tree;
+}
+
+void PdaRun::clean()
+{
+	/* Release every stack element: drop its tree ref, then free the kid. */
+	for ( Kid *kid = stackTop, *next = 0; kid != 0; kid = next ) {
+		/* Save the link before the kid goes back to the pool. */
+		next = kid->next;
+
+		tree_downref( prg, kid->tree );
+		prg->kidPool.free( kid );
+	}
+}
+
+bool PdaRun::isParserStopFinished()
+{
+	/* Done when the stack holds exactly two kids and the top is stopTarget. */
+	Kid *below = stackTop->next;
+	if ( below == 0 || below->next != 0 )
+		return false;
+	return stackTop->tree->id == stopTarget;
+}
+
+void PdaRun::init()
+{
+	cs = tables->startState; /* Begin in the start state of the tables. */
+
+	/* Allocate the initial stack element: a kid with its own tree and alg. */
+	stackTop = prg->kidPool.allocate();
+	stackTop->tree = prg->treePool.allocate();
+	stackTop->tree->alg = prg->algPool.allocate();
+
+	stackTop->tree->alg->state = -1; /* Negative: see stackTopTarget(). */
+	stackTop->tree->refs = 1;
+	numRetry = 0;
+	errCount = 0;
+	nextRegionInd = tables->tokenRegionInds[cs];
+	stopParsing = false;
+	accumIgnore = 0;
+
+	/* Bindings are indexed at 1. Slot 0 is the no-binding entry. */
+	bindings.push(0);
+}
+
+long PdaRun::stackTopTarget()
+{
+	Tree *top = stackTop->tree;
+	long topState = top->alg->state;
+
+	/* A negative state means nothing was shifted: use the start state. */
+	if ( topState < 0 )
+		return tables->startState;
+
+	/* Otherwise look up the target of the transition taken on top's id. */
+	long ind = tables->offsets[topState] + (top->id - tables->keys[topState<<1]);
+	return tables->targs[(int)tables->indicies[ind]];
+}
+
+#define push(i) (*(--sp) = (i)) /* Pre-decrement the local sp, then store. */
+#define pop() (*sp++) /* Read the word at sp, then post-increment sp. */
+
+bool beenCommitted( Kid *kid )
+{	/* True when AF_COMMITTED is set in the flags of the kid's alg. */
+	return ( kid->tree->alg->flags & AF_COMMITTED ) != 0;
+}
+
+bool beenFreed( Kid *kid )
+{	/* True when AF_REV_FREED is set in the flags of the kid's alg. */
+	return ( kid->tree->alg->flags & AF_REV_FREED ) != 0;
+}
+
+/* The top level of the stack is linked right-to-left. Trees underneath are
+ * left to right natural order. */
+
+void PdaRun::commitKid( Tree **root, Kid *lel )
+{
+	Alg *alg = 0;
+	Tree *tree = 0;
+	Tree **sp = root; /* Explicit stack of parent kids, used by push/pop. */
+
+head:
+	/* Load up the parsed tree. A saved alg->parsed replaces lel->tree. */
+	tree = lel->tree;
+	alg = tree->alg;
+	if ( alg->parsed != 0 )
+		tree = alg->parsed;
+
+	/* Recurse only on non-generated trees. */
+	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
+		push( (Tree*)lel ); /* Remember the parent while in its children. */
+		lel = tree_child( prg, tree );
+
+		while ( lel != 0 ) {
+			if ( !beenCommitted( lel ) )
+				goto head; /* Descend into this uncommitted child. */
+
+			upwards: /* Re-entry point after a child has been committed. */
+			lel = lel->next;
+		}
+
+		lel = (Kid*)pop(); /* Children done, back to the parent. */
+	}
+
+	/* Commit */
+	#ifdef COLM_LOG_PARSE
+	cerr << "commit visiting: " << 
+			prg->rtd->lelInfo[lel->tree->id].name << endl;
+	#endif
+
+	alg = lel->tree->alg;
+
+	/* Reset retries. Each pending retry was counted once in numRetry. */
+	if ( alg->retry_lower > 0 ) {
+		numRetry -= 1;
+		alg->retry_lower = 0;
+	}
+	if ( alg->retry_upper > 0 ) {
+		numRetry -= 1;
+		alg->retry_upper = 0;
+	}
+	alg->flags |= AF_COMMITTED;
+
+	if ( sp != root ) /* Parents still stacked: resume the sibling walk. */
+		goto upwards;
+
+	numRetry = 0;
+	assert( sp == root );
+}
+
+
+/* The top level of the stack is linked right-to-left. Trees underneath are
+ * left to right natural order. */
+void parsed_downref_kid( Tree **root, Program *prg, Kid *lel )
+{
+	Alg *alg = 0;
+	Tree *tree = 0;
+	Tree **sp = root; /* Explicit stack of parent kids, used by push/pop. */
+
+head:
+	/* Load up the right tree. A saved alg->parsed replaces lel->tree. */
+	tree = lel->tree;
+	alg = tree->alg;
+	if ( alg->parsed != 0 )
+		tree = alg->parsed;
+
+	/* Recurse, but not into generated trees. */
+	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
+		push( (Tree*)lel ); /* Remember the parent while in its children. */
+		lel = tree_child( prg, tree );
+
+		while ( lel != 0 ) {
+			if ( !beenFreed( lel ) )
+				goto head; /* Descend into this child, not yet freed. */
+
+			upwards: /* Re-entry point after a child has been handled. */
+			lel = lel->next;
+		}
+
+		lel = (Kid*)pop(); /* Children done, back to the parent. */
+	}
+
+	/* Mark the node as freed and drop its parsed tree. */
+	#ifdef COLM_LOG_PARSE
+	cerr << "rev free visiting: " << 
+			prg->rtd->lelInfo[lel->tree->id].name << endl;
+	#endif
+
+	alg = lel->tree->alg;
+
+	alg->flags |= AF_REV_FREED;
+	/* NOTE(review): parsed may be 0 here, tree_downref must accept that. */
+	tree_downref( prg, alg->parsed );
+	alg->parsed = 0;
+
+	if ( sp != root ) /* Parents still stacked: resume the sibling walk. */
+		goto upwards;
+
+	assert( sp == root );
+}
+
+void parsed_downref( Tree **root, Program *prg, Tree *tree )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "running parsed_downref on tree" << endl;
+	#endif
+
+	/* Wrap the tree in a temporary, unlinked kid (tree first, then next)
+	 * so that the kid based walk can be used on it. */
+	Kid wrapper = { tree, 0 };
+	parsed_downref_kid( root, prg, &wrapper );
+}
+
+void PdaRun::commit()
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "running full commit" << endl;
+	#endif
+
+	/* Walk down from the top of the stack, saving each kid that has not
+	 * been committed yet. Stop at the first committed one. */
+	Tree **sp = root;
+	long pending = 0;
+	for ( Kid *kid = stackTop; kid != 0 && !beenCommitted( kid ); kid = kid->next ) {
+		push( (Tree*)kid );
+		pending += 1;
+	}
+
+	/* Take them back off, deepest first. Each one is committed and then
+	 * has its parsed copies released. */
+	for ( ; pending > 0; pending -= 1 ) {
+		Kid *kid = (Kid*)pop();
+		commitKid( sp, kid );
+		parsed_downref_kid( sp, prg, kid );
+	}
+
+	/* Every push was matched by a pop, so sp must be back at root. */
+	assert( sp == root );
+
+	/* Now clear all the rcode. */
+	rcode_downref_all( root, prg, &allReverseCode );
+}
+
+
+/* Run the parser on one token. A null input means the scanner found no
+ * token and goes straight to error handling. When an error cannot be
+ * recovered by backtracking to a retry, cs is set to -1 and errCount bumped.
+ * shift:         retry goes into lower of shifted node.
+ * reduce:        retry goes into upper of reduced node.
+ * shift-reduce:  cannot be a retry. */
+void PdaRun::parseToken( Kid *input )
+{
+	int pos, targState;
+	unsigned int *action;
+	int rhsLen;
+	Kid *lel;
+	bool induceReject;
+
+	/* The scanner will send a null token if it can't find a token. */
+	if ( input == 0 )
+		goto parseError;
+
+	/* This will cause input to be lost. This path should be traced. */
+	if ( cs < 0 )
+		return;
+
+	input->tree->alg->region = nextRegionInd;
+	input->tree->alg->state = cs;
+	if ( tables->tokenRegions[input->tree->alg->region+1] != 0 )
+		numRetry += 1;
+
+again:
+	if ( input == 0 )
+		goto _out;
+
+	lel = input;
+	if ( lel->tree->id < tables->keys[cs<<1] || lel->tree->id > tables->keys[(cs<<1)+1] )
+		goto parseError;
+
+	pos = tables->indicies[tables->offsets[cs] + (lel->tree->id - tables->keys[cs<<1])];
+	if ( pos < 0 )
+		goto parseError;
+
+	induceReject = false;
+	targState = tables->targs[pos];
+	action = tables->actions + tables->actInds[pos];
+	if ( lel->tree->alg->retry_lower )
+		action += lel->tree->alg->retry_lower;
+
+	if ( *action & act_sb ) {
+		#ifdef COLM_LOG_PARSE
+		cerr << "shifted: " << tables->gbl->lelInfo[lel->tree->id].name;
+		#endif
+		input = input->next;
+		lel->tree->alg->state = cs;
+		lel->next = stackTop;
+		stackTop = lel;
+
+		/* If shifting a termDup then change it to the nonterm. */
+		if ( lel->tree->id < tables->gbl->firstNonTermId &&
+				tables->gbl->lelInfo[lel->tree->id].termDupId > 0 )
+		{
+			lel->tree->id = tables->gbl->lelInfo[lel->tree->id].termDupId;
+			lel->tree->alg->flags |= AF_GENERATED;
+		}
+
+		if ( action[1] == 0 )
+			lel->tree->alg->retry_lower = 0;
+		else {
+			lel->tree->alg->retry_lower += 1;
+			assert( lel->tree->alg->retry_upper == 0 );
+			numRetry += 1; /* FIXME: Has the retry already been counted? */
+			#ifdef COLM_LOG_PARSE
+			cerr << " retry: " << stackTop;
+			#endif
+		}
+		#ifdef COLM_LOG_PARSE
+		cerr << endl;
+		#endif
+	}
+
+	if ( tables->commitLen[pos] != 0 )
+		commit();
+
+	if ( *action & act_rb ) {
+		int objectLength, reduction = *action >> 2;
+		Kid *last, *redLel, *child, *attrs;
+		Alg *redAlg;
+
+		if ( input != 0 )
+			input->tree->alg->causeReduce += 1;
+
+		redLel = prg->kidPool.allocate();
+		redLel->tree = prg->treePool.allocate();
+		redAlg = prg->algPool.allocate();
+
+		redLel->tree->refs = 1;
+		redLel->tree->id = tables->gbl->prodInfo[reduction].lhsId;
+
+		redLel->next = 0;
+		redAlg->causeReduce = 0;
+		redAlg->retry_lower = 0;
+		redAlg->retry_upper = lel->tree->alg->retry_lower;
+		lel->tree->alg->retry_lower = 0;
+
+		/* Allocate the attributes. */
+		objectLength = tables->gbl->lelInfo[redLel->tree->id].objectLength;
+		attrs = alloc_attrs( prg, objectLength );
+
+		/* Build the list of children. */
+		rhsLen = tables->gbl->prodInfo[reduction].length;
+		child = last = 0;
+		for ( int r = 0; r < rhsLen; r++ ) {
+			child = stackTop;
+			stackTop = stackTop->next;
+			child->next = last;
+			last = child;
+		}
+
+		redLel->tree->child = kid_list_concat( attrs, child );
+
+		#ifdef COLM_LOG_PARSE
+		cerr << "reduced: "
+				<< tables->gbl->prodInfo[reduction].name
+				<< " rhsLen: " << rhsLen;
+		#endif
+		if ( action[1] == 0 )
+			redAlg->retry_upper = 0;
+		else {
+			redAlg->retry_upper += 1;
+			assert( lel->tree->alg->retry_lower == 0 );
+			numRetry += 1;
+			#ifdef COLM_LOG_PARSE
+			cerr << " retry: " << redLel;
+			#endif
+		}
+
+		#ifdef COLM_LOG_PARSE
+		cerr << endl;
+		#endif
+
+		/* When the production is of zero length we stay in the same state.
+		 * Otherwise we use the state stored in the first child. */
+		targState = rhsLen == 0 ? cs : child->tree->alg->state;
+
+		assert( redLel->tree->refs == 1 );
+
+		if ( prg->ctxDepParsing && tables->gbl->prodInfo[reduction].frameId >= 0 ) {
+			/* Frame info for reduction. */
+			FrameInfo *fi = &tables->gbl->frameInfo[tables->gbl->prodInfo[reduction].frameId];
+
+			/* Execution environment for the reduction code. */
+			Execution execution( prg, reverseCode, 
+					this, fi->code, redLel->tree, 0 );
+
+			/* Take a copy of the lhs and store it in alg. May need it during
+			 * reverse parsing. */
+			redAlg->parsed = redLel->tree;
+			tree_upref( redAlg->parsed );
+
+			/* Execute it. */
+			execution.execute( root );
+
+			/* Pull out the reverse code, if any. */
+			bool hasrcode = makeReverseCode( allReverseCode, reverseCode );
+			if ( hasrcode )
+				redAlg->flags |= AF_HAS_RCODE;
+
+			/* Transfer the lhs from the environment to redLel. It is uprefed
+			 * while in the environment. */
+			redLel->tree = execution.lhs;
+
+			/* Perhaps the execution environment is telling us we need to
+			 * reject the reduction. */
+			induceReject = execution.reject;
+		}
+
+		/* Save the algorithm data in the reduced tree. */
+		redLel->tree->alg = redAlg;
+
+		if ( induceReject ) {
+			#ifdef COLM_LOG_PARSE
+			cerr << "error induced during reduction of " <<
+					tables->gbl->lelInfo[redLel->tree->id].name << endl;
+			#endif
+			redLel->tree->alg->state = cs;
+			redLel->next = stackTop;
+			stackTop = redLel;
+			cs = targState;
+			goto parseError;
+		}
+		else {
+			redLel->next = input;
+			input = redLel;
+		}
+	}
+
+
+	cs = targState;
+	goto again;
+
+parseError:
+	#ifdef COLM_LOG_PARSE
+	cerr << "hit error, backtracking" << endl;
+	#endif
+
+	if ( numRetry == 0 )
+		goto fail;
+
+	while ( 1 ) {
+		if ( input != 0 ) {
+			assert( input->tree->alg->retry_upper == 0 );
+
+			if ( input->tree->alg->retry_lower != 0 ) {
+				#ifdef COLM_LOG_PARSE
+				cerr << "found retry targ: " << input << endl;
+				#endif
+				numRetry -= 1;
+				#ifdef COLM_LOG_PARSE
+				cerr << "found retry: " << input << endl;
+				#endif
+
+				cs = input->tree->alg->state;
+				goto again;
+			}
+
+			/* If there is no retry and there are no reductions caused by the
+			 * current input token then we are finished with it. Send it back. */
+			if ( input->tree->alg->causeReduce == 0 ) {
+				int next = input->tree->alg->region + 1;
+
+				fsmRun->queueBack( input );
+				input = 0;
+				if ( tables->tokenRegions[next] != 0 ) {
+					#ifdef COLM_LOG_PARSE
+					cerr << "found a new region" << endl;
+					#endif
+					numRetry -= 1;
+					cs = stackTopTarget();
+					nextRegionInd = next;
+					return;
+				}
+			}
+		}
+
+		/* Now it is time to undo something. Pick an element from the top of
+		 * the stack. */
+		Kid *undoLel = stackTop;
+
+		/* Check if we've arrived at the stack sentinel. This guard is
+		 * here to allow us to initially set numRetry to one to cause the
+		 * parser to backup all the way to the beginning when an error
+		 * occurs. */
+		if ( undoLel->next == 0 )
+			break;
+
+		/* Either we are dealing with a terminal that was
+		 * shifted or a nonterminal that was reduced. */
+		if ( stackTop->tree->id < tables->gbl->firstNonTermId || 
+				(stackTop->tree->alg->flags & AF_GENERATED) )
+		{
+			#ifdef COLM_LOG_PARSE
+			cerr << "backing up over effective terminal: " <<
+					tables->gbl->lelInfo[stackTop->tree->id].name << endl;
+			#endif
+
+			/* Pop the item from the stack. */
+			stackTop = stackTop->next;
+
+			/* Undo the translation from termDup. */
+			if ( undoLel->tree->alg->flags & AF_GENERATED ) {
+				undoLel->tree->id = tables->gbl->lelInfo[undoLel->tree->id].termDupId;
+				undoLel->tree->alg->flags &= ~AF_GENERATED;
+			}
+
+			/* Queue it as next input item. */
+			undoLel->next = input;
+			input = undoLel;
+		}
+		else {
+			#ifdef COLM_LOG_PARSE
+			cerr << "backing up over non-terminal: " <<
+					tables->gbl->lelInfo[stackTop->tree->id].name << endl;
+			#endif
+
+			/* Take the alg out of undoLel. */
+			Alg *alg = undoLel->tree->alg;
+			assert( alg != 0 );
+			undoLel->tree->alg = 0;
+
+			/* Check for an execution environment. */
+			if ( alg->flags & AF_HAS_RCODE ) {
+				Execution execution( prg, reverseCode, this, 0, 0, 0 );
+
+				/* Do the reverse execution. */
+				execution.rexecute( root, 0, allReverseCode );
+				alg->flags &= ~AF_HAS_RCODE;
+			}
+
+			if ( alg->parsed != 0 ) {
+				/* Get the lhs, it may have been reverted. */
+				tree_downref( prg, undoLel->tree );
+				undoLel->tree = alg->parsed;
+			}
+
+			/* Warm fuzzies ... */
+			assert( undoLel == stackTop );
+
+			/* Take the nonterm off the stack. */
+			stackTop = stackTop->next;
+
+			/* Extract the real children from the child list. */
+			Kid *first = tree_extract_child( prg, undoLel->tree );
+
+			/* Walk the child list and push the items onto the parsing
+			 * stack one at a time. */
+			while ( first != 0 ) {
+				/* Get the next item ahead of time. */
+				Kid *next = first->next;
+
+				/* Push onto the stack. */
+				first->next = stackTop;
+				stackTop = first;
+
+				first = next;
+			}
+
+			/* If there is an input queued, this is one less reduction it has
+			 * caused. */
+			if ( input != 0 )
+				input->tree->alg->causeReduce -= 1;
+
+			if ( alg->retry_upper != 0 ) {
+				/* There is always an input item here because reduce
+				 * conflicts only happen on a lookahead character. */
+				assert( input != undoLel );
+				assert( input != 0 );
+				assert( alg->retry_lower == 0 );
+				assert( input->tree->alg->retry_upper == 0 );
+
+				/* Transfer the retry from undoLel to input. */
+				input->tree->alg->retry_lower = alg->retry_upper;
+				input->tree->alg->retry_upper = 0;
+				input->tree->alg->state = stackTopTarget();
+			}
+
+			/* Free the reduced item. */
+			tree_downref( prg, undoLel->tree );
+			prg->kidPool.free( undoLel );
+			prg->algPool.free( alg );
+		}
+	}
+
+fail:
+	cs = -1;
+	errCount += 1;
+_out:
+	if ( cs >= 0 ) /* After a fail cs is -1 and must not be used as an index. */
+		nextRegionInd = tables->tokenRegionInds[cs];
+}
+
+ostream &PdaRun::parse_error( int tokId, Tree *tree )
+{
+	/* Write an "error: at token ..." prefix to cerr and return the stream
+	 * so the caller can append the message text. */
+	// FIXME: no error count is maintained here yet (was gblErrorCount += 1).
+
+	//cerr << token.loc.fileName << ":" << token.loc.line << ":" << token.loc.col << ": ";
+	cerr << "error: at token ";
+	if ( tokId < 128 ) /* Ids below 128 get their name printed in quotes. */
+		cerr << "\"" << tables->gbl->lelInfo[tokId].name << "\"";
+	else 
+		cerr << tables->gbl->lelInfo[tokId].name;
+	if ( string_length( tree->tokdata ) > 0 ) { /* Only when there is text. */
+		cerr << " with data \"";
+		cerr.write( string_data( tree->tokdata ), 
+				string_length( tree->tokdata ) );
+		cerr << "\"";
+	}
+	cerr << ": ";
+	
+	return cerr;
+}
diff --git a/colm/pdarun.h b/colm/pdarun.h
new file mode 100644
index 00000000..7f633abe
--- /dev/null
+++ b/colm/pdarun.h
@@ -0,0 +1,511 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _PDARUN_H
+#define _PDARUN_H
+
+#include <iostream>
+#include "dlistval.h"
+#include "bytecode.h"
+#include "vector.h"
+#include "dlist.h"
+
+using std::ostream;
+
+struct Tree;
+struct ParseData;
+struct FsmRun;
+struct KlangEl;
+struct PdaTables;
+struct FsmTables;
+
+struct Alg
+{
+	/* Parsing algorithm. */
+	Tree *parsed;
+	long state;
+	long region;
+	char causeReduce;
+	char retry_lower;
+	char retry_upper;
+	char flags;
+};
+
+struct Kid
+{
+	/* The tree needs to be first since pointers to kids are used to reference
+	 * trees on the stack. A pointer to the word that is a Tree* is cast to
+	 * a Kid*. */
+	Tree *tree;
+	Kid *next;
+};
+
+struct Tree
+{
+	/* First three must be overlaid: structs marked "Must overlay over Tree" repeat them. */
+	long id;
+	long refs;
+	Kid *child;
+	/* tokdata is what PdaRun::parse_error() prints as the token's data. */
+	Head *tokdata;
+	Alg *alg;
+};
+
+struct Ref
+{
+	Kid *kid;
+	Ref *next;
+};
+
+struct Int
+{
+	/* Must overlay over Tree. */
+	long id;
+	long refs;
+	Kid *child;
+
+	long value;
+};
+
+struct Pointer
+{
+	/* Must overlay over Tree. */
+	long id;
+	long refs;
+	Kid *child;
+
+	Kid *value;
+};
+
+struct Str
+{
+	/* Must overlay over Tree. */
+	long id;
+	long refs;
+	Kid *child;
+
+	Head *value;
+};
+
+struct TreeIter
+{
+	TreeIter( const Ref &rootRef, int searchId, Tree **stackRoot ) : 
+		rootRef(rootRef), searchId(searchId), 
+		stackRoot(stackRoot), stackSize(0)
+	{
+		ref.kid = 0;
+		ref.next = 0;
+	}
+	/* rootRef is copied from the caller; ref starts out with null kid and next. */
+	Ref rootRef;
+	Ref ref;
+	long searchId;
+	Tree **stackRoot;
+	long stackSize;
+};
+
+struct FunctionInfo
+{
+	const char *name;
+	long frameId;
+	long argSize;
+	long ntrees;
+	long frameSize;
+};
+
+struct UserIter
+{
+	UserIter( Tree **stackRoot, long argSize, long searchId ) : 
+		stackRoot(stackRoot), 
+		argSize(argSize), stackSize(0),
+		resume(0), frame(0), searchId(searchId)
+	{
+		ref.kid = 0;
+		ref.next = 0;
+	}
+	/* stackSize, resume and frame start at zero; ref starts out null. */
+	/* The current item. */
+	Ref ref;
+	Tree **stackRoot;
+	long argSize;
+	long stackSize;
+	Code *resume;
+	Tree **frame;
+	long searchId;
+};
+
+struct ListEl
+{
+	/* Must overlay over kid: value and next line up with Kid's tree and next. */
+	Tree *value;
+	ListEl *next;
+	ListEl *prev;
+	/* Neither constructor sets next or prev; the default one sets nothing. */
+	ListEl() { }
+	ListEl( Tree *value )
+		: value(value) { }
+};
+
+struct List
+{
+	/* Must overlay over tree. */
+	long id;
+	long refs;
+	ListEl *head;
+
+	ListEl *tail;
+	long listLen;
+	GenericInfo *genericInfo;
+
+	void prepend(ListEl *new_el) { addBefore(head, new_el); }
+	void append(ListEl *new_el)  { addAfter(tail, new_el); }
+
+	void addAfter( ListEl *prev_el, ListEl *new_el );
+	void addBefore( ListEl *next_el, ListEl *new_el );
+
+	ListEl *detachFirst()        { return detach(head); }
+	ListEl *detachLast()         { return detach(tail); }
+	ListEl *detach(ListEl *el);
+
+	long length() const 
+		{ return listLen; }
+};
+
+struct MapEl
+{
+	Tree *tree;
+	MapEl *next;
+	MapEl *prev;
+
+	MapEl *left, *right, *parent;
+	long height;
+	Tree *key;
+
+	Tree *getKey() const 
+		{ return key; }
+};
+
+struct Map
+{
+	/* Must overlay over Tree: head sits where Tree keeps its child pointer. */
+	long id;
+	long refs;
+	MapEl *head;
+
+	MapEl *tail;
+	MapEl *root;
+	long treeSize;
+	GenericInfo *genericInfo;
+
+	/* List functions. */
+	MapEl *listDetach( MapEl *el );
+	void listAddBefore( MapEl *next_el, MapEl *new_el );
+	void listAddAfter( MapEl *prev_el, MapEl *new_el );
+	void listAbandon();
+
+	int compare( const Tree *w1, const Tree *w2 ) const
+		{ return cmp_tree( w1, w2 ); }
+
+	/* Insert an element into the tree. */
+	MapEl *insert( MapEl *element, MapEl **lastFound = 0 );
+
+	MapEl *insert( Program *p, Tree *key, MapEl **lastFound = 0 );
+
+	/* Find an element in the tree. Returns the element if 
+	 * key exists, null (0) otherwise. */
+	MapEl *find( Tree *key ) const;
+
+	/* Detach an element from the tree. */
+	MapEl *detach( Tree *key );
+
+	/* Detach and delete an element from the tree. */
+	bool remove( Tree *key );
+
+	/* Detach an element from the tree. */
+	MapEl *detach( MapEl *element );
+
+	/* Detach and delete an element from the tree. */
+	void remove( MapEl *element );
+
+	/* Free all memory used by tree. */
+	void empty();
+
+	/** \brief Return the number of elements in the tree. */
+	long length() const { return treeSize; }
+
+	/* Recursive worker for the copy constructor. */
+	MapEl *copyBranch( Program *p, MapEl *element, Kid *oldNextDown, Kid *&newNextDown );
+
+	/* Recursively delete elements in the tree. */
+	void deleteChildrenOf(MapEl *n);
+
+	/* Rebalance the tree beginning at the leaf whose 
+	 * grandparent is unbalanced. */
+	MapEl *rebalance(MapEl *start);
+
+	/* Move up the tree from a given element, recalculating the heights. */
+	void recalcHeights(MapEl *start);
+
+	/* Move up the tree and find the first element whose 
+	 * grand-parent is unbalanced. */
+	MapEl *findFirstUnbalGP(MapEl *start);
+
+	/* Move up the tree and find the first element which is unbalanced. */
+	MapEl *findFirstUnbalEl(MapEl *start);
+
+	/* Replace an element in the tree with another element not in the tree. */
+	void replaceEl(MapEl *element, MapEl *replacement);
+
+	/* Remove an element from the tree and put another (normally a child of element)
+	 * in its place. */
+	void removeEl(MapEl *element, MapEl *filler);
+
+	/* Once an insertion point is found at a leaf then do the insert. */
+	void attachRebal( MapEl *element, MapEl *parentEl, MapEl *lastLess );
+};
+
+struct InputStream;
+
+struct Stream
+{
+	/* Must overlay over Tree. */
+	long id;
+	long refs;
+	Kid *child;
+
+	FILE *file;
+	InputStream *in;
+	FsmRun *scanner;
+};
+
+struct PatReplInfo
+{
+	long offset;
+	long numBindings;
+};
+
+struct PatReplNode
+{
+	long id;
+	long next;
+	long child;
+	long bindId;
+	const char *data;
+	long length;
+	long ignore;
+
+	/* Just match nonterminal, don't go inside. */
+	bool stop;
+};
+
+struct LangElInfo
+{
+	const char *name;
+	bool repeat;
+	bool literal;
+	bool ignore;
+
+	long frameId;
+
+	long objectTypeId;
+	long ofiOffset;
+	long objectLength;
+
+	long termDupId;
+	long genericId;
+};
+
+struct ObjFieldInfo
+{
+	int typeId;
+};
+
+struct ProdInfo
+{
+	long length;
+	unsigned long lhsId;
+	const char *name;
+	long frameId;
+	bool lhsUpref;
+};
+
+struct FrameInfo
+{
+	Code *code;
+	long codeLen;
+	char *trees;
+	long treesLen;
+};
+
+struct RegionInfo
+{
+	const char *name;
+	long defaultToken;
+	long eofFrameId;
+};
+
+struct RuntimeData
+{
+	LangElInfo *lelInfo;
+	long numLangEls;
+
+	ProdInfo *prodInfo;
+	long numProds;
+
+	RegionInfo *regionInfo;
+	long numRegions;
+
+	Code *rootCode;
+	long rootCodeLen;
+
+	FrameInfo *frameInfo;
+	long numFrames;
+
+	FunctionInfo *functionInfo;
+	long numFunctions;
+
+	PatReplInfo *patReplInfo;
+	long numPatterns;
+
+	PatReplNode *patReplNodes;
+	long numPatternNodes;
+
+	GenericInfo *genericInfo;
+	long numGenerics;
+
+	const char **litdata;
+	long *litlen;
+	Head **literals;
+	long numLiterals;
+
+	FsmTables *fsmTables;
+	PdaTables **parsers;
+	long numParsers;
+
+	long globalSize;
+
+	long firstNonTermId;
+
+	long integerId;
+	long stringId;
+	long anyId;
+	long eofId;
+};
+
+struct PdaTables
+{
+	/* Parser table data. */
+	unsigned int startState;
+	int *indicies;
+	int *keys;
+	unsigned int *offsets;
+	unsigned int *targs;
+	unsigned int *actInds;
+	unsigned int *actions;
+	int *commitLen;
+	int *tokenRegionInds;	/* indexed by parser state; the result is stored in PdaRun::nextRegionInd */
+	int *tokenRegions;	/* read at nextRegionInd (+ offset) by PdaRun::getNextRegion() */
+	/* Presumably the element counts of the arrays above -- TODO confirm. */
+	int numIndicies;
+	int numKeys;
+	int numStates;
+	int numTargs;
+	int numActInds;
+	int numActions;
+	int numCommitLen;
+	int numRegionItems;
+
+	RuntimeData *gbl;	/* runtime data; PdaRun::parse_error() reads lelInfo names from it */
+};
+
+bool makeReverseCode( CodeVect &all, CodeVect &reverseCode );
+
+typedef Vector<Tree*> Bindings;
+
+struct PdaRun
+{
+	/* Gives every scalar and pointer member a defined starting value, so
+	 * none of them is ever read while indeterminate. */
+	PdaRun( Tree **root, Program *prg, PdaTables *tables, 
+			FsmRun *scanner, long stopTarget )
+	:
+		root(root),
+		numRetry(0), stackTop(0), errCount(0), cs(0), nextRegionInd(0),
+		prg(prg),
+		tables(tables), fsmRun(scanner),
+		stopParsing(false), stopTarget(stopTarget),
+		accumIgnore(0),
+		queue(0), queueLast(0)
+	{ }
+
+	Tree **root;
+	int numRetry;
+	Kid *stackTop;
+	int errCount;
+	int cs;
+	int nextRegionInd;
+
+	/* Offset can be used to look at the next nextRegionInd. */
+	int getNextRegion( int offset = 0 )
+		{ return tables->tokenRegions[nextRegionInd+offset]; }
+
+	Tree *getParsedRoot( bool stop );
+	void clean();
+
+	Program *prg;
+	PdaTables *tables;
+
+	FsmRun *fsmRun;
+
+	long stackTopTarget();
+	void init();
+	void commitKid( Tree **root, Kid *lel );
+	void commit();
+	void parseToken( Kid *input );
+	bool isParserStopFinished();
+	void match( Kid *tree, Kid *pattern );
+	long run();
+	long undoParse( Tree *tree, CodeVect *rev );
+
+	void send( Kid *kid );
+	void ignore( Tree *tree );
+	void sendBackIgnore();
+	Kid *extractIgnore();
+
+	/* Report an error encountered by the parser. */
+	ostream &parse_error( int tokId, Tree *tree );
+
+	/* Reused. */
+	CodeVect reverseCode;
+	CodeVect allReverseCode;
+
+	bool stopParsing;
+	long stopTarget;
+
+	Kid *accumIgnore;
+	Kid *queue, *queueLast;
+
+	Bindings bindings;
+};
+
+void xml_print_list( RuntimeData *runtimeData, Kid *lel, int depth );
+
+#endif /* _PDARUN_H */
diff --git a/colm/redbuild.cpp b/colm/redbuild.cpp
new file mode 100644
index 00000000..feec178f
--- /dev/null
+++ b/colm/redbuild.cpp
@@ -0,0 +1,645 @@
+/*
+ *  Copyright 2005-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+
+#include "colm.h"
+#include "redbuild.h"
+#include "fsmgraph.h"
+#include "redfsm.h"
+#include "fsmcodegen.h"
+#include <string.h>
+
+using namespace std;
+
+/* Record the inputs and give all build state a defined starting value. */
+RedFsmBuild::RedFsmBuild( char *fsmName, ParseData *pd, FsmGraph *fsm )
+:
+	fsmName(fsmName), pd(pd), fsm(fsm),
+	nextActionTableId(0), startState(-1), errState(-1),
+	/* redFsm stays null until reduceMachine() allocates it. */
+	redFsm(0),
+	curAction(0), curActionTable(0), curTrans(0),
+	curState(0), curCondSpace(0), curStateCond(0)
+{ }
+
+void RedFsmBuild::initActionList( unsigned long length )
+{
+	GenAction *slot = redFsm->allActions = new GenAction[length];	/* one per action */
+	for ( GenAction *end = slot + length; slot != end; slot++ )
+		redFsm->actionList.append( slot );	/* list order == array order */
+}
+
+
+void RedFsmBuild::makeActionList()
+{
+	/* First pass: hand out consecutive ids, but only to actions that have a
+	 * nonzero numRefs() or numCondRefs. */
+	int numUsed = 0;
+	for ( ActionList::Iter a = pd->actionList; a.lte(); a++ ) {
+		if ( a->numRefs() > 0 || a->numCondRefs > 0 )
+			a->actionId = numUsed++;
+	}
+	initActionList( numUsed );
+
+	/* Second pass: emit every action whose id is non-negative. */
+	curAction = 0;
+	for ( ActionList::Iter a = pd->actionList; a.lte(); a++ )
+		if ( a->actionId >= 0 )
+			makeAction( a );
+}
+
+void RedFsmBuild::initActionTableList( unsigned long length )
+{ 
+	redFsm->allActionTables = new RedAction[length];	/* entries are filled in by makeActionTableList() */
+}
+
+void RedFsmBuild::initStateList( unsigned long length )
+{
+	RedState *states = redFsm->allStates = new RedState[length];
+	for ( unsigned long s = 0; s < length; s++ )
+		redFsm->stateList.append( states + s );
+
+	/* startState/errState arrive as offsets into the state array; turn them
+	 * into pointers now that the array exists. A start state is mandatory. */
+	assert( startState >= 0 );
+	redFsm->startState = states + startState;
+	if ( errState >= 0 )
+		redFsm->errState = states + errState;
+	for ( EntryIdVect::Iter en = redFsm->entryPointIds; en.lte(); en++ )
+		redFsm->entryPoints.insert( states + *en );
+
+	/* State ids now come from the frontend, but the generation code still
+	 * reads nextStateId, so keep it equal to the list length. */
+	redFsm->nextStateId = redFsm->stateList.length();
+}
+
+void RedFsmBuild::addEntryPoint( int entryId, char *name, unsigned long entryState )
+{
+	redFsm->entryPointIds.append( entryState );	/* state offset; initStateList() turns it into a pointer */
+	redFsm->entryPointNames.append( name );
+	redFsm->redEntryMap.insert( entryId, entryState );	/* entry id -> state offset */
+}
+
+void RedFsmBuild::addRegionToEntry( int regionId, int entryId )
+{
+	assert( regionId == redFsm->regionToEntry.length() );	/* the vector index must equal the region id */
+	redFsm->regionToEntry.append( entryId );
+}
+
+void RedFsmBuild::initTransList( int snum, unsigned long length )
+{
+	/* Intentionally empty: the out range could be preallocated here to save
+	 * time growing it, but for now both arguments are ignored. */
+}
+
+/* Append the transition lowKey..highKey of state snum to its out range.
+ *
+ * targ and action are offsets into allStates and allActionTables; a negative
+ * value means there is none. Nothing is ever added to the error state.
+ *
+ * When the machine is to be complete, a missing target becomes the error
+ * state and any keys left uncovered below lowKey are first filled with the
+ * error transition. Only the last range is consulted for that, so ranges
+ * presumably arrive in ascending key order. tnum is not used. */
+void RedFsmBuild::newTrans( int snum, int tnum, Key lowKey, 
+		Key highKey, long targ, long action )
+{
+	/* Get the current state and range. The local curState (a pointer)
+	 * shadows the member of the same name inside this function. */
+	RedState *curState = redFsm->allStates + snum;
+	RedTransList &destRange = curState->outRange;
+
+	/* The error state never receives transitions. */
+	if ( curState == redFsm->errState )
+		return;
+
+	/* Make the new transition. */
+	RedState *targState = targ >= 0 ? (redFsm->allStates + targ) : 
+			redFsm->wantComplete ? redFsm->getErrorState() : 0;
+	RedAction *actionTable = action >= 0 ? (redFsm->allActionTables + action) : 0;
+	RedTrans *trans = redFsm->allocateTrans( targState, actionTable );
+	RedTransEl transEl( lowKey, highKey, trans );
+
+	if ( redFsm->wantComplete ) {
+		/* Uncovered keys would begin at the bottom of the alphabet for an
+		 * empty range list, otherwise just past the last range. */
+		Key fillLowKey = keyOps->minKey;
+		if ( destRange.length() > 0 ) {
+			fillLowKey = destRange[destRange.length()-1].highKey;
+			fillLowKey.increment();
+		}
+
+		if ( fillLowKey < lowKey ) {
+			/* There is a gap to fill. Make the high key. */
+			Key fillHighKey = lowKey;
+			fillHighKey.decrement();
+
+			/* Create the filler with the error transition. */
+			RedTransEl newTel( fillLowKey, fillHighKey, redFsm->getErrorTrans() );
+			destRange.append( newTel );
+		}
+	}
+
+	/* Filler taken care of. Append the range built above instead of
+	 * constructing a second, identical element. */
+	destRange.append( transEl );
+}
+
+void RedFsmBuild::finishTransList( int snum )
+{
+	/* Close the out range of state snum: when a complete machine is
+	 * wanted, any keys above the last range are pointed at the error
+	 * transition. */
+
+	RedState *curState = redFsm->allStates + snum;
+	RedTransList &destRange = curState->outRange;
+
+	/* The error state gets no filler, and neither does a machine that is
+	 * not required to be complete. */
+	if ( curState == redFsm->errState || !redFsm->wantComplete )
+		return;
+
+	/* Decide where the closing filler has to start. With no ranges at all
+	 * it covers the whole alphabet. */
+	Key fillLowKey = keyOps->minKey;
+	if ( destRange.length() > 0 ) {
+		/* Otherwise look at the last range: if it already reaches the
+		 * maximum key there is nothing left to fill. */
+		RedTransEl *last = &destRange[destRange.length()-1];
+		if ( !( last->highKey < keyOps->maxKey ) )
+			return;
+
+		/* The gap begins one key above the last range. */
+		fillLowKey = last->highKey;
+		fillLowKey.increment();
+	}
+
+	/* Create the new range with the error trans and append it. */
+	RedTransEl newTel( fillLowKey, keyOps->maxKey, redFsm->getErrorTrans() );
+	destRange.append( newTel );
+}
+
+void RedFsmBuild::setId( int snum, int id )
+{
+	/* Store id on the state at offset snum in allStates. */
+	redFsm->allStates[snum].id = id;
+}
+
+void RedFsmBuild::setEofTrans( int snum, int eofTarget, int actId )
+{
+	/* eofTarget and actId are offsets into allStates and allActionTables. */
+	RedState *target = redFsm->allStates + eofTarget;
+	RedAction *action = redFsm->allActionTables + actId;
+	redFsm->allStates[snum].eofTrans = redFsm->allocateTrans( target, action );
+}
+
+void RedFsmBuild::setFinal( int snum )
+{
+	/* Flag the state at offset snum in allStates as final. */
+	redFsm->allStates[snum].isFinal = true;
+}
+
+
+void RedFsmBuild::setStateActions( int snum, long toStateAction, 
+			long fromStateAction, long eofAction )
+{
+	RedState &state = redFsm->allStates[snum];	/* negative offsets below are skipped */
+	if ( toStateAction >= 0 )
+		state.toStateAction = redFsm->allActionTables + toStateAction;
+	if ( fromStateAction >= 0 )
+		state.fromStateAction = redFsm->allActionTables + fromStateAction;
+	if ( eofAction >= 0 )
+		state.eofAction = redFsm->allActionTables + eofAction;
+}
+
+void RedFsmBuild::closeMachine()
+{
+	//for ( GenActionList::Iter a = redFsm->actionList; a.lte(); a++ )
+	//	resolveTargetStates( a->inlineList );
+	/* NOTE(review): nothing in redbuild.cpp calls closeMachine() -- confirm it is still used. */
+	/* Note that even if we want a complete graph we do not give the error
+	 * state a default transition. All machines break out of the processing
+	 * loop when in the error state. */
+	/* Copy each state's condition list into its condition vector. */
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		for ( GenStateCondList::Iter sci = st->stateCondList; sci.lte(); sci++ )
+			st->stateCondVect.append( sci );
+	}
+}
+
+void RedFsmBuild::initCondSpaceList( ulong length )
+{
+	GenCondSpace *slot = redFsm->allCondSpaces = new GenCondSpace[length];	/* one per space */
+	for ( GenCondSpace *end = slot + length; slot != end; slot++ )
+		redFsm->condSpaceList.append( slot );	/* list order == array order */
+}
+
+void RedFsmBuild::newCondSpace( int cnum, int condSpaceId, Key baseKey )
+{
+	GenCondSpace &space = redFsm->allCondSpaces[cnum];	/* slot being filled in */
+	space.condSpaceId = condSpaceId;
+	space.baseKey = baseKey;
+}
+
+void RedFsmBuild::condSpaceItem( int cnum, long condActionId )
+{
+	/* condActionId is an offset into allActions. */
+	redFsm->allCondSpaces[cnum].condSet.append( redFsm->allActions + condActionId );
+}
+
+void RedFsmBuild::initStateCondList( int snum, ulong length )
+{
+	/* Intentionally empty; could preallocate these, as we could with transitions. */
+}
+
+void RedFsmBuild::addStateCond( int snum, Key lowKey, Key highKey, long condNum )
+{
+	/* Create the new state condition for the key range. */
+	GenStateCond *cond = new GenStateCond;
+	cond->lowKey = lowKey;
+	cond->highKey = highKey;
+
+	/* Assign it a cond space; condNum is an offset into allCondSpaces. */
+	cond->condSpace = redFsm->allCondSpaces + condNum;
+
+	/* Hand it to the state at offset snum. The element is heap allocated
+	 * here and not freed in this function. */
+	RedState &state = redFsm->allStates[snum];
+	state.stateCondList.append( cond );
+}
+
+
+void RedFsmBuild::setForcedErrorState()
+{
+	redFsm->forcedErrorState = true;	/* makeEntryPoints() calls this when fsm->lmRequiresErrorState is set */
+}
+
+Key RedFsmBuild::findMaxKey()
+{
+	/* Begin at the alphabet maximum; only a higher range end can raise it. */
+	Key best = keyOps->maxKey;
+	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
+		/* All transitions are expected to still be in the range list. */
+		assert( st->outSingle.length() == 0 );
+		assert( st->defTrans == 0 );
+		if ( st->outRange.length() <= 0 )
+			continue;
+		Key top = st->outRange[st->outRange.length()-1].highKey;
+		if ( top > best )
+			best = top;
+	}
+	return best;
+}
+
+
+void RedFsmBuild::makeActionTableList()
+{
+	/* Must first order the action tables based on their id. */
+	int numTables = nextActionTableId;
+	RedActionTable **byId = new RedActionTable*[numTables];
+	for ( ActionTableMap::Iter at = actionTableMap; at.lte(); at++ )
+		byId[at->id] = at;
+
+	initActionTableList( numTables );
+
+	/* curActionTable doubles as the table id and the slot in
+	 * allActionTables while walking the tables in id order. */
+	for ( curActionTable = 0; curActionTable < numTables; curActionTable++ ) {
+		ActionTable &src = byId[curActionTable]->key;
+
+		/* Collect the action table. */
+		RedAction *redAct = redFsm->allActionTables + curActionTable;
+		redAct->actListId = curActionTable;
+		redAct->key.setAsNew( src.length() );
+
+		/* Every element gets key 0 and a pointer to the reduced action
+		 * found at the original action's actionId in allActions. */
+		int pos = 0;
+		for ( ActionTable::Iter atel = src; atel.lte(); atel++ ) {
+			redAct->key[pos].key = 0;
+			redAct->key[pos].value = redFsm->allActions + atel->value->actionId;
+			pos += 1;
+		}
+
+		/* Insert into the action table map. */
+		redFsm->actionMap.insert( redAct );
+	}
+
+	/* The id-ordered index was only needed while building. */
+	delete[] byId;
+}
+
+void RedFsmBuild::reduceActionTables()
+{
+	/* Reduce the action tables to a set. Each non-empty table is offered to
+	 * actionTableMap; whenever insert() hands back an element, that element
+	 * receives the next free table id. Empty tables are never inserted. */
+	for ( StateList::Iter st = fsm->stateList; st.lte(); st++ ) {
+		/* Receives the map element through insert()'s second argument. */
+		RedActionTable *inserted = 0;
+
+		/* Reduce To State Actions. */
+		if ( st->toStateActionTable.length() > 0 &&
+				actionTableMap.insert( st->toStateActionTable, &inserted ) )
+			inserted->id = nextActionTableId++;
+
+		/* Reduce From State Actions. */
+		if ( st->fromStateActionTable.length() > 0 &&
+				actionTableMap.insert( st->fromStateActionTable, &inserted ) )
+			inserted->id = nextActionTableId++;
+
+		/* Reduce EOF actions. */
+		if ( st->eofActionTable.length() > 0 &&
+				actionTableMap.insert( st->eofActionTable, &inserted ) )
+			inserted->id = nextActionTableId++;
+
+		/* Loop the transitions and reduce their actions. */
+		for ( TransList::Iter trans = st->outList; trans.lte(); trans++ ) {
+			if ( trans->actionTable.length() > 0 &&
+					actionTableMap.insert( trans->actionTable, &inserted ) )
+				inserted->id = nextActionTableId++;
+		}
+	}
+}
+
+
+void RedFsmBuild::appendTrans( TransListVect &outList, Key lowKey, 
+		Key highKey, FsmTrans *trans )
+{
+	if ( trans->toState != 0 || trans->actionTable.length() > 0 )	/* keep only if it has a target or actions */
+		outList.append( TransEl( lowKey, highKey, trans ) );
+}
+
+void RedFsmBuild::makeTrans( Key lowKey, Key highKey, FsmTrans *trans )
+{
+	/* Negative targ/action tell newTrans() there is no target/action. */
+	long targ = trans->toState != 0 ? trans->toState->alg.stateNum : -1;
+	long action = -1;
+	if ( trans->actionTable.length() > 0 ) {
+		RedActionTable *actionTable = actionTableMap.find( trans->actionTable );
+		if ( actionTable != 0 )
+			action = actionTable->id;
+	}
+	newTrans( curState, curTrans++, lowKey, highKey, targ, action );
+}
+
+void RedFsmBuild::makeTransList( FsmState *state )
+{
+	/* Collect the source ranges worth keeping. appendTrans() drops those
+	 * that have neither a target state nor any actions. An empty out list
+	 * needs no special case: the loop just never runs. */
+	TransListVect kept;
+	for ( TransList::Iter trans = state->outList; trans.lte(); trans++ )
+		appendTrans( kept, trans->lowKey, trans->highKey, trans );
+
+	/* Announce how many transitions follow and restart the counter that
+	 * makeTrans() passes on as the transition number. */
+	initTransList( curState, kept.length() );
+	curTrans = 0;
+
+	/* Emit the kept ranges in order. */
+	for ( TransListVect::Iter tvi = kept; tvi.lte(); tvi++ )
+		makeTrans( tvi->lowKey, tvi->highKey, tvi->value );
+
+	/* Let finishTransList() add whatever closing filler is needed. */
+	finishTransList( curState );
+}
+
+void RedFsmBuild::newAction( int anum, char *name, int line, int col, Action *action )
+{
+	GenAction &gen = redFsm->allActions[anum];	/* slot being filled in */
+	gen.actionId = anum;
+	gen.name = name;
+	gen.loc.line = line; gen.loc.col = col;
+	gen.inlineList = action->inlineList;
+	gen.objField = action->objField;
+	gen.markType = action->markType;
+}
+
+void RedFsmBuild::makeAction( Action *action )
+{
+	/* Forward the action to newAction() together with its source position
+	 * and its name, which is passed on as null when the action has none.
+	 * The slot at curAction is used and curAction advances by one. */
+	int line = action->loc.line;
+	int col = action->loc.col;
+	char *name = action->name;
+
+	newAction( curAction++, name, line, col, action );
+}
+
+void xmlEscapeHost( std::ostream &out, char *data, int len )
+{
+	/* Write len bytes to out with <, > and & replaced by XML entities. */
+	for ( int i = 0; i != len; i++ ) {
+		const char c = data[i];
+		switch ( c ) {
+		case '&': out << "&amp;"; break;
+		case '<': out << "&lt;"; break;
+		case '>': out << "&gt;"; break;
+		default: out << c; break;
+		}
+	}
+}
+
+void RedFsmBuild::makeStateActions( FsmState *state )
+{
+	/* Find the reduced table behind each of the state's three action
+	 * tables. Empty tables are never looked up and stay null. */
+	RedActionTable *toStateActions = 0;
+	RedActionTable *fromStateActions = 0;
+	RedActionTable *eofActions = 0;
+
+	if ( state->toStateActionTable.length() > 0 )
+		toStateActions = actionTableMap.find( state->toStateActionTable );
+	if ( state->fromStateActionTable.length() > 0 )
+		fromStateActions = actionTableMap.find( state->fromStateActionTable );
+	if ( state->eofActionTable.length() > 0 )
+		eofActions = actionTableMap.find( state->eofActionTable );
+
+	/* With nothing found there is nothing to set on the state. */
+	if ( toStateActions == 0 && fromStateActions == 0 && eofActions == 0 )
+		return;
+
+	/* Translate each table into its id, or -1 where there is none, which
+	 * setStateActions() takes to mean "leave this field alone". */
+	long toStateAction = toStateActions != 0 ? toStateActions->id : -1;
+	long fromStateAction = fromStateActions != 0 ? fromStateActions->id : -1;
+	long eofAction = eofActions != 0 ? eofActions->id : -1;
+
+	/* curState is the offset of the reduced state that receives the
+	 * action pointers. */
+	setStateActions( curState, toStateAction,
+			fromStateAction, eofAction );
+}
+
+void RedFsmBuild::makeStateConditions( FsmState *state )
+{
+	/* A state without conditions is skipped entirely, which also leaves
+	 * curStateCond as it was. */
+	long length = state->stateCondList.length();
+	if ( length <= 0 )
+		return;
+
+	initStateCondList( curState, length );
+	curStateCond = 0;
+
+	/* Register each key range with the id of its condition space. */
+	for ( StateCondList::Iter scdi = state->stateCondList; scdi.lte(); scdi++ )
+		addStateCond( curState, scdi->lowKey, scdi->highKey,
+				scdi->condSpace->condSpaceId );
+}
+
+void RedFsmBuild::makeStateList()
+{
+	/* Allocate the reduced states, one per state of the graph. */
+	initStateList( fsm->stateList.length() );
+
+	/* curState is the offset of the reduced state being filled in. */
+	curState = 0;
+	for ( StateList::Iter st = fsm->stateList; st.lte(); st++, curState++ ) {
+		/* An eof target and eof actions come together or not at all. */
+		bool hasEofTarget = st->eofTarget != 0;
+		assert( hasEofTarget == ( st->eofActionTable.length() > 0 ) );
+
+		makeStateActions( st );
+		makeStateConditions( st );
+		makeTransList( st );
+
+		setId( curState, st->alg.stateNum );
+		if ( st->isFinState() )
+			setFinal( curState );
+
+		/* If there is an eof target, make an eof transition using the
+		 * reduced form of the eof action table. The lookup result is not
+		 * null-checked: the assertion above requires a non-empty table,
+		 * and reduceActionTables() inserts every non-empty eof table. */
+		if ( hasEofTarget ) {
+			RedActionTable *eofActions = actionTableMap.find( st->eofActionTable );
+			setEofTrans( curState, st->eofTarget->alg.stateNum, eofActions->id );
+		}
+	}
+}
+
+void RedFsmBuild::makeEntryPoints()
+{
+	/* Pass the graph's request for an error state on to the reduced machine. */
+	if ( fsm->lmRequiresErrorState )
+		setForcedErrorState();
+
+	/* One entry point per entry in the graph: the key selects the name
+	 * instantiation from nameIndex, the value supplies the state number. */
+	for ( EntryMap::Iter en = fsm->entryPoints; en.lte(); en++ ) {
+		NameInst *nameInst = fsm->nameIndex[en->key];
+		addEntryPoint( en->key, nameInst->name, en->value->alg.stateNum );
+	}
+
+	/* Map every region to an entry id. A region without a name instance
+	 * uses the default region's id, any other region the id of its name
+	 * instance's parent. */
+	for ( RegionList::Iter reg = pd->regionList; reg.lte(); reg++ ) {
+		if ( reg->regionNameInst == 0 )
+			addRegionToEntry( reg->id, pd->defaultRegion->id );
+		else
+			addRegionToEntry( reg->id, reg->regionNameInst->parent->id );
+	}
+}
+
+void RedFsmBuild::makeMachine()
+{
+	/* Action tables. Their ids are handed out here, before anything looks them up. */
+	reduceActionTables();
+	/* Actions come first: the table list and the conditions both index allActions. */
+	makeActionList();
+	makeActionTableList();
+	makeConditions();
+
+	/* Start state. Must be set before makeStateList(): initStateList() asserts it. */
+	startState = fsm->startState->alg.stateNum;
+	
+	/* Error state. Keeps its constructor value of -1 when the graph has none. */
+	if ( fsm->errState != 0 )
+		errState = fsm->errState->alg.stateNum;
+	/* Entry point offsets are collected first; initStateList() resolves them. */
+	makeEntryPoints();
+	makeStateList();
+}
+
+void RedFsmBuild::makeConditions()
+{
+	/* Nothing to do, and curCondSpace is left alone, without any spaces. */
+	long length = condData->condSpaceMap.length();
+	if ( length <= 0 )
+		return;
+
+	/* Number the condition spaces in map order. */
+	long nextCondSpaceId = 0;
+	for ( CondSpaceMap::Iter cs = condData->condSpaceMap; cs.lte(); cs++ )
+		cs->condSpaceId = nextCondSpaceId++;
+
+	initCondSpaceList( length );
+	curCondSpace = 0;
+
+	/* Fill slot after slot: first the id and base key, then the action
+	 * offset of every member of the space's condition set. */
+	for ( CondSpaceMap::Iter cs = condData->condSpaceMap; cs.lte(); cs++ ) {
+		newCondSpace( curCondSpace, cs->condSpaceId, cs->baseKey );
+		for ( CondSet::Iter csi = cs->condSet; csi.lte(); csi++ )
+			condSpaceItem( curCondSpace, (*csi)->actionId );
+
+		curCondSpace += 1;
+	}
+}
+
+RedFsm *RedFsmBuild::reduceMachine()
+{
+	redFsm = new RedFsm();
+	redFsm->wantComplete = true;
+	/* The new machine is returned and also stays in the public redFsm member. */
+	/* Build actions, action tables, conditions, entry points and states. */
+	makeMachine();
+
+	/* Do this before distributing transitions out to singles and defaults;
+	 * findMaxKey() asserts that none have been chosen yet. */
+	redFsm->maxKey = findMaxKey();
+
+	redFsm->assignActionLocs();
+
+	/* Find the first final state (The final state with the lowest id). */
+	redFsm->findFirstFinState();
+
+	/* Choose default transitions and the single transition. */
+	redFsm->chooseDefaultSpan();
+		
+	/* Maybe do flat expand, otherwise choose single. */
+	redFsm->chooseSingle();
+
+	/* Set up incoming transitions. */
+	redFsm->setInTrans();
+
+	/* Analyze Machine will find the final action reference counts, among
+	 * other things. We will use these in reporting the usage
+	 * of fsm directives in action code. */
+	redFsm->analyzeMachine();
+
+	return redFsm;
+}
+
diff --git a/colm/redbuild.h b/colm/redbuild.h
new file mode 100644
index 00000000..15c00ca2
--- /dev/null
+++ b/colm/redbuild.h
@@ -0,0 +1,161 @@
+/*
+ *  Copyright 2005, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _FSMREDUCE_H
+#define _FSMREDUCE_H
+
+#include <iostream>
+#include "avltree.h"
+#include "fsmgraph.h"
+#include "parsedata.h"
+
+/* Forwards. */
+struct FsmTrans;
+struct FsmGraph;
+struct ParseData;
+struct FsmCodeGen;
+struct RedFsm;
+struct FsmRun;
+struct GenCondSpace;
+struct Condition;
+
+struct RedActionTable
+:
+	public AvlTreeEl<RedActionTable>
+{
+	RedActionTable( const ActionTable &key )
+	:	
+		key(key), 
+		id(0)
+	{ }
+	/* Key accessor. The element holds its own copy of the table (key is stored by value). */
+	const ActionTable &getKey() 
+		{ return key; }
+	/* id starts at 0; RedFsmBuild::reduceActionTables() assigns the real one on insertion. */
+	ActionTable key;
+	int id;
+};
+
+typedef AvlTree<RedActionTable, ActionTable, CmpActionTable> ActionTableMap;
+
+struct NextRedTrans
+{
+	Key lowKey, highKey;
+	FsmTrans *trans;
+	FsmTrans *next;
+	/* Cache trans's successor and keys; a null trans clears next and keeps the keys. */
+	void load() {
+		next = trans != 0 ? trans->next : 0;
+		if ( trans != 0 ) {
+			lowKey = trans->lowKey;
+			highKey = trans->highKey;
+		}
+	}
+	/* Start at t, which may be null. */
+	NextRedTrans( FsmTrans *t ) {
+		trans = t;
+		load();
+	}
+	/* Step to the cached successor; trans stays null once the end is reached. */
+	void increment() {
+		trans = next;
+		load();
+	}
+};
+
+class RedFsmBuild
+{
+public:
+	RedFsmBuild( char *fsmName, ParseData *pd, FsmGraph *fsm );
+	RedFsm *reduceMachine( );
+
+private:
+	void appendTrans( TransListVect &outList, Key lowKey, Key highKey, FsmTrans *trans );
+	void makeStateActions( FsmState *state );
+	void makeStateList();
+	void makeStateConditions( FsmState *state );
+	/* Builders that write into redFsm; snum, cnum and anum are array offsets. */
+	void initActionList( unsigned long length );
+	void newAction( int anum, char *name, int line, int col, Action *action );
+	void initActionTableList( unsigned long length );
+	void initCondSpaceList( ulong length );
+	void condSpaceItem( int cnum, long condActionId );
+	void newCondSpace( int cnum, int condSpaceId, Key baseKey );
+	void initStateCondList( int snum, ulong length );
+	void addStateCond( int snum, Key lowKey, Key highKey, long condNum );
+	void initStateList( unsigned long length );
+	void addRegionToEntry( int regionId, int entryId );
+	void addEntryPoint( int entryId, char *name, unsigned long entryState );
+	void setId( int snum, int id );
+	void initTransList( int snum, unsigned long length );
+	void newTrans( int snum, int tnum, Key lowKey, Key highKey, 
+			long targ, long act );
+	void finishTransList( int snum );
+	void setFinal( int snum );
+	void setEofTrans( int snum, int eofTarget, int actId );
+	void setStateActions( int snum, long toStateAction, 
+			long fromStateAction, long eofAction );
+	void setForcedErrorState();
+	void closeMachine();
+	Key findMaxKey();
+
+	/* NOTE(review): several of the following have no definition in redbuild.cpp -- confirm. */
+	void makeEntryPoints();
+	void makeGetKeyExpr();
+	void makeAccessExpr();
+	void makeCurStateExpr();
+	void makeConditions();
+	void makeInlineList( InlineList *inlineList, InlineItem *context );
+	void makeActionList();
+	void makeActionTableList();
+	void reduceTrans( FsmTrans *trans );
+	void reduceActionTables();
+	void makeTransList( FsmState *state );
+	void makeTrans( Key lowKey, Key highKey, FsmTrans *defTrans );
+	void makeAction( Action *action );
+	void makeLmSwitch( InlineItem *item );
+	void makeMachine();
+	void makeActionExec( InlineItem *item );
+	void makeActionExecTE( InlineItem *item );
+
+	char *fsmName;
+	ParseData *pd;
+	FsmGraph *fsm;
+	ActionTableMap actionTableMap;
+	int nextActionTableId;
+	/* State offsets; -1 until makeMachine() sets them (errState only if the graph has one). */
+	int startState;
+	int errState;
+
+public:
+	RedFsm *redFsm;	/* allocated and returned by reduceMachine() */
+
+private:
+	int curAction;	/* the cur* members are running offsets used while building */
+	int curActionTable;
+	int curTrans;
+	int curState;
+	int curCondSpace;
+	int curStateCond;
+};
+
+
+#endif /* _FSMREDUCE_H */
diff --git a/colm/redfsm.cpp b/colm/redfsm.cpp
new file mode 100644
index 00000000..033bc131
--- /dev/null
+++ b/colm/redfsm.cpp
@@ -0,0 +1,1112 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include <iostream>
+#include <sstream>
+#include "redfsm.h"
+#include "avlmap.h"
+#include "mergesort.h"
+#include "fsmgraph.h"
+#include "parsetree.h"
+#include "fsmrun.h"
+
+using std::ostringstream;
+
+string GenAction::nameOrLoc()
+{
+	/* A named action is identified by its name, otherwise by "line:col". */
+	if ( name != 0 )
+		return string(name);
+
+	ostringstream where;
+	where << loc.line << ":" << loc.col;
+	return where.str();
+}
+
+RedFsm::RedFsm()
+:	/* Every member listed here starts out as 0 or false. */
+	wantComplete(false),
+	forcedErrorState(false),
+	nextActionId(0),
+	nextTransId(0),	/* consumed by allocateTrans() and getErrorTrans() */
+	errState(0),	/* getErrorState() asserts that this has been set */
+	errTrans(0),	/* created on first use by getErrorTrans() */
+	firstFinState(0),	/* filled in by findFirstFinState() */
+	numFinStates(0),
+	allActions(0),
+	allActionTables(0),
+	allConditions(0),
+	allCondSpaces(0),
+	allStates(0),
+	bAnyToStateActions(false),	/* analyzeMachine() raises this and the next three */
+	bAnyFromStateActions(false),
+	bAnyRegActions(false),
+	bAnyEofActions(false),
+	bAnyActionGotos(false),
+	bAnyActionCalls(false),
+	bAnyActionRets(false),
+	bAnyRegActionRets(false),
+	bAnyRegActionByValControl(false),
+	bAnyRegNextStmt(false),
+	bAnyRegCurStateRef(false),
+	bAnyRegBreak(false),
+	bAnyLmSwitchError(false),	/* raised by analyzeAction() */
+	bAnyConditions(false)	/* raised by analyzeMachine() */
+{
+}
+
+/* Does the machine have any actions, i.e. is actionMap non-empty. */
+bool RedFsm::anyActions()
+{
+	return actionMap.length() > 0;
+}
+
+void RedFsm::depthFirstOrdering( RedState *state )
+{
+	/* Depth-first walk: append the state to stateList, then recurse into the
+	 * targets of its single, range and default transitions. A state that is
+	 * already on the list is skipped, which also ends the walk on cycles. */
+	if ( state->onStateList )
+		return;
+
+	/* Doing depth first, put state on the list before visiting targets. */
+	state->onStateList = true;
+	stateList.append( state );
+
+	/* Recurse on singles. Asserts stating that only ranges exist at this
+	 * point (outSingle empty, defTrans null) have been disabled here, so the
+	 * singles and the default are followed as well. */
+	for ( RedTransList::Iter stel = state->outSingle; stel.lte(); stel++ ) {
+		if ( stel->value->targ != 0 )
+			depthFirstOrdering( stel->value->targ );
+	}
+
+	/* Recurse on ranges. */
+	for ( RedTransList::Iter rtel = state->outRange; rtel.lte(); rtel++ ) {
+		if ( rtel->value->targ != 0 )
+			depthFirstOrdering( rtel->value->targ );
+	}
+
+	if ( state->defTrans != 0 && state->defTrans->targ != 0 )
+		depthFirstOrdering( state->defTrans->targ );
+}
+
+/* Rebuild stateList in depth-first order of the transition connections. */
+void RedFsm::depthFirstOrdering()
+{
+	/* Clear the on-state-list flags so the walk can tell visited states. */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ )
+		st->onStateList = false;
+	
+	/* Clear out the state list, we will rebuild it. Keep the old length. */
+	int stateListLen = stateList.length();
+	stateList.abandon();
+
+	/* Add back to the state list from the start state and all other entry
+	 * points, and from the error state when one has been forced. */
+	depthFirstOrdering( startState );
+	for ( RedStateSet::Iter en = entryPoints; en.lte(); en++ )
+		depthFirstOrdering( *en );
+	if ( forcedErrorState )
+		depthFirstOrdering( errState );
+	
+	/* Make sure we put everything back on: no state may be unreachable. */
+	assert( stateListLen == stateList.length() );
+}
+
+/* Number the states 0, 1, 2, ... in the order they sit in the state list. */
+void RedFsm::sequentialStateIds()
+{
+	/* Ids must begin at zero, table based machines depend on it. */
+	nextStateId = 0;
+	for ( RedStateList::Iter st = stateList; st.lte(); st++, nextStateId++ )
+		st->id = nextStateId;
+}
+
+/* Stable sort the states by final state status: non-final first. */
+void RedFsm::sortStatesByFinal()
+{
+	/* Move forward through the list and throw final states onto the end. */
+	RedState *state = 0;
+	RedState *next = stateList.head;
+	RedState *last = stateList.tail;	/* tail before any move, the walk stops here */
+	while ( state != last ) {
+		/* Move forward and load up the next before state may be relinked. */
+		state = next;
+		next = state->next;
+
+		/* Throw to the end? Finals keep their relative order this way. */
+		if ( state->isFinal ) {
+			stateList.detach( state );
+			stateList.append( state );
+		}
+	}
+}
+
+/* Assign state ids by final state status: every non-final state gets a lower
+ * id than any final state, list order is kept inside each group. */
+void RedFsm::sortStateIdsByFinal()
+{
+	/* Table based machines depend on this starting at zero. */
+	nextStateId = 0;
+
+	/* Round 0 numbers the non-final states, round 1 the final ones. */
+	for ( int round = 0; round < 2; round++ ) {
+		const bool numberFinals = ( round == 1 );
+
+		for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+			const bool selected = numberFinals ? st->isFinal : ! st->isFinal;
+			if ( selected )
+				st->id = nextStateId++;
+		}
+	}
+}
+
+struct CmpStateById
+{
+	/* Three-way compare on the state id, used as the compare policy of the
+	 * MergeSort in sortByStateId(): -1 when st1 has the lower id, 1 when
+	 * st2 has the lower id, 0 when the ids are equal. */
+	static int compare( RedState *st1, RedState *st2 )
+	{
+		if ( st1->id != st2->id )
+			return ( st1->id < st2->id ) ? -1 : 1;
+		return 0;
+	}
+};
+
+void RedFsm::sortByStateId()
+{
+	/* Copy the state pointers into a plain array so they can be sorted. */
+	int pos = 0;
+	RedState **ptrList = new RedState*[stateList.length()];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ )
+		ptrList[pos++] = st;
+	
+	MergeSort<RedState*, CmpStateById> mergeSort;	/* orders by ascending id */
+	mergeSort.sort( ptrList, stateList.length() );
+
+	stateList.abandon();	/* presumably empties the list without freeing the states */
+	for ( int st = 0; st < pos; st++ )
+		stateList.append( ptrList[st] );
+
+	delete[] ptrList;
+}
+
+/* Find the final state with the lowest id; nothing is stored if none is final. */
+void RedFsm::findFirstFinState()
+{
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		if ( st->isFinal && (firstFinState == 0 || st->id < firstFinState->id) )
+			firstFinState = st;
+	}
+}
+
+void RedFsm::assignActionLocs()
+{
+	/* One slot per item plus one more: makeFsmTables() stores the count first. */
+	int offset = 0;
+	for ( GenActionTableMap::Iter act = actionMap; act.lte(); act++ ) {
+		act->location = offset;
+		offset = offset + act->key.length() + 1;
+	}
+}
+
+/* Check if we can extend the current range by displacing any ranges
+ * ahead to the singles. */
+bool RedFsm::canExtend( const RedTransList &list, int pos )
+{
+	/* Get the transition that we want to extend. */
+	RedTrans *extendTrans = list[pos].value;
+
+	/* Look ahead in the transition list; pos always trails next by one. */
+	for ( int next = pos + 1; next < list.length(); pos++, next++ ) {
+		/* If they are not continuous then cannot extend. */
+		Key nextKey = list[next].lowKey;
+		nextKey.decrement();
+		if ( list[pos].highKey != nextKey )
+			break;
+
+		/* Check for the extension property: same transition further on. */
+		if ( extendTrans == list[next].value )
+			return true;
+
+		/* If the span of the next element is more than one, then don't keep
+		 * checking, it won't be moved to single. */
+		unsigned long long nextSpan = keyOps->span( list[next].lowKey, list[next].highKey );
+		if ( nextSpan > 1 )
+			break;
+	}
+	return false;
+}
+
+/* Move ranges that span a single key from outRange to outSingle. */
+void RedFsm::moveTransToSingle( RedState *state )
+{
+	RedTransList &range = state->outRange;
+	RedTransList &single = state->outSingle;
+	for ( int rpos = 0; rpos < range.length(); ) {
+		/* Check if this is a range we can extend. */
+		if ( canExtend( range, rpos ) ) {
+			/* Transfer the elements in between over to the singles. */
+			while ( range[rpos].value != range[rpos+1].value ) {
+				/* Transfer the range to single. */
+				single.append( range[rpos+1] );
+				range.remove( rpos+1 );
+			}
+			
+			/* Extend: swallow the following range with the same transition. */
+			range[rpos].highKey = range[rpos+1].highKey;
+			range.remove( rpos+1 );
+		}
+		/* Maybe move it to the singles. */
+		else if ( keyOps->span( range[rpos].lowKey, range[rpos].highKey ) == 1 ) {
+			single.append( range[rpos] );
+			range.remove( rpos );
+		}
+		else {
+			/* Keeping it in the ranges. Only this branch advances rpos. */
+			rpos += 1;
+		}
+	}
+}
+
+/* Look through ranges and choose suitable single character transitions. */
+void RedFsm::chooseSingle()
+{
+	/* Loop the states. */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Rewrite the transition list taking out the suitable single
+		 * transitions. */
+		moveTransToSingle( st );
+	}
+}
+
+void RedFsm::makeFlat()
+{
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {	/* build flat condList and transList per state */
+		if ( st->stateCondList.length() == 0 ) {
+			st->condLowKey = 0;
+			st->condHighKey = 0;
+		}
+		else {
+			st->condLowKey = st->stateCondList.head->lowKey;
+			st->condHighKey = st->stateCondList.tail->highKey;
+
+			unsigned long long span = keyOps->span( st->condLowKey, st->condHighKey );
+			st->condList = new GenCondSpace*[ span ];
+			memset( st->condList, 0, sizeof(GenCondSpace*)*span );
+
+			for ( GenStateCondList::Iter sci = st->stateCondList; sci.lte(); sci++ ) {
+				unsigned long long base, trSpan;
+				base = keyOps->span( st->condLowKey, sci->lowKey )-1;	/* presumably span is inclusive, so -1 gives the offset */
+				trSpan = keyOps->span( sci->lowKey, sci->highKey );
+				for ( unsigned long long pos = 0; pos < trSpan; pos++ )
+					st->condList[base+pos] = sci->condSpace;
+			}
+		}
+
+		if ( st->outRange.length() == 0 ) {
+			st->lowKey = st->highKey = 0;
+			st->transList = 0;
+		}
+		else {
+			st->lowKey = st->outRange[0].lowKey;
+			st->highKey = st->outRange[st->outRange.length()-1].highKey;
+			unsigned long long span = keyOps->span( st->lowKey, st->highKey );
+			st->transList = new RedTrans*[ span ];
+			memset( st->transList, 0, sizeof(RedTrans*)*span );
+			
+			for ( RedTransList::Iter trans = st->outRange; trans.lte(); trans++ ) {
+				unsigned long long base, trSpan;
+				base = keyOps->span( st->lowKey, trans->lowKey )-1;
+				trSpan = keyOps->span( trans->lowKey, trans->highKey );
+				for ( unsigned long long pos = 0; pos < trSpan; pos++ )
+					st->transList[base+pos] = trans->value;
+			}
+
+			/* Fill in the gaps with the default transition (may be null). */
+			for ( unsigned long long pos = 0; pos < span; pos++ ) {
+				if ( st->transList[pos] == 0 )
+					st->transList[pos] = st->defTrans;
+			}
+		}
+	}
+}
+
+
+/* A default transition has been picked, move it from the outRange to the
+ * default pointer. defTrans may be null, then outRange keeps every element. */
+void RedFsm::moveToDefault( RedTrans *defTrans, RedState *state )
+{
+	/* Rewrite the outRange, omitting any ranges that use 
+	 * the picked default. */
+	RedTransList outRange;
+	for ( RedTransList::Iter rtel = state->outRange; rtel.lte(); rtel++ ) {
+		/* If it does not take the default, copy it over. */
+		if ( rtel->value != defTrans )
+			outRange.append( *rtel );
+	}
+
+	/* Save off the range we just created into the state's range. */
+	state->outRange.transfer( outRange );
+
+	/* Store the default. */
+	state->defTrans = defTrans;
+}
+
+bool RedFsm::alphabetCovered( RedTransList &outRange )
+{
+	/* Cannot cover without any out ranges. */
+	if ( outRange.length() == 0 )
+		return false;
+
+	/* If the first range doesn't start at the lower bound then the
+	 * alphabet is not covered. */
+	RedTransList::Iter rtel = outRange;
+	if ( keyOps->minKey < rtel->lowKey )
+		return false;
+
+	/* Check that every range is next to the previous one, without a gap. */
+	rtel.increment();
+	for ( ; rtel.lte(); rtel++ ) {
+		Key highKey = rtel[-1].highKey;
+		highKey.increment();
+		if ( highKey != rtel->lowKey )
+			return false;
+	}
+
+	/* The last must extend to the upper bound. */
+	RedTransEl *last = &outRange[outRange.length()-1];
+	if ( last->highKey < keyOps->maxKey )
+		return false;
+
+	return true;
+}
+
+RedTrans *RedFsm::chooseDefaultSpan( RedState *state )
+{
+	/* Make a set of the distinct transitions used by the outRange. */
+	RedTransPtrSet stateTransSet;
+	for ( RedTransList::Iter rtel = state->outRange; rtel.lte(); rtel++ )
+		stateTransSet.insert( rtel->value );
+	
+	/* For each transition in the set find how many alphabet characters the
+	 * transition spans, summed over all ranges that use it. */
+	unsigned long long *span = new unsigned long long[stateTransSet.length()];
+	memset( span, 0, sizeof(unsigned long long) * stateTransSet.length() );
+	for ( RedTransList::Iter rtel = state->outRange; rtel.lte(); rtel++ ) {
+		/* Lookup the transition in the set, its index selects the counter. */
+		RedTrans **inSet = stateTransSet.find( rtel->value );
+		int pos = inSet - stateTransSet.data;
+		span[pos] += keyOps->span( rtel->lowKey, rtel->highKey );
+	}
+
+	/* Find the max span, choose it for making the default. Stays null when
+	 * there are no out ranges. */
+	RedTrans *maxTrans = 0;
+	unsigned long long maxSpan = 0;
+	for ( RedTransPtrSet::Iter rtel = stateTransSet; rtel.lte(); rtel++ ) {
+		if ( span[rtel.pos()] > maxSpan ) {
+			maxSpan = span[rtel.pos()];
+			maxTrans = *rtel;
+		}
+	}
+
+	delete[] span;
+	return maxTrans;
+}
+
+/* Pick default transitions from ranges for the states, by largest span. */
+void RedFsm::chooseDefaultSpan()
+{
+	/* Loop the states. */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Only pick a default transition if the alphabet is covered. This
+		 * avoids any transitions in the out range that go to error and avoids
+		 * the need for an ERR state. */
+		if ( alphabetCovered( st->outRange ) ) {
+			/* Pick a default transition by largest span. */
+			RedTrans *defTrans = chooseDefaultSpan( st );
+
+			/* Rewrite the transition list taking out the transition we picked
+			 * as the default and store the default. */
+			moveToDefault( defTrans, st );
+		}
+	}
+}
+
+RedTrans *RedFsm::chooseDefaultGoto( RedState *state )
+{
+	/* Return the first out-range transition whose target is the state that
+	 * follows this one in the state list, or 0 when there is none. */
+	for ( RedTransList::Iter rtel = state->outRange; rtel.lte(); rtel++ ) {
+		if ( rtel->value->targ == state->next )
+			return rtel->value;
+	}
+	return 0;
+}
+
+void RedFsm::chooseDefaultGoto()
+{
+	/* Loop the states. */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Pick a default transition: prefer one to the next state in the
+		 * list, else fall back to the largest span. */
+		RedTrans *defTrans = chooseDefaultGoto( st );
+		if ( defTrans == 0 )
+			defTrans = chooseDefaultSpan( st );
+		/* Rewrite the transition list taking out the transition we picked
+		 * as the default and store the default. */
+		moveToDefault( defTrans, st );
+	}
+}
+
+RedTrans *RedFsm::chooseDefaultNumRanges( RedState *state )
+{
+	/* Make a set of the distinct transitions used by the outRange. */
+	RedTransPtrSet stateTransSet;
+	for ( RedTransList::Iter rtel = state->outRange; rtel.lte(); rtel++ )
+		stateTransSet.insert( rtel->value );
+	
+	/* For each transition in the set find how many ranges use it. */
+	int *numRanges = new int[stateTransSet.length()];
+	memset( numRanges, 0, sizeof(int) * stateTransSet.length() );
+	for ( RedTransList::Iter rtel = state->outRange; rtel.lte(); rtel++ ) {
+		/* Lookup the transition in the set, its index selects the counter. */
+		RedTrans **inSet = stateTransSet.find( rtel->value );
+		numRanges[inSet - stateTransSet.data] += 1;
+	}
+
+	/* Find the max number of ranges. Stays null when there are no ranges. */
+	RedTrans *maxTrans = 0;
+	int maxNumRanges = 0;
+	for ( RedTransPtrSet::Iter rtel = stateTransSet; rtel.lte(); rtel++ ) {
+		if ( numRanges[rtel.pos()] > maxNumRanges ) {
+			maxNumRanges = numRanges[rtel.pos()];
+			maxTrans = *rtel;
+		}
+	}
+
+	delete[] numRanges;
+	return maxTrans;
+}
+
+void RedFsm::chooseDefaultNumRanges()
+{
+	/* Loop the states. */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Pick the transition that is used by the most ranges. */
+		RedTrans *defTrans = chooseDefaultNumRanges( st );
+
+		/* Rewrite the transition list taking out the transition we picked
+		 * as the default and store the default. */
+		moveToDefault( defTrans, st );
+	}
+}
+
+RedTrans *RedFsm::getErrorTrans( )
+{
+	/* If the error trans has not been made already, make it. */
+	if ( errTrans == 0 ) {
+		/* This insert should always succeed since no transition created by
+		 * the user can point to the error state. */
+		errTrans = new RedTrans( getErrorState(), 0, nextTransId++ );
+		RedTrans *inRes = transSet.insert( errTrans );
+		assert( inRes != 0 );
+	}
+	return errTrans;
+}
+
+RedState *RedFsm::getErrorState()
+{
+	/* An error state is needed here. If the assert fires then one was not
+	 * supplied by the frontend; with asserts off a null pointer is returned. */
+	assert( errState != 0 );
+	return errState;
+}
+
+
+RedTrans *RedFsm::allocateTrans( RedState *targ, RedAction *action )
+{
+	/* Create a reduced trans and look for it in the transition set. */
+	RedTrans redTrans( targ, action, 0 );
+	RedTrans *inDict = transSet.find( &redTrans );
+	if ( inDict == 0 ) {
+		inDict = new RedTrans( targ, action, nextTransId++ );	/* not there yet, make it with a fresh id */
+		transSet.insert( inDict );
+	}
+	return inDict;
+}
+
+void RedFsm::partitionFsm( int nparts )
+{
+	/* At this point the states are ordered by a depth-first traversal. We
+	 * will allocate to partitions based on this ordering. */
+	this->nParts = nparts;
+	int partSize = stateList.length() / nparts;	/* nparts is a divisor, it must not be zero */
+	int remainder = stateList.length() % nparts;	/* that many leading partitions take one extra state */
+	int numInPart = partSize;
+	int partition = 0;
+	if ( remainder-- > 0 )
+		numInPart += 1;
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		st->partition = partition;
+
+		numInPart -= 1;
+		if ( numInPart == 0 ) {
+			partition += 1;	/* current partition is full, open the next one */
+			numInPart = partSize;
+			if ( remainder-- > 0 )
+				numInPart += 1;
+		}
+	}
+}
+
+void RedFsm::setInTrans()
+{
+	/* First pass counts the number of transitions going into each state.
+	 * NOTE(review): targ is used unchecked, depthFirstOrdering tests it. */
+	for ( RedTransSet::Iter trans = transSet; trans.lte(); trans++ )
+		trans->targ->numInTrans += 1;
+	/* Pass over states to allocate the needed memory. Reset the counts so we
+	 * can use them as the current size. */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		st->inTrans = new RedTrans*[st->numInTrans];
+		st->numInTrans = 0;
+	}
+
+	/* Second pass over transitions copies pointers into the in trans list. */
+	for ( RedTransSet::Iter trans = transSet; trans.lte(); trans++ )
+		trans->targ->inTrans[trans->targ->numInTrans++] = trans;
+}
+
+GenCondSpace *RedFsm::findCondSpace( Key lowKey, Key highKey )
+{
+	for ( CondSpaceList::Iter cs = condSpaceList; cs.lte(); cs++ ) {	/* first cond space containing [lowKey, highKey] */
+		Key csHighKey = cs->baseKey;
+		csHighKey += keyOps->alphSize() * (1 << cs->condSet.length());	/* alphabet size times 2^(number of conditions) */
+
+		if ( lowKey >= cs->baseKey && highKey <= csHighKey )
+			return cs;
+	}
+	return 0;
+}
+
+Condition *RedFsm::findCondition( Key key )
+{
+	for ( ConditionList::Iter cond = conditionList; cond.lte(); cond++ ) {	/* first match wins, 0 when none */
+		Key upperKey = cond->baseKey + (1 << cond->condSet.length());
+		if ( cond->baseKey <= key && key <= upperKey )	/* NOTE(review): upper bound is inclusive, confirm */
+			return cond;
+	}
+	return 0;
+}
+
+void RedFsm::setValueLimits()
+{
+	maxSingleLen = 0;
+	maxRangeLen = 0;
+	maxKeyOffset = 0;
+	maxIndexOffset = 0;
+	maxActListId = 0;
+	maxActionLoc = 0;
+	maxActArrItem = 0;
+	maxSpan = 0;
+	maxCondSpan = 0;
+	maxFlatIndexOffset = 0;
+	maxCondOffset = 0;
+	maxCondLen = 0;
+	maxCondSpaceId = 0;
+	maxCondIndexOffset = 0;
+
+	/* In both of these cases the 0 index is reserved for no value, so the max
+	 * is one more than it would be if they started at 0. */
+	maxIndex = transSet.length();
+	maxCond = condSpaceList.length(); 
+
+	/* The nextStateId - 1 is the last state id assigned. */
+	maxState = nextStateId - 1;
+
+	for ( CondSpaceList::Iter csi = condSpaceList; csi.lte(); csi++ ) {
+		if ( csi->condSpaceId > maxCondSpaceId )
+			maxCondSpaceId = csi->condSpaceId;
+	}
+
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Maximum cond length. */
+		if ( st->stateCondList.length() > maxCondLen )
+			maxCondLen = st->stateCondList.length();
+
+		/* Maximum single length. */
+		if ( st->outSingle.length() > maxSingleLen )
+			maxSingleLen = st->outSingle.length();
+
+		/* Maximum range length. */
+		if ( st->outRange.length() > maxRangeLen )
+			maxRangeLen = st->outRange.length();
+
+		/* The key offset index offset for the state after last is not used, skip it. */
+		if ( ! st.last() ) {
+			maxCondOffset += st->stateCondList.length();
+			maxKeyOffset += st->outSingle.length() + st->outRange.length()*2;
+			maxIndexOffset += st->outSingle.length() + st->outRange.length() + 1;
+		}
+
+		/* Max cond span. */
+		if ( st->condList != 0 ) {
+			unsigned long long span = keyOps->span( st->condLowKey, st->condHighKey );
+			if ( span > maxCondSpan )
+				maxCondSpan = span;
+		}
+
+		/* Max key span. */
+		if ( st->transList != 0 ) {
+			unsigned long long span = keyOps->span( st->lowKey, st->highKey );
+			if ( span > maxSpan )
+				maxSpan = span;
+		}
+
+		/* Max cond index offset. */
+		if ( ! st.last() ) {
+			if ( st->condList != 0 )
+				maxCondIndexOffset += keyOps->span( st->condLowKey, st->condHighKey );
+		}
+
+		/* Max flat index offset. */
+		if ( ! st.last() ) {
+			if ( st->transList != 0 )
+				maxFlatIndexOffset += keyOps->span( st->lowKey, st->highKey );
+			maxFlatIndexOffset += 1;
+		}
+	}
+
+	for ( GenActionTableMap::Iter at = actionMap; at.lte(); at++ ) {
+		/* Maximum id of action lists. */
+		if ( at->actListId+1 > maxActListId )
+			maxActListId = at->actListId+1;
+
+		/* Maximum location of items in action array. */
+		if ( at->location+1 > maxActionLoc )
+			maxActionLoc = at->location+1;
+
+		/* Maximum values going into the action array: lengths and ids. */
+		if ( at->key.length() > maxActArrItem )
+			maxActArrItem = at->key.length();
+		for ( GenActionTable::Iter item = at->key; item.lte(); item++ ) {
+			if ( item->value->actionId > maxActArrItem )
+				maxActArrItem = item->value->actionId;
+		}
+	}
+}
+
+void RedFsm::findFinalActionRefs()
+{
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Reference count out of single transitions. */
+		for ( RedTransList::Iter rtel = st->outSingle; rtel.lte(); rtel++ ) {
+			if ( rtel->value->action != 0 ) {
+				rtel->value->action->numTransRefs += 1;
+				for ( GenActionTable::Iter item = rtel->value->action->key; item.lte(); item++ )
+					item->value->numTransRefs += 1;
+			}
+		}
+
+		/* Reference count out of range transitions. */
+		for ( RedTransList::Iter rtel = st->outRange; rtel.lte(); rtel++ ) {
+			if ( rtel->value->action != 0 ) {
+				rtel->value->action->numTransRefs += 1;
+				for ( GenActionTable::Iter item = rtel->value->action->key; item.lte(); item++ )
+					item->value->numTransRefs += 1;
+			}
+		}
+
+		/* Reference count default transition. */
+		if ( st->defTrans != 0 && st->defTrans->action != 0 ) {
+			st->defTrans->action->numTransRefs += 1;
+			for ( GenActionTable::Iter item = st->defTrans->action->key; item.lte(); item++ )
+				item->value->numTransRefs += 1;
+		}
+
+		/* Reference count to state actions. */
+		if ( st->toStateAction != 0 ) {
+			st->toStateAction->numToStateRefs += 1;
+			for ( GenActionTable::Iter item = st->toStateAction->key; item.lte(); item++ )
+				item->value->numToStateRefs += 1;
+		}
+
+		/* Reference count from state actions. */
+		if ( st->fromStateAction != 0 ) {
+			st->fromStateAction->numFromStateRefs += 1;
+			for ( GenActionTable::Iter item = st->fromStateAction->key; item.lte(); item++ )
+				item->value->numFromStateRefs += 1;
+		}
+
+		/* Reference count EOF actions. */
+		if ( st->eofAction != 0 ) {
+			st->eofAction->numEofRefs += 1;
+			for ( GenActionTable::Iter item = st->eofAction->key; item.lte(); item++ )
+				item->value->numEofRefs += 1;
+		}
+	}
+}
+
+void RedFsm::analyzeAction( GenAction *act, InlineList *inlineList )
+{
+	for ( InlineList::Iter item = *inlineList; item.lte(); item++ ) {
+		/* Check for various things in regular actions (not EOF-only ones). */
+		if ( act->numTransRefs > 0 || act->numToStateRefs > 0 || 
+				act->numFromStateRefs > 0 )
+		{
+			if ( item->type == InlineItem::LmSwitch && 
+					item->tokenRegion->lmSwitchHandlesError )
+			{
+				bAnyLmSwitchError = true;
+			}
+		}
+
+		if ( item->children != 0 )	/* descend into nested inline lists */
+			analyzeAction( act, item->children );
+	}
+}
+
+void RedFsm::analyzeActionList( RedAction *redAct, InlineList *inlineList )
+{
+	for ( InlineList::Iter item = *inlineList; item.lte(); item++ ) {	/* only walks the tree, nothing is recorded */
+		if ( item->children != 0 )
+			analyzeActionList( redAct, item->children );
+	}
+}
+
+/* Give consecutive ids, from zero, to the actions referenced at least once. */
+void RedFsm::assignActionIds()
+{
+	int freshId = 0;	/* local counter, the nextActionId member is untouched */
+	for ( GenActionList::Iter act = actionList; act.lte(); act++ ) {
+		if ( act->numRefs() <= 0 )
+			continue;
+		act->actionId = freshId++;
+	}
+}
+
+/* Gather various info on the machine. */
+void RedFsm::analyzeMachine()
+{
+	/* Find the true count of action references.  */
+	findFinalActionRefs();
+
+	/* Check if there are any calls in action code. */
+	for ( GenActionList::Iter act = actionList; act.lte(); act++ ) {
+		/* Record the occurrence of various kinds of actions. */
+		if ( act->numToStateRefs > 0 )
+			bAnyToStateActions = true;
+		if ( act->numFromStateRefs > 0 )
+			bAnyFromStateActions = true;
+		if ( act->numEofRefs > 0 )
+			bAnyEofActions = true;
+		if ( act->numTransRefs > 0 )
+			bAnyRegActions = true;
+
+		/* Recurse through the action's parse tree looking for various things. */
+		analyzeAction( act, act->inlineList );
+	}
+
+	/* Analyze reduced action lists. */
+	for ( GenActionTableMap::Iter redAct = actionMap; redAct.lte(); redAct++ ) {
+		for ( GenActionTable::Iter act = redAct->key; act.lte(); act++ )
+			analyzeActionList( redAct, act->value->inlineList );
+	}
+
+	/* Find states that have transitions with actions that reference the
+	 * current state. */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Check any actions out of outSingle. */
+		for ( RedTransList::Iter rtel = st->outSingle; rtel.lte(); rtel++ ) {
+			if ( rtel->value->action != 0 && rtel->value->action->anyCurStateRef() )
+				st->bAnyRegCurStateRef = true;
+		}
+
+		/* Check any actions out of outRange. */
+		for ( RedTransList::Iter rtel = st->outRange; rtel.lte(); rtel++ ) {
+			if ( rtel->value->action != 0 && rtel->value->action->anyCurStateRef() )
+				st->bAnyRegCurStateRef = true;
+		}
+
+		/* Check any action out of default. */
+		if ( st->defTrans != 0 && st->defTrans->action != 0 && 
+				st->defTrans->action->anyCurStateRef() )
+			st->bAnyRegCurStateRef = true;
+		
+		if ( st->stateCondList.length() > 0 )
+			bAnyConditions = true;
+	}
+
+	/* Assign ids to actions that are referenced. */
+	assignActionIds();
+
+	/* Set the maximums of various values used for deciding types. */
+	setValueLimits();
+}
+
+int transAction( RedTrans *trans )
+{
+	/* Zero stands for no action, otherwise the table's location plus one. */
+	if ( trans->action == 0 )
+		return 0;
+	return trans->action->location + 1;
+}
+
+int toStateAction( RedState *state )
+{
+	/* Zero stands for no action, otherwise the table's location plus one. */
+	if ( state->toStateAction == 0 )
+		return 0;
+	return state->toStateAction->location + 1;
+}
+
+int fromStateAction( RedState *state )
+{
+	/* Zero stands for no action, otherwise the table's location plus one. */
+	if ( state->fromStateAction == 0 )
+		return 0;
+	return state->fromStateAction->location + 1;
+}
+
+int eofAction( RedState *state )
+{
+	/* Zero stands for no action, otherwise the table's location plus one. */
+	if ( state->eofAction == 0 )
+		return 0;
+	return state->eofAction->location + 1;
+}
+
+
+FsmTables *RedFsm::makeFsmTables()
+{
+	/* The fsm runtime needs states sorted by id. */
+	sortByStateId();
+
+	int pos, curKeyOffset, curIndOffset;
+	FsmTables *fsmTables = new FsmTables;
+	fsmTables->numStates = stateList.length();
+
+	/*
+	 * actions: a leading 0, then for each table its length and action ids
+	 */
+
+	fsmTables->numActions = 1;
+	for ( GenActionTableMap::Iter act = actionMap; act.lte(); act++ )
+		fsmTables->numActions += 1 + act->key.length();
+
+	pos = 0;
+	fsmTables->actions = new long[fsmTables->numActions];
+	fsmTables->actions[pos++] = 0;
+	for ( GenActionTableMap::Iter act = actionMap; act.lte(); act++ ) {
+		fsmTables->actions[pos++] = act->key.length();
+		for ( GenActionTable::Iter item = act->key; item.lte(); item++ )
+			fsmTables->actions[pos++] = item->value->actionId;
+	}
+
+	/*
+	 * keyOffset: where each state's keys start inside transKeys
+	 */
+	pos = 0, curKeyOffset = 0;
+	fsmTables->keyOffsets = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		/* Store the current offset. */
+		fsmTables->keyOffsets[pos++] = curKeyOffset;
+
+		/* Move the key offset ahead. */
+		curKeyOffset += st->outSingle.length() + st->outRange.length()*2;
+	}
+
+	/*
+	 * transKeys: per state the single keys, then low/high pairs of ranges
+	 */
+	fsmTables->numTransKeys = 0;
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		fsmTables->numTransKeys += st->outSingle.length();
+		fsmTables->numTransKeys += 2 * st->outRange.length();
+	}
+
+	pos = 0;
+	fsmTables->transKeys = new char[fsmTables->numTransKeys];	/* NOTE(review): keys are stored as char, confirm they fit */
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		for ( RedTransList::Iter stel = st->outSingle; stel.lte(); stel++ )
+			fsmTables->transKeys[pos++] = stel->lowKey.getVal();
+		for ( RedTransList::Iter rtel = st->outRange; rtel.lte(); rtel++ ) {
+			fsmTables->transKeys[pos++] = rtel->lowKey.getVal();
+			fsmTables->transKeys[pos++] = rtel->highKey.getVal();
+		}
+	}
+
+	/*
+	 * singleLengths: number of single transitions of each state
+	 */
+	pos = 0;
+	fsmTables->singleLengths = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ )
+		fsmTables->singleLengths[pos++] = st->outSingle.length();
+
+	/*
+	 * rangeLengths: number of range transitions of each state
+	 */
+	pos = 0;
+	fsmTables->rangeLengths = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ )
+		fsmTables->rangeLengths[pos++] = st->outRange.length();
+
+	/*
+	 * indexOffsets: where each state starts in the WI tables below
+	 */
+	pos = 0, curIndOffset = 0;
+	fsmTables->indexOffsets = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		fsmTables->indexOffsets[pos++] = curIndOffset;
+
+		curIndOffset += st->outSingle.length() + st->outRange.length();
+		if ( st->defTrans != 0 )
+			curIndOffset += 1;
+	}
+
+	/*
+	 * transTargsWI: target ids of the singles, the ranges, then the default
+	 */
+	fsmTables->numTransTargsWI = 0;
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		fsmTables->numTransTargsWI += st->outSingle.length();
+		fsmTables->numTransTargsWI += st->outRange.length();
+		if ( st->defTrans != 0 )
+			fsmTables->numTransTargsWI += 1;
+	}
+
+	pos = 0;
+	fsmTables->transTargsWI = new long[fsmTables->numTransTargsWI];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		for ( RedTransList::Iter stel = st->outSingle; stel.lte(); stel++ )
+			fsmTables->transTargsWI[pos++] = stel->value->targ->id;
+
+		for ( RedTransList::Iter rtel = st->outRange; rtel.lte(); rtel++ )
+			fsmTables->transTargsWI[pos++] = rtel->value->targ->id;
+
+		if ( st->defTrans != 0 )
+			fsmTables->transTargsWI[pos++] = st->defTrans->targ->id;
+	}
+
+	/*
+	 * transActionsWI: same layout as transTargsWI, holding action indices
+	 */
+	fsmTables->numTransActionsWI = 0;
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		fsmTables->numTransActionsWI += st->outSingle.length();
+		fsmTables->numTransActionsWI += st->outRange.length();
+		if ( st->defTrans != 0 )
+			fsmTables->numTransActionsWI += 1;
+	}
+
+	pos = 0;
+	fsmTables->transActionsWI = new long[fsmTables->numTransActionsWI];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		for ( RedTransList::Iter stel = st->outSingle; stel.lte(); stel++ )
+			fsmTables->transActionsWI[pos++] = transAction( stel->value );
+
+		for ( RedTransList::Iter rtel = st->outRange; rtel.lte(); rtel++ )
+			fsmTables->transActionsWI[pos++] = transAction( rtel->value );
+
+		if ( st->defTrans != 0 )
+			fsmTables->transActionsWI[pos++] = transAction( st->defTrans );
+	}
+
+	/*
+	 * toStateActions: per state action index, 0 when there is none
+	 */
+	pos = 0;
+	fsmTables->toStateActions = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ )
+		fsmTables->toStateActions[pos++] = toStateAction( st );
+
+	/*
+	 * fromStateActions: per state action index, 0 when there is none
+	 */
+	pos = 0;
+	fsmTables->fromStateActions = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ )
+		fsmTables->fromStateActions[pos++] = fromStateAction( st );
+
+	/*
+	 * eofActions: per state action index, 0 when there is none
+	 */
+	pos = 0;
+	fsmTables->eofActions = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ )
+		fsmTables->eofActions[pos++] = eofAction( st );
+
+	/*
+	 * eofTargs: id of the eof transition's target, -1 when there is none
+	 */
+	pos = 0;
+	fsmTables->eofTargs = new long[fsmTables->numStates];
+	for ( RedStateList::Iter st = stateList; st.lte(); st++ ) {
+		int targ = -1;
+		if ( st->eofTrans != 0 )
+			targ = st->eofTrans->targ->id;
+		fsmTables->eofTargs[pos++] = targ;
+	}
+
+	/* Start state. */
+	fsmTables->startState = startState->id;
+
+	/* First final state, or one past the last id when none is final. */
+	fsmTables->firstFinal = ( firstFinState != 0 ) ?
+		firstFinState->id : nextStateId;
+
+	/* The error state, -1 when the machine has none. */
+	fsmTables->errorState = ( errState != 0 ) ?
+		errState->id : -1;
+
+	/* The array pointing to actions. */
+	pos = 0;
+	fsmTables->numActionSwitch = actionList.length();
+	fsmTables->actionSwitch = new GenAction*[fsmTables->numActionSwitch];
+	for ( GenActionList::Iter act = actionList; act.lte(); act++ )
+		fsmTables->actionSwitch[pos++] = act;
+	
+	/*
+	 * entryByRegion: slot 0 holds the error state, regions start at slot 1
+	 */
+
+	fsmTables->numRegions = regionToEntry.length()+1;
+	fsmTables->entryByRegion = new long[fsmTables->numRegions];
+	fsmTables->entryByRegion[0] = fsmTables->errorState;
+
+	pos = 1;
+	for ( RegionToEntry::Iter en = regionToEntry; en.lte(); en++ ) {
+		/* Find the entry state from the entry id. */
+		RedEntryMapEl *entryMapEl = redEntryMap.find( *en );
+		
+		/* Save it off, falling back to the error state when not found. */
+		fsmTables->entryByRegion[pos++] = entryMapEl != 0 ? entryMapEl->value 
+				: fsmTables->errorState;
+	}
+	
+	return fsmTables;
+}
+
+
diff --git a/colm/redfsm.h b/colm/redfsm.h
new file mode 100644
index 00000000..161df043
--- /dev/null
+++ b/colm/redfsm.h
@@ -0,0 +1,531 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _REDFSM_H
+#define _REDFSM_H
+
+#include <assert.h>
+#include <string.h>
+#include <string>
+#include "common.h"
+#include "vector.h"
+#include "dlist.h"
+#include "compare.h"
+#include "bstmap.h"
+#include "bstset.h"
+#include "avlmap.h"
+#include "avltree.h"
+#include "avlbasic.h"
+#include "mergesort.h"
+#include "sbstmap.h"
+#include "sbstset.h"
+#include "sbsttable.h"
+#include "colm.h"
+
+#define TRANS_ERR_TRANS   0
+#define STATE_ERR_STATE   0
+#define FUNC_NO_FUNC      0
+
+using std::string;
+
+struct RedState;
+struct InlineList;
+struct GenAction;
+struct FsmTables;
+struct ParseData;
+struct ObjField;
+
+typedef DList<GenAction> GenActionList;
+
+/* Element in list of actions. Contains the inline code to execute. */
+struct GenAction 
+:
+	public DListEl<GenAction>
+{
+	GenAction( )
+	:
+		name(0),
+		inlineList(0), 
+		actionId(0),
+		objField(0), markType(MarkEnter),
+		numTransRefs(0),
+		numToStateRefs(0),
+		numFromStateRefs(0),
+		numEofRefs(0)
+	{ }
+
+	/* Data collected during parse. */
+	InputLoc loc;
+	char *name;
+	InlineList *inlineList;
+	int actionId;
+	ObjField *objField;
+	MarkType markType;
+
+	string nameOrLoc();
+
+	/* Number of references in the final machine: the sum of the counts below. */
+	int numRefs() 
+		{ return numTransRefs + numToStateRefs + numFromStateRefs + numEofRefs; }
+	int numTransRefs;
+	int numToStateRefs;
+	int numFromStateRefs;
+	int numEofRefs;
+};
+
+
+/* Forwards. */
+struct RedState;
+struct FsmState;
+
+/* Transition GenAction Element. */
+typedef SBstMapEl< int, GenAction* > GenActionTableEl;
+
+/* Transition GenAction Table.  */
+struct GenActionTable 
+	: public SBstMap< int, GenAction*, CmpOrd<int> >
+{
+	void setAction( int ordering, GenAction *action );
+	void setActions( int *orderings, GenAction **actions, int nActs );
+	void setActions( const GenActionTable &other );
+};
+
+/* Orders action table elements by key first, then by value (the action
+ * pointer). Yields -1, 0 or 1. */
+struct GenCmpActionTableEl
+{
+	static int compare( const GenActionTableEl &action1, 
+			const GenActionTableEl &action2 )
+	{
+		/* The ordering key decides unless both elements share it. */
+		if ( action1.key != action2.key )
+			return action1.key < action2.key ? -1 : 1;
+
+		/* Same key: fall back to comparing the action pointers. */
+		if ( action1.value != action2.value )
+			return action1.value < action2.value ? -1 : 1;
+		return 0;
+	}
+};
+
+/* Compare for GenActionTable. */
+typedef CmpSTable< GenActionTableEl, GenCmpActionTableEl > GenCmpActionTable;
+
+/* Set of states. */
+typedef BstSet<RedState*> RedStateSet;
+typedef BstSet<int> IntSet;
+
+/* Reduced action. Wraps one action table (the key) and its usage counts. */
+struct RedAction
+:
+	public AvlTreeEl<RedAction>
+{
+	RedAction( )
+	:	
+		key(), actListId(0), location(0),
+		eofRefs(0),
+		numTransRefs(0),
+		numToStateRefs(0),
+		numFromStateRefs(0),
+		numEofRefs(0),
+		bAnyNextStmt(false), 
+		bAnyCurStateRef(false),
+		bAnyBreakStmt(false)
+	{ }
+	
+	const GenActionTable &getKey() 
+		{ return key; }
+
+	GenActionTable key;
+	int actListId;
+	int location;
+	IntSet *eofRefs;
+
+	/* Number of references in the final machine (a count, not a flag). */
+	int numRefs() 
+		{ return numTransRefs + numToStateRefs + numFromStateRefs + numEofRefs; }
+	int numTransRefs;
+	int numToStateRefs;
+	int numFromStateRefs;
+	int numEofRefs;
+
+	bool anyNextStmt() { return bAnyNextStmt; }
+	bool anyCurStateRef() { return bAnyCurStateRef; }
+	bool anyBreakStmt() { return bAnyBreakStmt; }
+
+	bool bAnyNextStmt;
+	bool bAnyCurStateRef;
+	bool bAnyBreakStmt;
+};
+typedef AvlTree<RedAction, GenActionTable, GenCmpActionTable> GenActionTableMap;
+
+/* Reduced transition: a target state, a shared action table and an id. */
+struct RedTrans
+:
+	public AvlTreeEl<RedTrans>
+{
+	RedTrans( RedState *targ, RedAction *action, int id )
+		: targ(targ), action(action), id(id), partitionBoundary(false), labelNeeded(true) { }
+
+	RedState *targ;
+	RedAction *action;
+	int id;
+	bool partitionBoundary;
+	bool labelNeeded;
+};
+
+/* Ordering used for the final reduction of transitions. Two transitions are
+ * equal when they share both the target state and the action table pointer;
+ * this assumes the action tables have already been reduced. */
+struct CmpRedTrans
+{
+	static int compare( const RedTrans &t1, const RedTrans &t2 )
+	{
+		/* Primary criterion: the target state pointer. */
+		if ( t1.targ != t2.targ )
+			return t1.targ < t2.targ ? -1 : 1;
+
+		/* Secondary criterion: the shared action table pointer. */
+		if ( t1.action != t2.action )
+			return t1.action < t2.action ? -1 : 1;
+
+		/* Same target and same action table. */
+		return 0;
+	}
+};
+
+typedef AvlBasic<RedTrans, CmpRedTrans> RedTransSet;
+
+/* Element in out range. */
+struct RedTransEl
+{
+	/* Constructors. */
+	RedTransEl( Key lowKey, Key highKey, RedTrans *value ) 
+		: lowKey(lowKey), highKey(highKey), value(value) { }
+
+	Key lowKey, highKey;
+	RedTrans *value;
+};
+
+typedef Vector<RedTransEl> RedTransList;
+typedef Vector<RedState*> RedStateVect;
+
+typedef BstMapEl<RedState*, unsigned long long> RedSpanMapEl;
+typedef BstMap<RedState*, unsigned long long> RedSpanMap;
+
+/* Comparison for sorting span map entries: larger spans order first. */
+struct CmpRedSpanMapEl
+{
+	static int compare( const RedSpanMapEl &smel1, const RedSpanMapEl &smel2 )
+	{
+		/* Equal spans compare equal, whatever the states are. */
+		if ( smel1.value == smel2.value )
+			return 0;
+
+		/* Descending order: the bigger span yields -1. */
+		return smel1.value > smel2.value ? -1 : 1;
+	}
+};
+
+/* Sorting state-span map entries by span. */
+typedef MergeSort<RedSpanMapEl, CmpRedSpanMapEl> RedSpanMapSort;
+
+/* Set of entry ids that go into this state. */
+typedef Vector<int> EntryIdVect;
+typedef Vector<char*> EntryNameVect;
+
+/* Maps entry ids (defined by the frontend) to reduced state ids. */
+typedef BstMap<int, int> RedEntryMap;
+typedef BstMapEl<int, int> RedEntryMapEl;
+
+typedef Vector<int> RegionToEntry;
+
+typedef Vector< GenAction* > GenCondSet;
+
+struct Condition
+{
+	Condition( )
+		: key(0), baseKey(0) {}
+
+	Key key;
+	Key baseKey;
+	GenCondSet condSet;
+
+	Condition *next, *prev;
+};
+typedef DList<Condition> ConditionList;
+
+struct GenCondSpace
+{
+	Key baseKey;
+	GenCondSet condSet;
+	int condSpaceId;
+
+	GenCondSpace *next, *prev;
+};
+typedef DList<GenCondSpace> CondSpaceList;
+
+struct GenStateCond
+{
+	Key lowKey;
+	Key highKey;
+
+	GenCondSpace *condSpace;
+
+	GenStateCond *prev, *next;
+};
+typedef DList<GenStateCond> GenStateCondList;
+typedef Vector<GenStateCond*> StateCondVect;
+
+/* Reduced state. */
+struct RedState
+{
+	RedState()
+	: 
+		defTrans(0), 
+		condList(0),
+		transList(0), 
+		isFinal(false), 
+		labelNeeded(false), 
+		outNeeded(false), 
+		onStateList(false), 
+		toStateAction(0), 
+		fromStateAction(0), 
+		eofAction(0), 
+		eofTrans(0),
+		id(0), 
+		bAnyRegCurStateRef(false),
+		partitionBoundary(false),
+		inTrans(0),
+		numInTrans(0)
+	{ }
+
+	/* Transitions out. */
+	RedTransList outSingle;
+	RedTransList outRange;
+	RedTrans *defTrans;
+
+	/* For flat conditions. */
+	Key condLowKey, condHighKey;
+	GenCondSpace **condList;
+
+	/* For flat keys. */
+	Key lowKey, highKey;
+	RedTrans **transList;
+
+	/* The list of states that transitions from this state go to. */
+	RedStateVect targStates;
+
+	bool isFinal;
+	bool labelNeeded;
+	bool outNeeded;
+	bool onStateList;
+	RedAction *toStateAction;
+	RedAction *fromStateAction;
+	RedAction *eofAction;
+	RedTrans *eofTrans;
+	int id;
+	GenStateCondList stateCondList;
+	StateCondVect stateCondVect;
+
+	/* Pointers for the list of states. */
+	RedState *prev, *next;
+
+	bool anyRegCurStateRef() { return bAnyRegCurStateRef; }
+	bool bAnyRegCurStateRef;
+
+	int partition;
+	bool partitionBoundary;
+
+	RedTrans **inTrans;
+	int numInTrans;
+};
+
+/* List of states. */
+typedef DList<RedState> RedStateList;
+
+/* Set of reduced transitions. Comparison is by pointer. */
+typedef BstSet< RedTrans*, CmpOrd<RedTrans*> > RedTransPtrSet;
+
+/* Next version of the fsm machine. */
+struct RedFsm
+{
+	RedFsm();
+
+	bool wantComplete;
+	bool forcedErrorState;
+
+	int nextActionId;
+	int nextTransId;
+
+	/* Next State Id doubles as the total number of state ids. */
+	int nextStateId;
+
+	RedTransSet transSet;
+	GenActionTableMap actionMap;
+	RedStateList stateList;
+	RedStateSet entryPoints;
+	RedState *startState;
+	RedState *errState;
+	RedTrans *errTrans;
+	RedTrans *errActionTrans;
+	RedState *firstFinState;
+	int numFinStates;
+	int nParts;
+
+	GenAction *allActions;
+	RedAction *allActionTables;
+	Condition *allConditions;
+	GenCondSpace *allCondSpaces;
+	RedState *allStates;
+	GenActionList actionList;
+	ConditionList conditionList;
+	CondSpaceList condSpaceList;
+	EntryIdVect entryPointIds;
+	EntryNameVect entryPointNames;
+	RedEntryMap redEntryMap;
+	RegionToEntry regionToEntry;
+
+	bool bAnyToStateActions;
+	bool bAnyFromStateActions;
+	bool bAnyRegActions;
+	bool bAnyEofActions;
+	bool bAnyActionGotos;
+	bool bAnyActionCalls;
+	bool bAnyActionRets;
+	bool bAnyRegActionRets;
+	bool bAnyRegActionByValControl;
+	bool bAnyRegNextStmt;
+	bool bAnyRegCurStateRef;
+	bool bAnyRegBreak;
+	bool bAnyLmSwitchError;
+	bool bAnyConditions;
+
+	int maxState;
+	int maxSingleLen;
+	int maxRangeLen;
+	int maxKeyOffset;
+	int maxIndexOffset;
+	int maxIndex;
+	int maxActListId;
+	int maxActionLoc;
+	int maxActArrItem;
+	unsigned long long maxSpan;
+	unsigned long long maxCondSpan;
+	int maxFlatIndexOffset;
+	Key maxKey;
+	int maxCondOffset;
+	int maxCondLen;
+	int maxCondSpaceId;
+	int maxCondIndexOffset;
+	int maxCond;
+
+	bool anyActions();
+	bool anyToStateActions()        { return bAnyToStateActions; }
+	bool anyFromStateActions()      { return bAnyFromStateActions; }
+	bool anyRegActions()            { return bAnyRegActions; }
+	bool anyEofActions()            { return bAnyEofActions; }
+	bool anyActionGotos()           { return bAnyActionGotos; }
+	bool anyActionCalls()           { return bAnyActionCalls; }
+	bool anyActionRets()            { return bAnyActionRets; }
+	bool anyRegActionRets()         { return bAnyRegActionRets; }
+	bool anyRegActionByValControl() { return bAnyRegActionByValControl; }
+	bool anyRegNextStmt()           { return bAnyRegNextStmt; }
+	bool anyRegCurStateRef()        { return bAnyRegCurStateRef; }
+	bool anyRegBreak()              { return bAnyRegBreak; }
+	bool anyLmSwitchError()         { return bAnyLmSwitchError; }
+	bool anyConditions()            { return bAnyConditions; }
+
+	GenCondSpace *findCondSpace( Key lowKey, Key highKey );
+	Condition *findCondition( Key key );
+
+	/* Is it possible to extend a range by bumping ranges that span only
+	 * one character to the singles array? */
+	bool canExtend( const RedTransList &list, int pos );
+
+	/* Pick single transitions from the ranges. */
+	void moveTransToSingle( RedState *state );
+	void chooseSingle();
+
+	void makeFlat();
+
+	/* Move a selected transition from ranges to default. */
+	void moveToDefault( RedTrans *defTrans, RedState *state );
+
+	/* Pick a default transition by largest span. */
+	RedTrans *chooseDefaultSpan( RedState *state );
+	void chooseDefaultSpan();
+
+	/* Pick a default transition by most number of ranges. */
+	RedTrans *chooseDefaultNumRanges( RedState *state );
+	void chooseDefaultNumRanges();
+
+	/* Pick a default transition tailored towards goto driven machine. */
+	RedTrans *chooseDefaultGoto( RedState *state );
+	void chooseDefaultGoto();
+
+	/* Ordering states by transition connections. */
+	void optimizeStateOrdering( RedState *state );
+	void optimizeStateOrdering();
+
+	/* Ordering states by transition connections. */
+	void depthFirstOrdering( RedState *state );
+	void depthFirstOrdering();
+
+	/* Set state ids. */
+	void sequentialStateIds();
+	void sortStateIdsByFinal();
+
+	/* Arrange states by final id. This is a stable sort. */
+	void sortStatesByFinal();
+
+	/* Sorting states by id. */
+	void sortByStateId();
+
+	/* Locating the first final state. This is the final state with the lowest
+	 * id. */
+	void findFirstFinState();
+
+	void assignActionLocs();
+
+	RedTrans *getErrorTrans();
+	RedState *getErrorState();
+
+	/* Is every char in the alphabet covered? */
+	bool alphabetCovered( RedTransList &outRange );
+
+	RedTrans *allocateTrans( RedState *targState, RedAction *actionTable );
+
+	void partitionFsm( int nParts );
+
+	void setInTrans();
+	void setValueLimits();
+	void assignActionIds();
+	void analyzeActionList( RedAction *redAct, InlineList *inlineList );
+	void analyzeAction( GenAction *act, InlineList *inlineList );
+	void findFinalActionRefs();
+	void analyzeMachine();
+
+	FsmTables *makeFsmTables();
+};
+
+
+#endif /* _REDFSM_H */
diff --git a/colm/string.cpp b/colm/string.cpp
new file mode 100644
index 00000000..84500f92
--- /dev/null
+++ b/colm/string.cpp
@@ -0,0 +1,177 @@
+/*
+ *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "pdarun.h"
+#include "bytecode.h"
+#include <assert.h>
+#include <string.h>
+#include <string>
+Head *string_copy( Program *prg, Head *head )
+{
+	/* Copying a null string gives a null string. */
+	if ( head == 0 )
+		return 0;
+	/* Data sitting right behind the head is owned by the string and gets
+	 * duplicated; anything else is referenced as constant data again. */
+	bool ownsData = (char*)(head+1) == head->data;
+	return ownsData ? string_alloc_new( prg, head->data, head->length )
+			: string_alloc_const( prg, head->data, head->length );
+}
+
+void string_free( Program *prg, Head *head )
+{
+	/* Nothing to release for a null string. */
+	if ( head == 0 )
+		return;
+
+	/* A head followed directly by its data came from malloc as a single
+	 * block. Otherwise only the head exists and it goes to the kid pool. */
+	if ( (char*)(head+1) != head->data )
+		prg->kidPool.free( (Kid*)head );
+	else
+		free( head );
+}
+
+const char *string_data( Head *head )
+{
+	/* A null head stands for a string without data. */
+	const char *data = ( head != 0 ) ? head->data : 0;
+	return data;
+}
+
+long string_length( Head *head )
+{
+	/* A null head counts as length zero. */
+	long length = ( head != 0 ) ? head->length : 0;
+	return length;
+}
+
+void string_shorten( Head *head, long newlen )
+{
+	assert( newlen <= head->length );
+	head->length = newlen;
+}
+
+Head *init_str_space( long length )
+{
+	/* One malloc block holds the head followed by length bytes of data. */
+	Head *head = (Head*) malloc( sizeof(Head) + length );
+	if ( head == 0 )
+		throw std::bad_alloc();
+
+	/* Init the header; data points just past the head. */
+	head->data = (char*)(head+1);
+	head->length = length;
+
+	/* The data bytes are left uninitialized for the caller to fill. */
+	return head;
+}
+
+/* Create from a c-style string. */
+Head *string_alloc_new( Program *prg, const char *data, long length )
+{
+	/* Init space for the data. */
+	Head *head = init_str_space( length );
+
+	/* Copy in the data. */
+	memcpy( (head+1), data, length );
+
+	return head;
+}
+
+/* Create a string that references data without copying it. */
+Head *string_alloc_const( Program *prg, const char *data, long length )
+{
+	/* Only a head is needed; it is taken from the kid pool. */
+	Head *head = (Head*) prg->kidPool.allocate();
+
+	/* Init the header. The data pointer is stored as is. */
+	head->data = data;
+	head->length = length;
+
+	return head;
+}
+
+Head *concat_str( Head *s1, Head *s2 )
+{
+	const long firstLen = s1->length;
+	const long secondLen = s2->length;
+
+	/* One allocation sized for both strings back to back. */
+	Head *joined = init_str_space( firstLen + secondLen );
+	char *dest = (char*)(joined+1);
+
+	/* The first string's bytes, then the second's right behind them. */
+	memcpy( dest, s1->data, firstLen );
+	memcpy( dest + firstLen, s2->data, secondLen );
+	return joined;
+}
+
+/* Compare two strings: by length first, then memcmp. Returns 0 if identical. */
+Word cmp_string( Head *s1, Head *s2 )
+{
+	if ( s1->length < s2->length )
+		return -1;
+	else if ( s1->length > s2->length )
+		return 1;
+	else {
+		char *d1 = (char*)(s1->data);
+		char *d2 = (char*)(s2->data);
+		return memcmp( d1, d2, s1->length );
+	}
+}
+
+Word str_atoi( Head *str )
+{
+	/* The data has no null terminator, so atoi gets a terminated copy. */
+	return atoi( std::string( str->data, str->length ).c_str() );
+}
+
+Head *int_to_str( Program *prg, Word i )
+{
+	char data[32]; /* Room for a 64-bit value with sign and terminator. */
+	snprintf( data, sizeof(data), "%ld", i );
+	return string_alloc_new( prg, data, strlen(data) );
+}
+
+Word str_uord16( Head *head )
+{
+	/* Big-endian decode: byte 0 is the high byte, byte 1 the low byte. */
+	uchar *bytes = (uchar*)(head->data);
+	ulong high = (ulong)bytes[0];
+	ulong low = (ulong)bytes[1];
+	return ( high << 8 ) | low;
+}
+
+Word str_uord8( Head *head )
+{
+	uchar *data = (uchar*)(head->data);
+	ulong res = (ulong)data[0];
+	return res;
+}
+
+Head *make_literal( Program *prg, long offset )
+{
+	return string_alloc_const( prg,
+			prg->rtd->litdata[offset],
+			prg->rtd->litlen[offset] );
+}
+
diff --git a/colm/tree.cpp b/colm/tree.cpp
new file mode 100644
index 00000000..f7f83c26
--- /dev/null
+++ b/colm/tree.cpp
@@ -0,0 +1,160 @@
+/*
+ *  Copyright 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "bytecode.h"
+#include "pdarun.h"
+#include "dlistval.h"
+#include "fsmrun.h"
+#include "pdarun.h"
+
+void tree_free( Program *prg, Tree *tree )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	long genericId = lelInfo[tree->id].genericId;
+	if ( genericId > 0 ) {
+		GenericInfo *generic = &prg->rtd->genericInfo[genericId];
+		if ( generic->type == GEN_LIST )
+			list_free( prg, (List*)tree );
+		else if ( generic->type == GEN_MAP )
+			map_free( prg, (Map*)tree );
+		else
+			assert(false);
+	}
+	else {
+		if ( tree->id == LEL_ID_STR ) {
+			Str *str = (Str*) tree;
+			string_free( prg, str->value );
+			prg->treePool.free( tree );
+		}
+		else if ( tree->id == LEL_ID_BOOL || tree->id == LEL_ID_INT )
+			prg->treePool.free( tree );
+		else if ( tree->id == LEL_ID_PTR ) {
+			//Pointer *ptr = (Pointer*)tree;
+			//tree_downref( prg, ptr->value->tree );
+			//prg->kidPool.free( ptr->value );
+			prg->treePool.free( tree );
+		}
+		else if ( tree->id == LEL_ID_STREAM )
+			stream_free( prg, (Stream*) tree );
+		else { 
+			if ( tree->alg != 0 ) {
+				//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
+				tree_downref( prg, tree->alg->parsed );
+				prg->algPool.free( tree->alg );
+			}
+			string_free( prg, tree->tokdata );
+
+			Kid *child = tree->child;
+			while ( child != 0 ) {
+				Kid *next = child->next;
+				tree_downref( prg, child->tree );
+				prg->kidPool.free( child );
+				child = next;
+			}
+
+			prg->treePool.free( tree );
+		}
+	}
+}
+
+void tree_upref( Tree *tree )
+{
+	if ( tree != 0 )
+		tree->refs += 1; /* A null tree is ignored. */
+}
+
+void tree_downref( Program *prg, Tree *tree )
+{
+	if ( tree != 0 ) {
+		/* Dropping a reference that was never taken is a caller bug. */
+		assert( tree->refs > 0 );
+		if ( --tree->refs == 0 )
+			tree_free( prg, tree ); /* Last reference gone. */
+	}
+}
+
+/* Find the first child of a tree. */
+Kid *tree_child( Program *prg, Tree *tree )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	Kid *kid = tree->child;
+
+	/* Skip over attributes. */
+	long objectLength = lelInfo[tree->id].objectLength;
+	for ( long a = 0; a < objectLength; a++ )
+		kid = kid->next;
+
+	/* Skip over ignore tokens. */
+	while ( kid != 0 && lelInfo[kid->tree->id].ignore )
+		kid = kid->next;
+	return kid;
+}
+
+/* Detach and return the first child of a tree, cutting the list before it. */
+Kid *tree_extract_child( Program *prg, Tree *tree )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	Kid *kid = tree->child, *last = 0;
+
+	/* Skip over attributes. */
+	long objectLength = lelInfo[tree->id].objectLength;
+	for ( long a = 0; a < objectLength; a++ ) {
+		last = kid;
+		kid = kid->next;
+	}
+
+	/* Skip over ignore tokens. */
+	while ( kid != 0 && lelInfo[kid->tree->id].ignore ) {
+		last = kid;
+		kid = kid->next;
+	}
+
+	if ( last == 0 )
+		tree->child = 0;
+	else
+		last->next = 0;
+
+	return kid;
+}
+
+
+Kid *tree_ignore( Program *prg, Tree *tree )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+
+	/* The attributes lead the child list; step past all of them. */
+	Kid *kid = tree->child;
+	long remaining = lelInfo[tree->id].objectLength;
+	while ( remaining-- > 0 )
+		kid = kid->next;
+
+	/* What follows counts only if it is an ignore token. */
+	if ( kid == 0 || !lelInfo[kid->tree->id].ignore )
+		return 0;
+	return kid;
+}
+
+bool tree_is_ignore( Program *prg, Kid *kid )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	return kid != 0 && lelInfo[kid->tree->id].ignore;
+}
+
diff --git a/common/Makefile.in b/common/Makefile.in
new file mode 100644
index 00000000..47dc3567
--- /dev/null
+++ b/common/Makefile.in
@@ -0,0 +1,67 @@
+#
+#   Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+INCS += 
+DEFS +=
+
+CFLAGS += -g -Wall
+LDFLAGS +=
+
+CC_SRCS = common.cpp
+
+GEN_SRC = version.h
+
+#*************************************
+
+# Programs
+CXX = @CXX@
+
+# Get objects and dependencies from sources.
+OBJS = $(CC_SRCS:%.cpp=%.o)
+DEPS = $(CC_SRCS:%.cpp=.%.d)
+
+# Get the version info.
+include ../version.mk
+
+# rules
+
+all: common.a
+
+common.a: $(GEN_SRC) $(OBJS)
+	ar -cr $@ $(OBJS) 
+
+version.h: ../version.mk
+	echo '#define VERSION "$(VERSION)"' > version.h
+	echo '#define PUBDATE "$(PUBDATE)"' >> version.h
+
+%.o: %.cpp
+	@$(CXX) -M $(DEFS) $(INCS) $< > .$*.d
+	$(CXX) -c $(CFLAGS) $(DEFS) $(INCS) -o $@ $<
+
+distclean: clean
+	rm -f Makefile config.h
+
+clean:
+	rm -f tags version.h .*.d *.o common.a
+
+install:
+	@true
+
+-include $(DEPS)
diff --git a/common/buffer.h b/common/buffer.h
new file mode 100644
index 00000000..99c4e82d
--- /dev/null
+++ b/common/buffer.h
@@ -0,0 +1,55 @@
+/*
+ *  Copyright 2003 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _BUFFER_H
+#define _BUFFER_H
+
+#define BUFFER_INITIAL_SIZE 4096
+
+/* An automatically grown buffer for collecting tokens. Always reuses space;
+ * never down resizes. Aborts when memory for the data cannot be obtained. */
+struct Buffer
+{
+	Buffer()
+		: data( (char*) malloc( BUFFER_INITIAL_SIZE ) ),
+		allocated( BUFFER_INITIAL_SIZE ), length( 0 )
+		{ if ( data == 0 ) abort(); }
+	~Buffer() { free(data); }
+
+	void append( char p )
+	{
+		if ( length == allocated ) {
+			allocated *= 2;
+			data = (char*) realloc( data, allocated );
+			if ( data == 0 )
+				abort(); /* Out of memory: writing through null is worse. */
+		}
+		data[length++] = p;
+	}
+
+	void clear() { length = 0; }
+
+	char *data;
+	int allocated;
+	int length;
+};
+
+#endif /* _BUFFER_H */
diff --git a/common/common.cpp b/common/common.cpp
new file mode 100644
index 00000000..e6b0a70b
--- /dev/null
+++ b/common/common.cpp
@@ -0,0 +1,257 @@
+/*
+ *  Copyright 2006-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "pcheck.h"
+#include "common.h"
+#include <assert.h>
+
+HostType hostTypesC[] =
+{
+	{ "char",     0,       true,   CHAR_MIN,  CHAR_MAX,   sizeof(char) },
+	{ "unsigned", "char",  false,  0,         UCHAR_MAX,  sizeof(unsigned char) },
+	{ "short",    0,       true,   SHRT_MIN,  SHRT_MAX,   sizeof(short) },
+	{ "unsigned", "short", false,  0,         USHRT_MAX,  sizeof(unsigned short) },
+	{ "int",      0,       true,   INT_MIN,   INT_MAX,    sizeof(int) },
+	{ "unsigned", "int",   false,  0,         UINT_MAX,   sizeof(unsigned int) },
+	{ "long",     0,       true,   LONG_MIN,  LONG_MAX,   sizeof(long) },
+	{ "unsigned", "long",  false,  0,         ULONG_MAX,  sizeof(unsigned long) }
+};
+
+HostType hostTypesD[] =
+{
+	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
+	{ "ubyte",    0,  false,  0,         UCHAR_MAX,   1 },
+	{ "char",     0,  false,  0,         UCHAR_MAX,   1 },
+	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
+	{ "ushort",   0,  false,  0,         USHRT_MAX,   2 },
+	{ "wchar",    0,  false,  0,         USHRT_MAX,   2 },
+	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
+	{ "uint",     0,  false,  0,         UINT_MAX,    4 },
+	{ "dchar",    0,  false,  0,         UINT_MAX,    4 }
+};
+
+HostType hostTypesJava[] = 
+{
+	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
+	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
+	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
+	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
+};
+
+HostType hostTypesRuby[] = 
+{
+	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
+	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
+	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
+	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
+};
+
+HostLang hostLangC =    { hostTypesC,    8, hostTypesC+0,    true };
+HostLang hostLangD =    { hostTypesD,    9, hostTypesD+2,    true };
+HostLang hostLangJava = { hostTypesJava, 4, hostTypesJava+2, false };
+HostLang hostLangRuby = { hostTypesRuby, 4, hostTypesRuby+2, false };
+
+HostLang *hostLang = &hostLangC;
+HostLangType hostLangType = CCode;
+
+/* Construct a new parameter checker for paramSpec. */
+ParamCheck::ParamCheck( const char *paramSpec, int argc,  const char **argv )
+:
+	state(noparam),
+	argOffset(0),
+	curArg(0),
+	iCurArg(1),
+	paramSpec(paramSpec), 
+	argc(argc), 
+	argv(argv)
+{
+}
+
+/* Check a single option. Returns false once the arg list is exhausted, true
+ * otherwise. Sets state to match, invalid or noparam, parameter to the option
+ * character (0 for a non-option arg) and parameterArg to its argument or 0. */
+bool ParamCheck::check()
+{
+	bool requiresParam;
+
+	if ( iCurArg >= argc ) {            /* Off the end of the arg list. */
+		state = noparam;
+		return false;
+	}
+
+	if ( argOffset != 0 && *argOffset == 0 ) {
+		/* We are at the end of an arg string. */
+		iCurArg += 1;
+		if ( iCurArg >= argc ) {
+			state = noparam;
+			return false;
+		}
+		argOffset = 0;
+	}
+
+	if ( argOffset == 0 ) {
+		/* Set the current arg. */
+		curArg = argv[iCurArg];
+
+		/* We are at the beginning of an arg string. */
+		if ( argv[iCurArg] == 0 ||        /* Argv[iCurArg] is null. */
+			 argv[iCurArg][0] != '-' ||   /* Not a param. */
+			 argv[iCurArg][1] == 0 ) {    /* Only a dash. */
+			parameter = 0;
+			parameterArg = 0;
+
+			iCurArg += 1;
+			state = noparam;
+			return true;
+		}
+		argOffset = argv[iCurArg] + 1;
+	}
+
+	/* Get the arg char. */
+	char argChar = *argOffset;
+	
+	/* Loop over all the parms and look for a match. */
+	const char *pSpec = paramSpec;
+	while ( *pSpec != 0 ) {
+		char pSpecChar = *pSpec;
+
+		/* If there is a ':' following the char then
+		 * it requires a parm.  If a parm is required
+		 * then move ahead two in the parmspec. Otherwise
+		 * move ahead one in the parm spec. */
+		if ( pSpec[1] == ':' ) {
+			requiresParam = true;
+			pSpec += 2;
+		}
+		else {
+			requiresParam = false;
+			pSpec += 1;
+		}
+
+		/* Do we have a match. */
+		if ( argChar == pSpecChar ) {
+			if ( requiresParam ) {
+				if ( argOffset[1] == 0 ) {
+					/* The param must follow. */
+					if ( iCurArg + 1 == argc ) {
+						/* We are the last arg so there
+						 * cannot be a parameter to it. */
+						parameter = argChar;
+						parameterArg = 0;
+						iCurArg += 1;
+						argOffset = 0;
+						state = invalid;
+						return true;
+					}
+					else {
+						/* the parameter to the arg is the next arg. */
+						parameter = pSpecChar;
+						parameterArg = argv[iCurArg + 1];
+						iCurArg += 2;
+						argOffset = 0;
+						state = match;
+						return true;
+					}
+				}
+				else {
+					/* The param for the arg is built in. */
+					parameter = pSpecChar;
+					parameterArg = argOffset + 1;
+					iCurArg += 1;
+					argOffset = 0;
+					state = match;
+					return true;
+				}
+			}
+			else {
+				/* Good, we matched the parm and no
+				 * arg is required. */
+				parameter = pSpecChar;
+				parameterArg = 0;
+				argOffset += 1;
+				state = match;
+				return true;
+			}
+		}
+	}
+
+	/* We did not find a match. Bad Argument. */
+	parameter = argChar;
+	parameterArg = 0;
+	argOffset += 1;
+	state = invalid;
+	return true;
+}
+
+/* Scans a string looking for the file extension. If there is a file
+ * extension then the pointer returned points at its dot, inside the string
+ * passed in. Otherwise returns null.
+ *
+ * There is no extension when the string has no dot (this includes the empty
+ * string), when the last dot is the very first character of the string, or
+ * when a '/' follows the last dot, in which case the dot belongs to a
+ * directory name. */
+const char *findFileExtension( const char *stemFile )
+{
+	/* The extension, if any, begins at the last dot in the string. */
+	const char *dot = strrchr( stemFile, '.' );
+
+	/* No dot at all. Searching with strrchr rather than walking back from
+	 * strlen - 1 keeps the empty string from being read before its first
+	 * byte. */
+	if ( dot == 0 )
+		return 0;
+
+	/* A dot in the very first position does not start an extension. */
+	if ( dot == stemFile )
+		return 0;
+
+	/* A slash after the dot means the dot is in the directory part. Only
+	 * the text following the dot needs to be searched for it. */
+	if ( strchr( dot, '/' ) != 0 )
+		return 0;
+
+	return dot;
+}
+
+/* Builds a file name out of a stem and a suffix. An extension already on the
+ * stem is dropped first. The result is allocated with new[]. */
+char *fileNameFromStem( const char *stemFile, const char *suffix )
+{
+	int stemLen = strlen( stemFile );
+	assert( stemLen > 0 );
+
+	/* Keep only what precedes the extension, when the stem has one. */
+	const char *ext = findFileExtension( stemFile );
+	if ( ext != 0 )
+		stemLen = ext - stemFile;
+
+	/* Room for the kept part of the stem, the suffix and the terminator. */
+	char *fileName = new char[ stemLen + strlen( suffix ) + 1 ];
+
+	/* The stem part is copied without a terminator; copying the suffix
+	 * with strcpy supplies it. */
+	memcpy( fileName, stemFile, stemLen );
+	strcpy( fileName + stemLen, suffix );
+	return fileName;
+}
+
+
diff --git a/common/common.h b/common/common.h
new file mode 100644
index 00000000..53ce443d
--- /dev/null
+++ b/common/common.h
@@ -0,0 +1,283 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _COMMON_H
+#define _COMMON_H
+
+#include <fstream>
+#include <climits>
+
+enum MarkType	/* NOTE(review): used outside this header; presumably tags entry vs. exit marks. */
+{
+	MarkEnter,
+	MarkLeave
+};
+
+typedef unsigned long long Size;
+
+struct Key	/* An alphabet key stored as a raw long. */
+{
+private:
+	long key;	/* Raw value; its ordering depends on keyOps->isSigned. */
+
+public:
+	friend inline Key operator+(const Key key1, const Key key2);
+	friend inline Key operator-(const Key key1, const Key key2);
+	friend inline Key operator/(const Key key1, const Key key2);
+	friend inline long operator&(const Key key1, const Key key2);
+
+	friend inline bool operator<( const Key key1, const Key key2 );
+	friend inline bool operator<=( const Key key1, const Key key2 );
+	friend inline bool operator>( const Key key1, const Key key2 );
+	friend inline bool operator>=( const Key key1, const Key key2 );
+	friend inline bool operator==( const Key key1, const Key key2 );
+	friend inline bool operator!=( const Key key1, const Key key2 );
+
+	friend struct KeyOps;
+	
+	Key( ) {}	/* Leaves key uninitialized. */
+	Key( const Key &key ) : key(key.key) {}
+	Key( long key ) : key(key) {}
+
+	/* Returns the value used to represent the key. This value must be
+	 * interpreted based on signedness. */
+	long getVal() const { return key; };
+
+	/* Returns the key cast to a long long. This form of the key does not
+	 * require any signedness interpretation. */
+	long long getLongLong() const;
+
+	bool isUpper() const { return ( 'A' <= key && key <= 'Z' ); }
+	bool isLower() const { return ( 'a' <= key && key <= 'z' ); }
+	bool isPrintable() const { return ( 32 <= key && key < 127 ); }	/* space through '~' */
+
+	Key toUpper() const	/* Applies the 'a' to 'A' offset without checking isLower(). */
+		{ return Key( 'A' + ( key - 'a' ) ); }
+	Key toLower() const	/* Applies the 'A' to 'a' offset without checking isUpper(). */
+		{ return Key( 'a' + ( key - 'A' ) ); }
+
+	void operator+=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key += other.key;
+	}
+
+	void operator-=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key -= other.key;
+	}
+
+	void operator|=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key |= other.key;
+	}
+
+	/* Step the key down or up by one, honouring keyOps->isSigned. Needed only for ranges. */
+	inline void decrement();
+	inline void increment();
+};
+
+struct HostType	/* One entry of a HostLang's hostTypes table. */
+{
+	char *data1;	/* NOTE(review): presumably the type name; not used in this header. */
+	char *data2;	/* NOTE(review): presumably a second word of the name; confirm. */
+	bool isSigned;	/* Copied into KeyOps::isSigned by setAlphType(). */
+	long long minVal;	/* Lower limit; becomes KeyOps::minKey. */
+	long long maxVal;	/* Upper limit; becomes KeyOps::maxKey. */
+	unsigned int size;	/* NOTE(review): presumably the size in bytes; confirm. */
+};
+
+struct HostLang	/* The set of host types one target language offers. */
+{
+	HostType *hostTypes;	/* Array scanned in order by KeyOps::typeSubsumes(). */
+	int numHostTypes;	/* Number of entries in hostTypes. */
+	HostType *defaultAlphType;	/* NOTE(review): presumably the alphabet type used when none is chosen; confirm. */
+	bool explicitUnsigned;	/* NOTE(review): meaning is not visible in this header; confirm. */
+};
+
+
+/* Target language. One value per hostLang* table declared below. */
+enum HostLangType
+{
+	CCode,
+	DCode,
+	JavaCode,
+	RubyCode
+};
+
+extern HostLang *hostLang;
+extern HostLangType hostLangType;
+
+extern HostLang hostLangC;
+extern HostLang hostLangD;
+extern HostLang hostLangJava;
+extern HostLang hostLangRuby;
+
+/* An abstraction of the key operators that manages key operations such as
+ * comparison and increment according to the signedness of the key. */
+struct KeyOps
+{
+	/* Default to a signed alphabet with no host type selected. */
+	KeyOps() : isSigned(true), alphType(0) {}
+
+	/* Use the given signedness; alphType starts out null here too. */
+	KeyOps( bool isSigned ) : isSigned(isSigned), alphType(0) {}
+
+	bool isSigned;		/* How Key values are compared and stepped. */
+	Key minKey, maxKey;	/* Alphabet bounds; assigned by setAlphType(). */
+	HostType *alphType;	/* Current alphabet type, null until one is set. */
+
+	/* Adopt alphType as the alphabet: take its signedness and its limits. */
+	void setAlphType( HostType *alphType )
+	{
+		this->alphType = alphType;
+		isSigned = alphType->isSigned;
+		if ( isSigned ) {
+			minKey = (long) alphType->minVal;
+			maxKey = (long) alphType->maxVal;
+		}
+		else {
+			minKey = (long) (unsigned long) alphType->minVal;
+			maxKey = (long) (unsigned long) alphType->maxVal;
+		}
+	}
+
+	/* Compute the number of keys in the range key1..key2, ends included.
+	 * The subtraction is done on unsigned values so it cannot overflow. */
+	Size span( Key key1, Key key2 )
+	{
+		if ( isSigned ) {
+			return (unsigned long long)(long long)key2.key -
+				(unsigned long long)(long long)key1.key + 1;
+		}
+		return (unsigned long long)(unsigned long)key2.key -
+			(unsigned long long)(unsigned long)key1.key + 1;
+	}
+
+	/* Number of keys in the whole alphabet. */
+	Size alphSize()
+		{ return span( minKey, maxKey ); }
+
+	/* First host type whose maxVal can hold maxVal, or null if none. */
+	HostType *typeSubsumes( long long maxVal )
+	{
+		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
+			if ( maxVal <= hostLang->hostTypes[i].maxVal )
+				return hostLang->hostTypes + i;
+		}
+		return 0;
+	}
+
+	/* Same, but when isSigned is set only signed host types qualify. */
+	HostType *typeSubsumes( bool isSigned, long long maxVal )
+	{
+		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
+			if ( ( !isSigned || hostLang->hostTypes[i].isSigned ) &&
+					maxVal <= hostLang->hostTypes[i].maxVal )
+				return hostLang->hostTypes + i;
+		}
+		return 0;
+	}
+};
+
+extern KeyOps *keyOps;
+
+inline bool operator<( const Key key1, const Key key2 )
+{
+	const unsigned long raw1 = key1.key, raw2 = key2.key;	/* unsigned view */
+	return keyOps->isSigned ? key1.key < key2.key : raw1 < raw2;
+}
+
+inline bool operator<=( const Key key1, const Key key2 )
+{
+	const unsigned long raw1 = key1.key, raw2 = key2.key;	/* unsigned view */
+	return keyOps->isSigned ? key1.key <= key2.key : raw1 <= raw2;
+}
+
+inline bool operator>( const Key key1, const Key key2 )
+{
+	const unsigned long raw1 = key1.key, raw2 = key2.key;	/* unsigned view */
+	return keyOps->isSigned ? key1.key > key2.key : raw1 > raw2;
+}
+
+inline bool operator>=( const Key key1, const Key key2 )
+{
+	const unsigned long raw1 = key1.key, raw2 = key2.key;	/* unsigned view */
+	return keyOps->isSigned ? key1.key >= key2.key : raw1 >= raw2;
+}
+
+inline bool operator==( const Key key1, const Key key2 )
+{
+	return key1.key == key2.key;	/* Same stored value; signedness plays no part. */
+}
+
+inline bool operator!=( const Key key1, const Key key2 )
+{
+	return key1.key != key2.key;	/* Differing stored value; signedness plays no part. */
+}
+
+/* Step the key down by one, as a long or as an unsigned long. Needed only for ranges. */
+inline void Key::decrement()
+{
+	key = keyOps->isSigned ? key - 1 : (long)( (unsigned long)key - 1 );
+}
+
+/* Step the key up by one, as a long or as an unsigned long. Needed only for ranges. */
+inline void Key::increment()
+{
+	key = keyOps->isSigned ? key + 1 : (long)( (unsigned long)key + 1 );
+}
+
+inline long long Key::getLongLong() const
+{
+	if ( keyOps->isSigned ) return key;	/* widened as a signed value */
+	return (unsigned long)key;	/* widened from the unsigned view */
+}
+
+inline Key operator+(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. For now this adds the raw longs. */
+	return Key( key1.key + key2.key );
+}
+
+inline Key operator-(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. For now this subtracts the raw longs. */
+	return Key( key1.key - key2.key );
+}
+
+inline long operator&(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. Returns the bitwise AND as a plain long, not a Key. */
+	return key1.key & key2.key;
+}
+
+inline Key operator/(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. For now this is signed long division; a zero key2 is not checked. */
+	return key1.key / key2.key;
+}
+
+const char *findFileExtension( const char *stemFile );
+char *fileNameFromStem( const char *stemFile, const char *suffix );
+
+#endif /* _COMMON_H */
diff --git a/common/config.h.in b/common/config.h.in
new file mode 100644
index 00000000..c370f3b6
--- /dev/null
+++ b/common/config.h.in
@@ -0,0 +1,50 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _CONFIG_H
+#define _CONFIG_H
+
+/* Programs. */
+#undef GDC
+#undef GOBJC
+#undef CXX
+#undef CC
+#undef JAVAC
+#undef TXL
+#undef RUBY
+
+/* Configuration */
+#undef COLM_LOG
+#undef COLM_LOG_BYTECODE
+#undef COLM_LOG_PARSE
+#undef COLM_LOG_MATCH
+#undef COLM_LOG_COMPILE
+
+/* If COLM_LOG is defined then turn on all logging options. */
+#ifdef COLM_LOG
+#define COLM_LOG_BYTECODE 1
+#define COLM_LOG_PARSE 1
+#define COLM_LOG_MATCH 1
+#define COLM_LOG_COMPILE 1
+#endif
+
+
+#endif /* _CONFIG_H */
diff --git a/common/pcheck.h b/common/pcheck.h
new file mode 100644
index 00000000..df3706c2
--- /dev/null
+++ b/common/pcheck.h
@@ -0,0 +1,48 @@
+/*
+ *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _PCHECK_H
+#define _PCHECK_H
+
+class ParamCheck	/* Matches command-line args against a parameter spec. */
+{
+public:
+	ParamCheck( const char *paramSpec, int argc, const char **argv );
+
+	bool check();	/* Records its outcome in parameter, parameterArg and state. */
+
+	const char *parameterArg; /* The argument to the parameter. */
+	char parameter;     /* The parameter matched. */
+	enum { match, invalid, noparam } state;	/* Set by check(). */
+
+	const char *argOffset;    /* If we are reading params inside an
+	                     * arg this points to the offset. */
+
+	const char *curArg;       /* Pointer to the current arg. */
+	int iCurArg;        /* Index to the current arg. */
+
+private:
+	const char *paramSpec;    /* Parameter spec supplied by the coder. */
+	int argc;           /* Argument data from the command line. */
+	const char **argv;
+};
+
+#endif /* _PCHECK_H */
diff --git a/configure b/configure
new file mode 100755
index 00000000..be493813
--- /dev/null
+++ b/configure
@@ -0,0 +1,4222 @@
+#! /bin/sh
+# Guess values for system-dependent variables and create Makefiles.
+# Generated by GNU Autoconf 2.61.
+#
+# Copyright (C) 1992, 1993, 1994, 1995, 1996, 1998, 1999, 2000, 2001,
+# 2002, 2003, 2004, 2005, 2006 Free Software Foundation, Inc.
+# This configure script is free software; the Free Software Foundation
+# gives unlimited permission to copy, distribute and modify it.
+## --------------------- ##
+## M4sh Initialization.  ##
+## --------------------- ##
+
+# Be more Bourne compatible
+DUALCASE=1; export DUALCASE # for MKS sh
+if test -n "${ZSH_VERSION+set}" && (emulate sh) >/dev/null 2>&1; then
+  emulate sh
+  NULLCMD=:
+  # Zsh 3.x and 4.x performs word splitting on ${1+"$@"}, which
+  # is contrary to our usage.  Disable this feature.
+  alias -g '${1+"$@"}'='"$@"'
+  setopt NO_GLOB_SUBST
+else
+  case `(set -o) 2>/dev/null` in
+  *posix*) set -o posix ;;
+esac
+
+fi
+
+
+
+
+# PATH needs CR
+# Avoid depending upon Character Ranges.
+as_cr_letters='abcdefghijklmnopqrstuvwxyz'
+as_cr_LETTERS='ABCDEFGHIJKLMNOPQRSTUVWXYZ'
+as_cr_Letters=$as_cr_letters$as_cr_LETTERS
+as_cr_digits='0123456789'
+as_cr_alnum=$as_cr_Letters$as_cr_digits
+
+# The user is always right.
+if test "${PATH_SEPARATOR+set}" != set; then
+  echo "#! /bin/sh" >conf$$.sh
+  echo  "exit 0"   >>conf$$.sh
+  chmod +x conf$$.sh
+  if (PATH="/nonexistent;."; conf$$.sh) >/dev/null 2>&1; then
+    PATH_SEPARATOR=';'
+  else
+    PATH_SEPARATOR=:
+  fi
+  rm -f conf$$.sh
+fi
+
+# Support unset when possible.
+if ( (MAIL=60; unset MAIL) || exit) >/dev/null 2>&1; then
+  as_unset=unset
+else
+  as_unset=false
+fi
+
+
+# IFS
+# We need space, tab and new line, in precisely that order.  Quoting is
+# there to prevent editors from complaining about space-tab.
+# (If _AS_PATH_WALK were called with IFS unset, it would disable word
+# splitting by setting IFS to empty value.)
+as_nl='
+'
+IFS=" ""	$as_nl"
+
+# Find who we are.  Look in the path if we contain no directory separator.
+case $0 in
+  *[\\/]* ) as_myself=$0 ;;
+  *) as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  test -r "$as_dir/$0" && as_myself=$as_dir/$0 && break
+done
+IFS=$as_save_IFS
+
+     ;;
+esac
+# We did not find ourselves, most probably we were run as `sh COMMAND'
+# in which case we are not to be found in the path.
+if test "x$as_myself" = x; then
+  as_myself=$0
+fi
+if test ! -f "$as_myself"; then
+  echo "$as_myself: error: cannot find myself; rerun with an absolute file name" >&2
+  { (exit 1); exit 1; }
+fi
+
+# Work around bugs in pre-3.0 UWIN ksh.
+for as_var in ENV MAIL MAILPATH
+do ($as_unset $as_var) >/dev/null 2>&1 && $as_unset $as_var
+done
+PS1='$ '
+PS2='> '
+PS4='+ '
+
+# NLS nuisances.
+for as_var in \
+  LANG LANGUAGE LC_ADDRESS LC_ALL LC_COLLATE LC_CTYPE LC_IDENTIFICATION \
+  LC_MEASUREMENT LC_MESSAGES LC_MONETARY LC_NAME LC_NUMERIC LC_PAPER \
+  LC_TELEPHONE LC_TIME
+do
+  if (set +x; test -z "`(eval $as_var=C; export $as_var) 2>&1`"); then
+    eval $as_var=C; export $as_var
+  else
+    ($as_unset $as_var) >/dev/null 2>&1 && $as_unset $as_var
+  fi
+done
+
+# Required to use basename.
+if expr a : '\(a\)' >/dev/null 2>&1 &&
+   test "X`expr 00001 : '.*\(...\)'`" = X001; then
+  as_expr=expr
+else
+  as_expr=false
+fi
+
+if (basename -- /) >/dev/null 2>&1 && test "X`basename -- / 2>&1`" = "X/"; then
+  as_basename=basename
+else
+  as_basename=false
+fi
+
+
+# Name of the executable.
+as_me=`$as_basename -- "$0" ||
+$as_expr X/"$0" : '.*/\([^/][^/]*\)/*$' \| \
+	 X"$0" : 'X\(//\)$' \| \
+	 X"$0" : 'X\(/\)' \| . 2>/dev/null ||
+echo X/"$0" |
+    sed '/^.*\/\([^/][^/]*\)\/*$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\/\(\/\/\)$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\/\(\/\).*/{
+	    s//\1/
+	    q
+	  }
+	  s/.*/./; q'`
+
+# CDPATH.
+$as_unset CDPATH
+
+
+if test "x$CONFIG_SHELL" = x; then
+  if (eval ":") 2>/dev/null; then
+  as_have_required=yes
+else
+  as_have_required=no
+fi
+
+  if test $as_have_required = yes && 	 (eval ":
+(as_func_return () {
+  (exit \$1)
+}
+as_func_success () {
+  as_func_return 0
+}
+as_func_failure () {
+  as_func_return 1
+}
+as_func_ret_success () {
+  return 0
+}
+as_func_ret_failure () {
+  return 1
+}
+
+exitcode=0
+if as_func_success; then
+  :
+else
+  exitcode=1
+  echo as_func_success failed.
+fi
+
+if as_func_failure; then
+  exitcode=1
+  echo as_func_failure succeeded.
+fi
+
+if as_func_ret_success; then
+  :
+else
+  exitcode=1
+  echo as_func_ret_success failed.
+fi
+
+if as_func_ret_failure; then
+  exitcode=1
+  echo as_func_ret_failure succeeded.
+fi
+
+if ( set x; as_func_ret_success y && test x = \"\$1\" ); then
+  :
+else
+  exitcode=1
+  echo positional parameters were not saved.
+fi
+
+test \$exitcode = 0) || { (exit 1); exit 1; }
+
+(
+  as_lineno_1=\$LINENO
+  as_lineno_2=\$LINENO
+  test \"x\$as_lineno_1\" != \"x\$as_lineno_2\" &&
+  test \"x\`expr \$as_lineno_1 + 1\`\" = \"x\$as_lineno_2\") || { (exit 1); exit 1; }
+") 2> /dev/null; then
+  :
+else
+  as_candidate_shells=
+    as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in /bin$PATH_SEPARATOR/usr/bin$PATH_SEPARATOR$PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  case $as_dir in
+	 /*)
+	   for as_base in sh bash ksh sh5; do
+	     as_candidate_shells="$as_candidate_shells $as_dir/$as_base"
+	   done;;
+       esac
+done
+IFS=$as_save_IFS
+
+
+      for as_shell in $as_candidate_shells $SHELL; do
+	 # Try only shells that exist, to save several forks.
+	 if { test -f "$as_shell" || test -f "$as_shell.exe"; } &&
+		{ ("$as_shell") 2> /dev/null <<\_ASEOF
+if test -n "${ZSH_VERSION+set}" && (emulate sh) >/dev/null 2>&1; then
+  emulate sh
+  NULLCMD=:
+  # Zsh 3.x and 4.x performs word splitting on ${1+"$@"}, which
+  # is contrary to our usage.  Disable this feature.
+  alias -g '${1+"$@"}'='"$@"'
+  setopt NO_GLOB_SUBST
+else
+  case `(set -o) 2>/dev/null` in
+  *posix*) set -o posix ;;
+esac
+
+fi
+
+
+:
+_ASEOF
+}; then
+  CONFIG_SHELL=$as_shell
+	       as_have_required=yes
+	       if { "$as_shell" 2> /dev/null <<\_ASEOF
+if test -n "${ZSH_VERSION+set}" && (emulate sh) >/dev/null 2>&1; then
+  emulate sh
+  NULLCMD=:
+  # Zsh 3.x and 4.x performs word splitting on ${1+"$@"}, which
+  # is contrary to our usage.  Disable this feature.
+  alias -g '${1+"$@"}'='"$@"'
+  setopt NO_GLOB_SUBST
+else
+  case `(set -o) 2>/dev/null` in
+  *posix*) set -o posix ;;
+esac
+
+fi
+
+
+:
+(as_func_return () {
+  (exit $1)
+}
+as_func_success () {
+  as_func_return 0
+}
+as_func_failure () {
+  as_func_return 1
+}
+as_func_ret_success () {
+  return 0
+}
+as_func_ret_failure () {
+  return 1
+}
+
+exitcode=0
+if as_func_success; then
+  :
+else
+  exitcode=1
+  echo as_func_success failed.
+fi
+
+if as_func_failure; then
+  exitcode=1
+  echo as_func_failure succeeded.
+fi
+
+if as_func_ret_success; then
+  :
+else
+  exitcode=1
+  echo as_func_ret_success failed.
+fi
+
+if as_func_ret_failure; then
+  exitcode=1
+  echo as_func_ret_failure succeeded.
+fi
+
+if ( set x; as_func_ret_success y && test x = "$1" ); then
+  :
+else
+  exitcode=1
+  echo positional parameters were not saved.
+fi
+
+test $exitcode = 0) || { (exit 1); exit 1; }
+
+(
+  as_lineno_1=$LINENO
+  as_lineno_2=$LINENO
+  test "x$as_lineno_1" != "x$as_lineno_2" &&
+  test "x`expr $as_lineno_1 + 1`" = "x$as_lineno_2") || { (exit 1); exit 1; }
+
+_ASEOF
+}; then
+  break
+fi
+
+fi
+
+      done
+
+      if test "x$CONFIG_SHELL" != x; then
+  for as_var in BASH_ENV ENV
+        do ($as_unset $as_var) >/dev/null 2>&1 && $as_unset $as_var
+        done
+        export CONFIG_SHELL
+        exec "$CONFIG_SHELL" "$as_myself" ${1+"$@"}
+fi
+
+
+    if test $as_have_required = no; then
+  echo This script requires a shell more modern than all the
+      echo shells that I found on your system.  Please install a
+      echo modern shell, or manually run the script under such a
+      echo shell if you do have one.
+      { (exit 1); exit 1; }
+fi
+
+
+fi
+
+fi
+
+
+
+(eval "as_func_return () {
+  (exit \$1)
+}
+as_func_success () {
+  as_func_return 0
+}
+as_func_failure () {
+  as_func_return 1
+}
+as_func_ret_success () {
+  return 0
+}
+as_func_ret_failure () {
+  return 1
+}
+
+exitcode=0
+if as_func_success; then
+  :
+else
+  exitcode=1
+  echo as_func_success failed.
+fi
+
+if as_func_failure; then
+  exitcode=1
+  echo as_func_failure succeeded.
+fi
+
+if as_func_ret_success; then
+  :
+else
+  exitcode=1
+  echo as_func_ret_success failed.
+fi
+
+if as_func_ret_failure; then
+  exitcode=1
+  echo as_func_ret_failure succeeded.
+fi
+
+if ( set x; as_func_ret_success y && test x = \"\$1\" ); then
+  :
+else
+  exitcode=1
+  echo positional parameters were not saved.
+fi
+
+test \$exitcode = 0") || {
+  echo No shell found that supports shell functions.
+  echo Please tell autoconf@gnu.org about your system,
+  echo including any error possibly output before this
+  echo message
+}
+
+
+
+  as_lineno_1=$LINENO
+  as_lineno_2=$LINENO
+  test "x$as_lineno_1" != "x$as_lineno_2" &&
+  test "x`expr $as_lineno_1 + 1`" = "x$as_lineno_2" || {
+
+  # Create $as_me.lineno as a copy of $as_myself, but with $LINENO
+  # uniformly replaced by the line number.  The first 'sed' inserts a
+  # line-number line after each line using $LINENO; the second 'sed'
+  # does the real work.  The second script uses 'N' to pair each
+  # line-number line with the line containing $LINENO, and appends
+  # trailing '-' during substitution so that $LINENO is not a special
+  # case at line end.
+  # (Raja R Harinath suggested sed '=', and Paul Eggert wrote the
+  # scripts with optimization help from Paolo Bonzini.  Blame Lee
+  # E. McMahon (1931-1989) for sed's syntax.  :-)
+  sed -n '
+    p
+    /[$]LINENO/=
+  ' <$as_myself |
+    sed '
+      s/[$]LINENO.*/&-/
+      t lineno
+      b
+      :lineno
+      N
+      :loop
+      s/[$]LINENO\([^'$as_cr_alnum'_].*\n\)\(.*\)/\2\1\2/
+      t loop
+      s/-\n.*//
+    ' >$as_me.lineno &&
+  chmod +x "$as_me.lineno" ||
+    { echo "$as_me: error: cannot create $as_me.lineno; rerun with a POSIX shell" >&2
+   { (exit 1); exit 1; }; }
+
+  # Don't try to exec as it changes $[0], causing all sort of problems
+  # (the dirname of $[0] is not the place where we might find the
+  # original and so on.  Autoconf is especially sensitive to this).
+  . "./$as_me.lineno"
+  # Exit status is that of the last command.
+  exit
+}
+
+
+if (as_dir=`dirname -- /` && test "X$as_dir" = X/) >/dev/null 2>&1; then
+  as_dirname=dirname
+else
+  as_dirname=false
+fi
+
+ECHO_C= ECHO_N= ECHO_T=
+case `echo -n x` in
+-n*)
+  case `echo 'x\c'` in
+  *c*) ECHO_T='	';;	# ECHO_T is single tab character.
+  *)   ECHO_C='\c';;
+  esac;;
+*)
+  ECHO_N='-n';;
+esac
+
+if expr a : '\(a\)' >/dev/null 2>&1 &&
+   test "X`expr 00001 : '.*\(...\)'`" = X001; then
+  as_expr=expr
+else
+  as_expr=false
+fi
+
+rm -f conf$$ conf$$.exe conf$$.file
+if test -d conf$$.dir; then
+  rm -f conf$$.dir/conf$$.file
+else
+  rm -f conf$$.dir
+  mkdir conf$$.dir
+fi
+echo >conf$$.file
+if ln -s conf$$.file conf$$ 2>/dev/null; then
+  as_ln_s='ln -s'
+  # ... but there are two gotchas:
+  # 1) On MSYS, both `ln -s file dir' and `ln file dir' fail.
+  # 2) DJGPP < 2.04 has no symlinks; `ln -s' creates a wrapper executable.
+  # In both cases, we have to default to `cp -p'.
+  ln -s conf$$.file conf$$.dir 2>/dev/null && test ! -f conf$$.exe ||
+    as_ln_s='cp -p'
+elif ln conf$$.file conf$$ 2>/dev/null; then
+  as_ln_s=ln
+else
+  as_ln_s='cp -p'
+fi
+rm -f conf$$ conf$$.exe conf$$.dir/conf$$.file conf$$.file
+rmdir conf$$.dir 2>/dev/null
+
+if mkdir -p . 2>/dev/null; then
+  as_mkdir_p=:
+else
+  test -d ./-p && rmdir ./-p
+  as_mkdir_p=false
+fi
+
+if test -x / >/dev/null 2>&1; then
+  as_test_x='test -x'
+else
+  if ls -dL / >/dev/null 2>&1; then
+    as_ls_L_option=L
+  else
+    as_ls_L_option=
+  fi
+  as_test_x='
+    eval sh -c '\''
+      if test -d "$1"; then
+        test -d "$1/.";
+      else
+	case $1 in
+        -*)set "./$1";;
+	esac;
+	case `ls -ld'$as_ls_L_option' "$1" 2>/dev/null` in
+	???[sx]*):;;*)false;;esac;fi
+    '\'' sh
+  '
+fi
+as_executable_p=$as_test_x
+
+# Sed expression to map a string onto a valid CPP name.
+as_tr_cpp="eval sed 'y%*$as_cr_letters%P$as_cr_LETTERS%;s%[^_$as_cr_alnum]%_%g'"
+
+# Sed expression to map a string onto a valid variable name.
+as_tr_sh="eval sed 'y%*+%pp%;s%[^_$as_cr_alnum]%_%g'"
+
+
+
+exec 7<&0 </dev/null 6>&1
+
+# Name of the host.
+# hostname on some systems (SVR3.2, Linux) returns a bogus exit status,
+# so uname gets run too.
+ac_hostname=`(hostname || uname -n) 2>/dev/null | sed 1q`
+
+#
+# Initializations.
+#
+ac_default_prefix=/usr/local
+ac_clean_files=
+ac_config_libobj_dir=.
+LIBOBJS=
+cross_compiling=no
+subdirs=
+MFLAGS=
+MAKEFLAGS=
+SHELL=${CONFIG_SHELL-/bin/sh}
+
+# Identity of this package.
+PACKAGE_NAME=
+PACKAGE_TARNAME=
+PACKAGE_VERSION=
+PACKAGE_STRING=
+PACKAGE_BUGREPORT=
+
+ac_unique_file="colm/main.cpp"
+ac_subst_vars='SHELL
+PATH_SEPARATOR
+PACKAGE_NAME
+PACKAGE_TARNAME
+PACKAGE_VERSION
+PACKAGE_STRING
+PACKAGE_BUGREPORT
+exec_prefix
+prefix
+program_transform_name
+bindir
+sbindir
+libexecdir
+datarootdir
+datadir
+sysconfdir
+sharedstatedir
+localstatedir
+includedir
+oldincludedir
+docdir
+infodir
+htmldir
+dvidir
+pdfdir
+psdir
+libdir
+localedir
+mandir
+DEFS
+ECHO_C
+ECHO_N
+ECHO_T
+LIBS
+build_alias
+host_alias
+target_alias
+BUILD_PARSERS
+CC
+CFLAGS
+LDFLAGS
+CPPFLAGS
+ac_ct_CC
+EXEEXT
+OBJEXT
+CXX
+CXXFLAGS
+ac_ct_CXX
+SET_MAKE
+RAGEL
+KELBT
+LIBOBJS
+LTLIBOBJS'
+ac_subst_files=''
+      ac_precious_vars='build_alias
+host_alias
+target_alias
+CC
+CFLAGS
+LDFLAGS
+LIBS
+CPPFLAGS
+CXX
+CXXFLAGS
+CCC'
+
+
+# Initialize some variables set by options.
+ac_init_help=
+ac_init_version=false
+# The variables have the same names as the options, with
+# dashes changed to underlines.
+cache_file=/dev/null
+exec_prefix=NONE
+no_create=
+no_recursion=
+prefix=NONE
+program_prefix=NONE
+program_suffix=NONE
+program_transform_name=s,x,x,
+silent=
+site=
+srcdir=
+verbose=
+x_includes=NONE
+x_libraries=NONE
+
+# Installation directory options.
+# These are left unexpanded so users can "make install exec_prefix=/foo"
+# and all the variables that are supposed to be based on exec_prefix
+# by default will actually change.
+# Use braces instead of parens because sh, perl, etc. also accept them.
+# (The list follows the same order as the GNU Coding Standards.)
+bindir='${exec_prefix}/bin'
+sbindir='${exec_prefix}/sbin'
+libexecdir='${exec_prefix}/libexec'
+datarootdir='${prefix}/share'
+datadir='${datarootdir}'
+sysconfdir='${prefix}/etc'
+sharedstatedir='${prefix}/com'
+localstatedir='${prefix}/var'
+includedir='${prefix}/include'
+oldincludedir='/usr/include'
+docdir='${datarootdir}/doc/${PACKAGE}'
+infodir='${datarootdir}/info'
+htmldir='${docdir}'
+dvidir='${docdir}'
+pdfdir='${docdir}'
+psdir='${docdir}'
+libdir='${exec_prefix}/lib'
+localedir='${datarootdir}/locale'
+mandir='${datarootdir}/man'
+
+ac_prev=
+ac_dashdash=
+for ac_option
+do
+  # If the previous option needs an argument, assign it.
+  if test -n "$ac_prev"; then
+    eval $ac_prev=\$ac_option
+    ac_prev=
+    continue
+  fi
+
+  case $ac_option in
+  *=*)	ac_optarg=`expr "X$ac_option" : '[^=]*=\(.*\)'` ;;
+  *)	ac_optarg=yes ;;
+  esac
+
+  # Accept the important Cygnus configure options, so we can diagnose typos.
+
+  case $ac_dashdash$ac_option in
+  --)
+    ac_dashdash=yes ;;
+
+  -bindir | --bindir | --bindi | --bind | --bin | --bi)
+    ac_prev=bindir ;;
+  -bindir=* | --bindir=* | --bindi=* | --bind=* | --bin=* | --bi=*)
+    bindir=$ac_optarg ;;
+
+  -build | --build | --buil | --bui | --bu)
+    ac_prev=build_alias ;;
+  -build=* | --build=* | --buil=* | --bui=* | --bu=*)
+    build_alias=$ac_optarg ;;
+
+  -cache-file | --cache-file | --cache-fil | --cache-fi \
+  | --cache-f | --cache- | --cache | --cach | --cac | --ca | --c)
+    ac_prev=cache_file ;;
+  -cache-file=* | --cache-file=* | --cache-fil=* | --cache-fi=* \
+  | --cache-f=* | --cache-=* | --cache=* | --cach=* | --cac=* | --ca=* | --c=*)
+    cache_file=$ac_optarg ;;
+
+  --config-cache | -C)
+    cache_file=config.cache ;;
+
+  -datadir | --datadir | --datadi | --datad)
+    ac_prev=datadir ;;
+  -datadir=* | --datadir=* | --datadi=* | --datad=*)
+    datadir=$ac_optarg ;;
+
+  -datarootdir | --datarootdir | --datarootdi | --datarootd | --dataroot \
+  | --dataroo | --dataro | --datar)
+    ac_prev=datarootdir ;;
+  -datarootdir=* | --datarootdir=* | --datarootdi=* | --datarootd=* \
+  | --dataroot=* | --dataroo=* | --dataro=* | --datar=*)
+    datarootdir=$ac_optarg ;;
+
+  -disable-* | --disable-*)
+    ac_feature=`expr "x$ac_option" : 'x-*disable-\(.*\)'`
+    # Reject names that are not valid shell variable names.
+    expr "x$ac_feature" : ".*[^-._$as_cr_alnum]" >/dev/null &&
+      { echo "$as_me: error: invalid feature name: $ac_feature" >&2
+   { (exit 1); exit 1; }; }
+    ac_feature=`echo $ac_feature | sed 's/[-.]/_/g'`
+    eval enable_$ac_feature=no ;;
+
+  -docdir | --docdir | --docdi | --doc | --do)
+    ac_prev=docdir ;;
+  -docdir=* | --docdir=* | --docdi=* | --doc=* | --do=*)
+    docdir=$ac_optarg ;;
+
+  -dvidir | --dvidir | --dvidi | --dvid | --dvi | --dv)
+    ac_prev=dvidir ;;
+  -dvidir=* | --dvidir=* | --dvidi=* | --dvid=* | --dvi=* | --dv=*)
+    dvidir=$ac_optarg ;;
+
+  -enable-* | --enable-*)
+    ac_feature=`expr "x$ac_option" : 'x-*enable-\([^=]*\)'`
+    # Reject names that are not valid shell variable names.
+    expr "x$ac_feature" : ".*[^-._$as_cr_alnum]" >/dev/null &&
+      { echo "$as_me: error: invalid feature name: $ac_feature" >&2
+   { (exit 1); exit 1; }; }
+    ac_feature=`echo $ac_feature | sed 's/[-.]/_/g'`
+    eval enable_$ac_feature=\$ac_optarg ;;
+
+  -exec-prefix | --exec_prefix | --exec-prefix | --exec-prefi \
+  | --exec-pref | --exec-pre | --exec-pr | --exec-p | --exec- \
+  | --exec | --exe | --ex)
+    ac_prev=exec_prefix ;;
+  -exec-prefix=* | --exec_prefix=* | --exec-prefix=* | --exec-prefi=* \
+  | --exec-pref=* | --exec-pre=* | --exec-pr=* | --exec-p=* | --exec-=* \
+  | --exec=* | --exe=* | --ex=*)
+    exec_prefix=$ac_optarg ;;
+
+  -gas | --gas | --ga | --g)
+    # Obsolete; use --with-gas.
+    with_gas=yes ;;
+
+  -help | --help | --hel | --he | -h)
+    ac_init_help=long ;;
+  -help=r* | --help=r* | --hel=r* | --he=r* | -hr*)
+    ac_init_help=recursive ;;
+  -help=s* | --help=s* | --hel=s* | --he=s* | -hs*)
+    ac_init_help=short ;;
+
+  -host | --host | --hos | --ho)
+    ac_prev=host_alias ;;
+  -host=* | --host=* | --hos=* | --ho=*)
+    host_alias=$ac_optarg ;;
+
+  -htmldir | --htmldir | --htmldi | --htmld | --html | --htm | --ht)
+    ac_prev=htmldir ;;
+  -htmldir=* | --htmldir=* | --htmldi=* | --htmld=* | --html=* | --htm=* \
+  | --ht=*)
+    htmldir=$ac_optarg ;;
+
+  -includedir | --includedir | --includedi | --included | --include \
+  | --includ | --inclu | --incl | --inc)
+    ac_prev=includedir ;;
+  -includedir=* | --includedir=* | --includedi=* | --included=* | --include=* \
+  | --includ=* | --inclu=* | --incl=* | --inc=*)
+    includedir=$ac_optarg ;;
+
+  -infodir | --infodir | --infodi | --infod | --info | --inf)
+    ac_prev=infodir ;;
+  -infodir=* | --infodir=* | --infodi=* | --infod=* | --info=* | --inf=*)
+    infodir=$ac_optarg ;;
+
+  -libdir | --libdir | --libdi | --libd)
+    ac_prev=libdir ;;
+  -libdir=* | --libdir=* | --libdi=* | --libd=*)
+    libdir=$ac_optarg ;;
+
+  -libexecdir | --libexecdir | --libexecdi | --libexecd | --libexec \
+  | --libexe | --libex | --libe)
+    ac_prev=libexecdir ;;
+  -libexecdir=* | --libexecdir=* | --libexecdi=* | --libexecd=* | --libexec=* \
+  | --libexe=* | --libex=* | --libe=*)
+    libexecdir=$ac_optarg ;;
+
+  -localedir | --localedir | --localedi | --localed | --locale)
+    ac_prev=localedir ;;
+  -localedir=* | --localedir=* | --localedi=* | --localed=* | --locale=*)
+    localedir=$ac_optarg ;;
+
+  -localstatedir | --localstatedir | --localstatedi | --localstated \
+  | --localstate | --localstat | --localsta | --localst | --locals)
+    ac_prev=localstatedir ;;
+  -localstatedir=* | --localstatedir=* | --localstatedi=* | --localstated=* \
+  | --localstate=* | --localstat=* | --localsta=* | --localst=* | --locals=*)
+    localstatedir=$ac_optarg ;;
+
+  -mandir | --mandir | --mandi | --mand | --man | --ma | --m)
+    ac_prev=mandir ;;
+  -mandir=* | --mandir=* | --mandi=* | --mand=* | --man=* | --ma=* | --m=*)
+    mandir=$ac_optarg ;;
+
+  -nfp | --nfp | --nf)
+    # Obsolete; use --without-fp.
+    with_fp=no ;;
+
+  -no-create | --no-create | --no-creat | --no-crea | --no-cre \
+  | --no-cr | --no-c | -n)
+    no_create=yes ;;
+
+  -no-recursion | --no-recursion | --no-recursio | --no-recursi \
+  | --no-recurs | --no-recur | --no-recu | --no-rec | --no-re | --no-r)
+    no_recursion=yes ;;
+
+  -oldincludedir | --oldincludedir | --oldincludedi | --oldincluded \
+  | --oldinclude | --oldinclud | --oldinclu | --oldincl | --oldinc \
+  | --oldin | --oldi | --old | --ol | --o)
+    ac_prev=oldincludedir ;;
+  -oldincludedir=* | --oldincludedir=* | --oldincludedi=* | --oldincluded=* \
+  | --oldinclude=* | --oldinclud=* | --oldinclu=* | --oldincl=* | --oldinc=* \
+  | --oldin=* | --oldi=* | --old=* | --ol=* | --o=*)
+    oldincludedir=$ac_optarg ;;
+
+  -prefix | --prefix | --prefi | --pref | --pre | --pr | --p)
+    ac_prev=prefix ;;
+  -prefix=* | --prefix=* | --prefi=* | --pref=* | --pre=* | --pr=* | --p=*)
+    prefix=$ac_optarg ;;
+
+  -program-prefix | --program-prefix | --program-prefi | --program-pref \
+  | --program-pre | --program-pr | --program-p)
+    ac_prev=program_prefix ;;
+  -program-prefix=* | --program-prefix=* | --program-prefi=* \
+  | --program-pref=* | --program-pre=* | --program-pr=* | --program-p=*)
+    program_prefix=$ac_optarg ;;
+
+  -program-suffix | --program-suffix | --program-suffi | --program-suff \
+  | --program-suf | --program-su | --program-s)
+    ac_prev=program_suffix ;;
+  -program-suffix=* | --program-suffix=* | --program-suffi=* \
+  | --program-suff=* | --program-suf=* | --program-su=* | --program-s=*)
+    program_suffix=$ac_optarg ;;
+
+  # Every unambiguous abbreviation of --program-transform-name is accepted;
+  # the historical misspelling --progr-tra is kept for compatibility.
+  -program-transform-name | --program-transform-name \
+  | --program-transform-nam | --program-transform-na \
+  | --program-transform-n | --program-transform- \
+  | --program-transform | --program-transfor \
+  | --program-transfo | --program-transf | --program-trans | --program-tran \
+  | --program-tra | --progr-tra | --program-tr | --program-t)
+    ac_prev=program_transform_name ;;
+  -program-transform-name=* | --program-transform-name=* \
+  | --program-transform-nam=* | --program-transform-na=* \
+  | --program-transform-n=* | --program-transform-=* \
+  | --program-transform=* | --program-transfor=* \
+  | --program-transfo=* | --program-transf=* | --program-trans=* | --program-tran=* \
+  | --program-tra=* | --progr-tra=* | --program-tr=* | --program-t=*)
+    program_transform_name=$ac_optarg ;;
+
+  -pdfdir | --pdfdir | --pdfdi | --pdfd | --pdf | --pd)
+    ac_prev=pdfdir ;;
+  -pdfdir=* | --pdfdir=* | --pdfdi=* | --pdfd=* | --pdf=* | --pd=*)
+    pdfdir=$ac_optarg ;;
+
+  -psdir | --psdir | --psdi | --psd | --ps)
+    ac_prev=psdir ;;
+  -psdir=* | --psdir=* | --psdi=* | --psd=* | --ps=*)
+    psdir=$ac_optarg ;;
+
+  -q | -quiet | --quiet | --quie | --qui | --qu | --q \
+  | -silent | --silent | --silen | --sile | --sil)
+    silent=yes ;;
+
+  -sbindir | --sbindir | --sbindi | --sbind | --sbin | --sbi | --sb)
+    ac_prev=sbindir ;;
+  -sbindir=* | --sbindir=* | --sbindi=* | --sbind=* | --sbin=* \
+  | --sbi=* | --sb=*)
+    sbindir=$ac_optarg ;;
+
+  -sharedstatedir | --sharedstatedir | --sharedstatedi \
+  | --sharedstated | --sharedstate | --sharedstat | --sharedsta \
+  | --sharedst | --shareds | --shared | --share | --shar \
+  | --sha | --sh)
+    ac_prev=sharedstatedir ;;
+  -sharedstatedir=* | --sharedstatedir=* | --sharedstatedi=* \
+  | --sharedstated=* | --sharedstate=* | --sharedstat=* | --sharedsta=* \
+  | --sharedst=* | --shareds=* | --shared=* | --share=* | --shar=* \
+  | --sha=* | --sh=*)
+    sharedstatedir=$ac_optarg ;;
+
+  -site | --site | --sit)
+    ac_prev=site ;;
+  -site=* | --site=* | --sit=*)
+    site=$ac_optarg ;;
+
+  -srcdir | --srcdir | --srcdi | --srcd | --src | --sr)
+    ac_prev=srcdir ;;
+  -srcdir=* | --srcdir=* | --srcdi=* | --srcd=* | --src=* | --sr=*)
+    srcdir=$ac_optarg ;;
+
+  -sysconfdir | --sysconfdir | --sysconfdi | --sysconfd | --sysconf \
+  | --syscon | --sysco | --sysc | --sys | --sy)
+    ac_prev=sysconfdir ;;
+  -sysconfdir=* | --sysconfdir=* | --sysconfdi=* | --sysconfd=* | --sysconf=* \
+  | --syscon=* | --sysco=* | --sysc=* | --sys=* | --sy=*)
+    sysconfdir=$ac_optarg ;;
+
+  -target | --target | --targe | --targ | --tar | --ta | --t)
+    ac_prev=target_alias ;;
+  -target=* | --target=* | --targe=* | --targ=* | --tar=* | --ta=* | --t=*)
+    target_alias=$ac_optarg ;;
+
+  -v | -verbose | --verbose | --verbos | --verbo | --verb)
+    verbose=yes ;;
+
+  -version | --version | --versio | --versi | --vers | -V)
+    ac_init_version=: ;;
+
+  -with-* | --with-*)
+    ac_package=`expr "x$ac_option" : 'x-*with-\([^=]*\)'`
+    # Reject names that are not valid shell variable names.
+    expr "x$ac_package" : ".*[^-._$as_cr_alnum]" >/dev/null &&
+      { echo "$as_me: error: invalid package name: $ac_package" >&2
+   { (exit 1); exit 1; }; }
+    ac_package=`echo $ac_package | sed 's/[-.]/_/g'`
+    eval with_$ac_package=\$ac_optarg ;;
+
+  -without-* | --without-*)
+    ac_package=`expr "x$ac_option" : 'x-*without-\(.*\)'`
+    # Reject names that are not valid shell variable names.
+    expr "x$ac_package" : ".*[^-._$as_cr_alnum]" >/dev/null &&
+      { echo "$as_me: error: invalid package name: $ac_package" >&2
+   { (exit 1); exit 1; }; }
+    ac_package=`echo $ac_package | sed 's/[-.]/_/g'`
+    eval with_$ac_package=no ;;
+
+  --x)
+    # Obsolete; use --with-x.
+    with_x=yes ;;
+
+  -x-includes | --x-includes | --x-include | --x-includ | --x-inclu \
+  | --x-incl | --x-inc | --x-in | --x-i)
+    ac_prev=x_includes ;;
+  -x-includes=* | --x-includes=* | --x-include=* | --x-includ=* | --x-inclu=* \
+  | --x-incl=* | --x-inc=* | --x-in=* | --x-i=*)
+    x_includes=$ac_optarg ;;
+
+  -x-libraries | --x-libraries | --x-librarie | --x-librari \
+  | --x-librar | --x-libra | --x-libr | --x-lib | --x-li | --x-l)
+    ac_prev=x_libraries ;;
+  -x-libraries=* | --x-libraries=* | --x-librarie=* | --x-librari=* \
+  | --x-librar=* | --x-libra=* | --x-libr=* | --x-lib=* | --x-li=* | --x-l=*)
+    x_libraries=$ac_optarg ;;
+
+  -*) { echo "$as_me: error: unrecognized option: $ac_option
+Try \`$0 --help' for more information." >&2
+   { (exit 1); exit 1; }; }
+    ;;
+
+  *=*)
+    ac_envvar=`expr "x$ac_option" : 'x\([^=]*\)='`
+    # Reject names that are not valid shell variable names.
+    expr "x$ac_envvar" : ".*[^_$as_cr_alnum]" >/dev/null &&
+      { echo "$as_me: error: invalid variable name: $ac_envvar" >&2
+   { (exit 1); exit 1; }; }
+    eval $ac_envvar=\$ac_optarg
+    export $ac_envvar ;;
+
+  *)
+    # FIXME: should be removed in autoconf 3.0.
+    echo "$as_me: WARNING: you should use --build, --host, --target" >&2
+    expr "x$ac_option" : ".*[^-._$as_cr_alnum]" >/dev/null &&
+      echo "$as_me: WARNING: invalid host type: $ac_option" >&2
+    : ${build_alias=$ac_option} ${host_alias=$ac_option} ${target_alias=$ac_option}
+    ;;
+
+  esac
+done
+
+if test -n "$ac_prev"; then
+  ac_option=--`echo $ac_prev | sed 's/_/-/g'`
+  { echo "$as_me: error: missing argument to $ac_option" >&2
+   { (exit 1); exit 1; }; }
+fi
+
+# Require absolute directory names (NONE or empty is allowed for *prefix only).
+for ac_var in	exec_prefix prefix bindir sbindir libexecdir datarootdir \
+		datadir sysconfdir sharedstatedir localstatedir includedir \
+		oldincludedir docdir infodir htmldir dvidir pdfdir psdir \
+		libdir localedir mandir
+do
+  eval ac_val=\$$ac_var
+  case $ac_val in
+    [\\/$]* | ?:[\\/]* )  continue;;
+    NONE | '' ) case $ac_var in *prefix ) continue;; esac;;
+  esac
+  { echo "$as_me: error: expected an absolute directory name for --$ac_var: $ac_val" >&2
+   { (exit 1); exit 1; }; }
+done
+
+# There might be people who depend on the old broken behavior: `$host'
+# used to hold the argument of --host etc.
+# FIXME: To remove some day.
+build=$build_alias
+host=$host_alias
+target=$target_alias
+
+# FIXME: To remove some day.
+if test "x$host_alias" != x; then
+  if test "x$build_alias" = x; then
+    cross_compiling=maybe
+    echo "$as_me: WARNING: If you wanted to set the --build type, don't use --host.
+    If a cross compiler is detected then cross compile mode will be used." >&2
+  elif test "x$build_alias" != "x$host_alias"; then
+    cross_compiling=yes
+  fi
+fi
+
+ac_tool_prefix=
+test -n "$host_alias" && ac_tool_prefix=$host_alias-
+
+test "$silent" = yes && exec 6>/dev/null
+
+
+ac_pwd=`pwd` && test -n "$ac_pwd" &&
+ac_ls_di=`ls -di .` &&
+ac_pwd_ls_di=`cd "$ac_pwd" && ls -di .` ||
+  { echo "$as_me: error: Working directory cannot be determined" >&2
+   { (exit 1); exit 1; }; }
+test "X$ac_ls_di" = "X$ac_pwd_ls_di" ||
+  { echo "$as_me: error: pwd does not report name of working directory" >&2
+   { (exit 1); exit 1; }; }
+
+
+# Find the source files, if location was not specified.
+if test -z "$srcdir"; then
+  ac_srcdir_defaulted=yes
+  # Try the directory containing this script, then the parent directory.
+  ac_confdir=`$as_dirname -- "$0" ||
+$as_expr X"$0" : 'X\(.*[^/]\)//*[^/][^/]*/*$' \| \
+	 X"$0" : 'X\(//\)[^/]' \| \
+	 X"$0" : 'X\(//\)$' \| \
+	 X"$0" : 'X\(/\)' \| . 2>/dev/null ||
+echo X"$0" |
+    sed '/^X\(.*[^/]\)\/\/*[^/][^/]*\/*$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\/\)[^/].*/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\/\)$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\).*/{
+	    s//\1/
+	    q
+	  }
+	  s/.*/./; q'`
+  srcdir=$ac_confdir
+  if test ! -r "$srcdir/$ac_unique_file"; then
+    srcdir=..
+  fi
+else
+  ac_srcdir_defaulted=no
+fi
+if test ! -r "$srcdir/$ac_unique_file"; then
+  test "$ac_srcdir_defaulted" = yes && srcdir="$ac_confdir or .."
+  { echo "$as_me: error: cannot find sources ($ac_unique_file) in $srcdir" >&2
+   { (exit 1); exit 1; }; }
+fi
+ac_msg="sources are in $srcdir, but \`cd $srcdir' does not work"
+ac_abs_confdir=`(
+	cd "$srcdir" && test -r "./$ac_unique_file" || { echo "$as_me: error: $ac_msg" >&2
+   { (exit 1); exit 1; }; }
+	pwd)`
+# When building in place, set srcdir=.
+if test "$ac_abs_confdir" = "$ac_pwd"; then
+  srcdir=.
+fi
+# Remove unnecessary trailing slashes from srcdir.
+# Double slashes in file names in object file debugging info
+# mess up M-x gdb in Emacs.
+case $srcdir in
+*/) srcdir=`expr "X$srcdir" : 'X\(.*[^/]\)' \| "X$srcdir" : 'X\(.*\)'`;;
+esac
+for ac_var in $ac_precious_vars; do
+  eval ac_env_${ac_var}_set=\${${ac_var}+set}
+  eval ac_env_${ac_var}_value=\$${ac_var}
+  eval ac_cv_env_${ac_var}_set=\${${ac_var}+set}
+  eval ac_cv_env_${ac_var}_value=\$${ac_var}
+done
+
+#
+# Report the --help message.
+#
+if test "$ac_init_help" = "long"; then
+  # Omit some internal or obsolete options to make the list less imposing.
+  # This message is too long to be a string in the A/UX 3.1 sh.
+  cat <<_ACEOF
+\`configure' configures this package to adapt to many kinds of systems.
+
+Usage: $0 [OPTION]... [VAR=VALUE]...
+
+To assign environment variables (e.g., CC, CFLAGS...), specify them as
+VAR=VALUE.  See below for descriptions of some of the useful variables.
+
+Defaults for the options are specified in brackets.
+
+Configuration:
+  -h, --help              display this help and exit
+      --help=short        display options specific to this package
+      --help=recursive    display the short help of all the included packages
+  -V, --version           display version information and exit
+  -q, --quiet, --silent   do not print \`checking...' messages
+      --cache-file=FILE   cache test results in FILE [disabled]
+  -C, --config-cache      alias for \`--cache-file=config.cache'
+  -n, --no-create         do not create output files
+      --srcdir=DIR        find the sources in DIR [configure dir or \`..']
+
+Installation directories:
+  --prefix=PREFIX         install architecture-independent files in PREFIX
+			  [$ac_default_prefix]
+  --exec-prefix=EPREFIX   install architecture-dependent files in EPREFIX
+			  [PREFIX]
+
+By default, \`make install' will install all the files in
+\`$ac_default_prefix/bin', \`$ac_default_prefix/lib' etc.  You can specify
+an installation prefix other than \`$ac_default_prefix' using \`--prefix',
+for instance \`--prefix=\$HOME'.
+
+For better control, use the options below.
+
+Fine tuning of the installation directories:
+  --bindir=DIR           user executables [EPREFIX/bin]
+  --sbindir=DIR          system admin executables [EPREFIX/sbin]
+  --libexecdir=DIR       program executables [EPREFIX/libexec]
+  --sysconfdir=DIR       read-only single-machine data [PREFIX/etc]
+  --sharedstatedir=DIR   modifiable architecture-independent data [PREFIX/com]
+  --localstatedir=DIR    modifiable single-machine data [PREFIX/var]
+  --libdir=DIR           object code libraries [EPREFIX/lib]
+  --includedir=DIR       C header files [PREFIX/include]
+  --oldincludedir=DIR    C header files for non-gcc [/usr/include]
+  --datarootdir=DIR      read-only arch.-independent data root [PREFIX/share]
+  --datadir=DIR          read-only architecture-independent data [DATAROOTDIR]
+  --infodir=DIR          info documentation [DATAROOTDIR/info]
+  --localedir=DIR        locale-dependent data [DATAROOTDIR/locale]
+  --mandir=DIR           man documentation [DATAROOTDIR/man]
+  --docdir=DIR           documentation root [DATAROOTDIR/doc/PACKAGE]
+  --htmldir=DIR          html documentation [DOCDIR]
+  --dvidir=DIR           dvi documentation [DOCDIR]
+  --pdfdir=DIR           pdf documentation [DOCDIR]
+  --psdir=DIR            ps documentation [DOCDIR]
+_ACEOF
+
+  cat <<\_ACEOF
+_ACEOF
+fi
+
+if test -n "$ac_init_help"; then
+
+  cat <<\_ACEOF
+
+Optional Features:
+  --disable-FEATURE       do not include FEATURE (same as --enable-FEATURE=no)
+  --enable-FEATURE[=ARG]  include FEATURE [ARG=yes]
+"turn on logging"
+"turns on bytecode logging"
+"turns on parse logging"
+"turns on match logging"
+"turns on compile logging"
+
+Some influential environment variables:
+  CC          C compiler command
+  CFLAGS      C compiler flags
+  LDFLAGS     linker flags, e.g. -L<lib dir> if you have libraries in a
+              nonstandard directory <lib dir>
+  LIBS        libraries to pass to the linker, e.g. -l<library>
+  CPPFLAGS    C/C++/Objective C preprocessor flags, e.g. -I<include dir> if
+              you have headers in a nonstandard directory <include dir>
+  CXX         C++ compiler command
+  CXXFLAGS    C++ compiler flags
+
+Use these variables to override the choices made by `configure' or to help
+it to find libraries and programs with nonstandard names/locations.
+
+_ACEOF
+ac_status=$?
+fi
+
+if test "$ac_init_help" = "recursive"; then
+  # If there are subdirs, report their specific --help.
+  for ac_dir in : $ac_subdirs_all; do test "x$ac_dir" = x: && continue
+    test -d "$ac_dir" || continue
+    ac_builddir=.
+
+case "$ac_dir" in
+.) ac_dir_suffix= ac_top_builddir_sub=. ac_top_build_prefix= ;;
+*)
+  ac_dir_suffix=/`echo "$ac_dir" | sed 's,^\.[\\/],,'`
+  # A ".." for each directory in $ac_dir_suffix.
+  ac_top_builddir_sub=`echo "$ac_dir_suffix" | sed 's,/[^\\/]*,/..,g;s,/,,'`
+  case $ac_top_builddir_sub in
+  "") ac_top_builddir_sub=. ac_top_build_prefix= ;;
+  *)  ac_top_build_prefix=$ac_top_builddir_sub/ ;;
+  esac ;;
+esac
+ac_abs_top_builddir=$ac_pwd
+ac_abs_builddir=$ac_pwd$ac_dir_suffix
+# for backward compatibility:
+ac_top_builddir=$ac_top_build_prefix
+
+case $srcdir in
+  .)  # We are building in place.
+    ac_srcdir=.
+    ac_top_srcdir=$ac_top_builddir_sub
+    ac_abs_top_srcdir=$ac_pwd ;;
+  [\\/]* | ?:[\\/]* )  # Absolute name.
+    ac_srcdir=$srcdir$ac_dir_suffix;
+    ac_top_srcdir=$srcdir
+    ac_abs_top_srcdir=$srcdir ;;
+  *) # Relative name.
+    ac_srcdir=$ac_top_build_prefix$srcdir$ac_dir_suffix
+    ac_top_srcdir=$ac_top_build_prefix$srcdir
+    ac_abs_top_srcdir=$ac_pwd/$srcdir ;;
+esac
+ac_abs_srcdir=$ac_abs_top_srcdir$ac_dir_suffix
+
+    cd "$ac_dir" || { ac_status=$?; continue; }
+    # Look for a guest configure script; configure.gnu is preferred over configure.
+    if test -f "$ac_srcdir/configure.gnu"; then
+      echo &&
+      $SHELL "$ac_srcdir/configure.gnu" --help=recursive
+    elif test -f "$ac_srcdir/configure"; then
+      echo &&
+      $SHELL "$ac_srcdir/configure" --help=recursive
+    else
+      echo "$as_me: WARNING: no configuration information is in $ac_dir" >&2
+    fi || ac_status=$?
+    cd "$ac_pwd" || { ac_status=$?; break; }
+  done
+fi
+
+test -n "$ac_init_help" && exit $ac_status
+if $ac_init_version; then
+  cat <<\_ACEOF
+configure
+generated by GNU Autoconf 2.61
+
+Copyright (C) 1992, 1993, 1994, 1995, 1996, 1998, 1999, 2000, 2001,
+2002, 2003, 2004, 2005, 2006 Free Software Foundation, Inc.
+This configure script is free software; the Free Software Foundation
+gives unlimited permission to copy, distribute and modify it.
+_ACEOF
+  exit
+fi
+cat >config.log <<_ACEOF
+This file contains any messages produced by compilers while
+running configure, to aid debugging if configure makes a mistake.
+
+It was created by $as_me, which was
+generated by GNU Autoconf 2.61.  Invocation command line was
+
+  $ $0 $@
+
+_ACEOF
+exec 5>>config.log
+{
+cat <<_ASUNAME
+## --------- ##
+## Platform. ##
+## --------- ##
+
+hostname = `(hostname || uname -n) 2>/dev/null | sed 1q`
+uname -m = `(uname -m) 2>/dev/null || echo unknown`
+uname -r = `(uname -r) 2>/dev/null || echo unknown`
+uname -s = `(uname -s) 2>/dev/null || echo unknown`
+uname -v = `(uname -v) 2>/dev/null || echo unknown`
+
+/usr/bin/uname -p = `(/usr/bin/uname -p) 2>/dev/null || echo unknown`
+/bin/uname -X     = `(/bin/uname -X) 2>/dev/null     || echo unknown`
+
+/bin/arch              = `(/bin/arch) 2>/dev/null              || echo unknown`
+/usr/bin/arch -k       = `(/usr/bin/arch -k) 2>/dev/null       || echo unknown`
+/usr/convex/getsysinfo = `(/usr/convex/getsysinfo) 2>/dev/null || echo unknown`
+/usr/bin/hostinfo      = `(/usr/bin/hostinfo) 2>/dev/null      || echo unknown`
+/bin/machine           = `(/bin/machine) 2>/dev/null           || echo unknown`
+/usr/bin/oslevel       = `(/usr/bin/oslevel) 2>/dev/null       || echo unknown`
+/bin/universe          = `(/bin/universe) 2>/dev/null          || echo unknown`
+
+_ASUNAME
+
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  echo "PATH: $as_dir"
+done
+IFS=$as_save_IFS
+
+} >&5
+
+cat >&5 <<_ACEOF
+
+
+## ----------- ##
+## Core tests. ##
+## ----------- ##
+
+_ACEOF
+
+
+# Keep a trace of the command line.
+# Strip out --no-create and --no-recursion so they do not pile up.
+# Strip out --silent because we don't want to record it for future runs.
+# Also quote any args containing shell meta-characters.
+# Make two passes to allow for proper duplicate-argument suppression.
+ac_configure_args=
+ac_configure_args0=
+ac_configure_args1=
+ac_must_keep_next=false
+for ac_pass in 1 2
+do
+  for ac_arg
+  do
+    case $ac_arg in
+    -no-create | --no-c* | -n | -no-recursion | --no-r*) continue ;;
+    -q | -quiet | --quiet | --quie | --qui | --qu | --q \
+    | -silent | --silent | --silen | --sile | --sil)
+      continue ;;
+    *\'*)
+      ac_arg=`echo "$ac_arg" | sed "s/'/'\\\\\\\\''/g"` ;;
+    esac
+    case $ac_pass in
+    1) ac_configure_args0="$ac_configure_args0 '$ac_arg'" ;;
+    2)
+      ac_configure_args1="$ac_configure_args1 '$ac_arg'"
+      if test $ac_must_keep_next = true; then
+	ac_must_keep_next=false # Got value, back to normal.
+      else
+	case $ac_arg in
+	  *=* | --config-cache | -C | -disable-* | --disable-* \
+	  | -enable-* | --enable-* | -gas | --g* | -nfp | --nf* \
+	  | -q | -quiet | --q* | -silent | --sil* | -v | -verb* \
+	  | -with-* | --with-* | -without-* | --without-* | --x)
+	    case "$ac_configure_args0 " in
+	      "$ac_configure_args1"*" '$ac_arg' "* ) continue ;;
+	    esac
+	    ;;
+	  -* ) ac_must_keep_next=true ;;
+	esac
+      fi
+      ac_configure_args="$ac_configure_args '$ac_arg'"
+      ;;
+    esac
+  done
+done
+$as_unset ac_configure_args0 || test "${ac_configure_args0+set}" != set || { ac_configure_args0=; export ac_configure_args0; }
+$as_unset ac_configure_args1 || test "${ac_configure_args1+set}" != set || { ac_configure_args1=; export ac_configure_args1; }
+
+# When interrupted or exit'd, cleanup temporary files, and complete
+# config.log.  We remove comments because anyway the quotes in there
+# would cause problems or look ugly.
+# WARNING: Use '\'' to represent an apostrophe within the trap.
+# WARNING: Do not start the trap code with a newline, due to a FreeBSD 4.0 bug.
+trap 'exit_status=$?
+  # Save into config.log some information that might help in debugging.
+  {
+    echo
+
+    cat <<\_ASBOX
+## ---------------- ##
+## Cache variables. ##
+## ---------------- ##
+_ASBOX
+    echo
+    # The following way of writing the cache mishandles newlines in values.
+(
+  for ac_var in `(set) 2>&1 | sed -n '\''s/^\([a-zA-Z_][a-zA-Z0-9_]*\)=.*/\1/p'\''`; do
+    eval ac_val=\$$ac_var
+    case $ac_val in #(
+    *${as_nl}*)
+      case $ac_var in #(
+      *_cv_*) { echo "$as_me:$LINENO: WARNING: Cache variable $ac_var contains a newline." >&5
+echo "$as_me: WARNING: Cache variable $ac_var contains a newline." >&2;} ;;
+      esac
+      case $ac_var in #(
+      _ | IFS | as_nl) ;; #(
+      *) $as_unset $ac_var ;;
+      esac ;;
+    esac
+  done
+  (set) 2>&1 |
+    case $as_nl`(ac_space='\'' '\''; set) 2>&1` in #(
+    *${as_nl}ac_space=\ *)
+      sed -n \
+	"s/'\''/'\''\\\\'\'''\''/g;
+	  s/^\\([_$as_cr_alnum]*_cv_[_$as_cr_alnum]*\\)=\\(.*\\)/\\1='\''\\2'\''/p"
+      ;; #(
+    *)
+      sed -n "/^[_$as_cr_alnum]*_cv_[_$as_cr_alnum]*=/p"
+      ;;
+    esac |
+    sort
+)
+    echo
+
+    cat <<\_ASBOX
+## ----------------- ##
+## Output variables. ##
+## ----------------- ##
+_ASBOX
+    echo
+    for ac_var in $ac_subst_vars
+    do
+      eval ac_val=\$$ac_var
+      case $ac_val in
+      *\'\''*) ac_val=`echo "$ac_val" | sed "s/'\''/'\''\\\\\\\\'\'''\''/g"`;;
+      esac
+      echo "$ac_var='\''$ac_val'\''"
+    done | sort
+    echo
+
+    if test -n "$ac_subst_files"; then
+      cat <<\_ASBOX
+## ------------------- ##
+## File substitutions. ##
+## ------------------- ##
+_ASBOX
+      echo
+      for ac_var in $ac_subst_files
+      do
+	eval ac_val=\$$ac_var
+	case $ac_val in
+	*\'\''*) ac_val=`echo "$ac_val" | sed "s/'\''/'\''\\\\\\\\'\'''\''/g"`;;
+	esac
+	echo "$ac_var='\''$ac_val'\''"
+      done | sort
+      echo
+    fi
+
+    if test -s confdefs.h; then
+      cat <<\_ASBOX
+## ----------- ##
+## confdefs.h. ##
+## ----------- ##
+_ASBOX
+      echo
+      cat confdefs.h
+      echo
+    fi
+    test "$ac_signal" != 0 &&
+      echo "$as_me: caught signal $ac_signal"
+    echo "$as_me: exit $exit_status"
+  } >&5
+  rm -f core *.core core.conftest.* &&
+    rm -f -r conftest* confdefs* conf$$* $ac_clean_files &&
+    exit $exit_status
+' 0
+for ac_signal in 1 2 13 15; do
+  trap 'ac_signal='$ac_signal'; { (exit 1); exit 1; }' $ac_signal
+done
+ac_signal=0
+
+# confdefs.h avoids OS command line length limits that DEFS can exceed.
+rm -f -r conftest* confdefs.h
+
+# Predefined preprocessor variables.
+
+cat >>confdefs.h <<_ACEOF
+#define PACKAGE_NAME "$PACKAGE_NAME"
+_ACEOF
+
+
+cat >>confdefs.h <<_ACEOF
+#define PACKAGE_TARNAME "$PACKAGE_TARNAME"
+_ACEOF
+
+
+cat >>confdefs.h <<_ACEOF
+#define PACKAGE_VERSION "$PACKAGE_VERSION"
+_ACEOF
+
+
+cat >>confdefs.h <<_ACEOF
+#define PACKAGE_STRING "$PACKAGE_STRING"
+_ACEOF
+
+
+cat >>confdefs.h <<_ACEOF
+#define PACKAGE_BUGREPORT "$PACKAGE_BUGREPORT"
+_ACEOF
+
+
+# Let the site file select an alternate cache file if it wants to.
+# Prefer explicitly selected file to automatically selected ones.
+if test -n "$CONFIG_SITE"; then
+  set x "$CONFIG_SITE"
+elif test "x$prefix" != xNONE; then
+  set x "$prefix/share/config.site" "$prefix/etc/config.site"
+else
+  set x "$ac_default_prefix/share/config.site" \
+	"$ac_default_prefix/etc/config.site"
+fi
+shift
+for ac_site_file
+do
+  if test -r "$ac_site_file"; then
+    { echo "$as_me:$LINENO: loading site script $ac_site_file" >&5
+echo "$as_me: loading site script $ac_site_file" >&6;}
+    sed 's/^/| /' "$ac_site_file" >&5
+    . "$ac_site_file"
+  fi
+done
+
+if test -r "$cache_file"; then
+  # Only source regular files: some versions of bash fail to source
+  # special files such as /dev/null, so we avoid doing that.
+  if test -f "$cache_file"; then
+    { echo "$as_me:$LINENO: loading cache $cache_file" >&5
+echo "$as_me: loading cache $cache_file" >&6;}
+    case $cache_file in
+      [\\/]* | ?:[\\/]* ) . "$cache_file";;
+      *)                      . "./$cache_file";;
+    esac
+  fi
+else
+  { echo "$as_me:$LINENO: creating cache $cache_file" >&5
+echo "$as_me: creating cache $cache_file" >&6;}
+  >"$cache_file" # Quoted like every other use, so odd file names still work.
+fi
+
+# Check that the precious variables saved in the cache have kept the same
+# value.
+ac_cache_corrupted=false
+for ac_var in $ac_precious_vars; do
+  eval ac_old_set=\$ac_cv_env_${ac_var}_set
+  eval ac_new_set=\$ac_env_${ac_var}_set
+  eval ac_old_val=\$ac_cv_env_${ac_var}_value
+  eval ac_new_val=\$ac_env_${ac_var}_value
+  case $ac_old_set,$ac_new_set in
+    set,)
+      { echo "$as_me:$LINENO: error: \`$ac_var' was set to \`$ac_old_val' in the previous run" >&5
+echo "$as_me: error: \`$ac_var' was set to \`$ac_old_val' in the previous run" >&2;}
+      ac_cache_corrupted=: ;;
+    ,set)
+      { echo "$as_me:$LINENO: error: \`$ac_var' was not set in the previous run" >&5
+echo "$as_me: error: \`$ac_var' was not set in the previous run" >&2;}
+      ac_cache_corrupted=: ;;
+    ,);;
+    *)
+      if test "x$ac_old_val" != "x$ac_new_val"; then
+	{ echo "$as_me:$LINENO: error: \`$ac_var' has changed since the previous run:" >&5
+echo "$as_me: error: \`$ac_var' has changed since the previous run:" >&2;}
+	{ echo "$as_me:$LINENO:   former value:  $ac_old_val" >&5
+echo "$as_me:   former value:  $ac_old_val" >&2;}
+	{ echo "$as_me:$LINENO:   current value: $ac_new_val" >&5
+echo "$as_me:   current value: $ac_new_val" >&2;}
+	ac_cache_corrupted=:
+      fi;;
+  esac
+  # Pass precious variables to config.status.
+  if test "$ac_new_set" = set; then
+    case $ac_new_val in
+    *\'*) ac_arg=$ac_var=`echo "$ac_new_val" | sed "s/'/'\\\\\\\\''/g"` ;;
+    *) ac_arg=$ac_var=$ac_new_val ;;
+    esac
+    case " $ac_configure_args " in
+      *" '$ac_arg' "*) ;; # Avoid dups.  Use of quotes ensures accuracy.
+      *) ac_configure_args="$ac_configure_args '$ac_arg'" ;;
+    esac
+  fi
+done
+if $ac_cache_corrupted; then
+  { echo "$as_me:$LINENO: error: changes in the environment can compromise the build" >&5
+echo "$as_me: error: changes in the environment can compromise the build" >&2;}
+  { { echo "$as_me:$LINENO: error: run \`make distclean' and/or \`rm $cache_file' and start over" >&5
+echo "$as_me: error: run \`make distclean' and/or \`rm $cache_file' and start over" >&2;}
+   { (exit 1); exit 1; }; }
+fi
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ac_ext=c
+ac_cpp='$CPP $CPPFLAGS'
+ac_compile='$CC -c $CFLAGS $CPPFLAGS conftest.$ac_ext >&5'
+ac_link='$CC -o conftest$ac_exeext $CFLAGS $CPPFLAGS $LDFLAGS conftest.$ac_ext $LIBS >&5'
+ac_compiler_gnu=$ac_cv_c_compiler_gnu
+
+
+ac_config_headers="$ac_config_headers common/config.h"
+
+
+BUILD_PARSERS=true
+
+
+ac_ext=c
+ac_cpp='$CPP $CPPFLAGS'
+ac_compile='$CC -c $CFLAGS $CPPFLAGS conftest.$ac_ext >&5'
+ac_link='$CC -o conftest$ac_exeext $CFLAGS $CPPFLAGS $LDFLAGS conftest.$ac_ext $LIBS >&5'
+ac_compiler_gnu=$ac_cv_c_compiler_gnu
+if test -n "$ac_tool_prefix"; then
+  # Extract the first word of "${ac_tool_prefix}gcc", so it can be a program name with args.
+set dummy ${ac_tool_prefix}gcc; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_CC+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$CC"; then
+  ac_cv_prog_CC="$CC" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_CC="${ac_tool_prefix}gcc"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+CC=$ac_cv_prog_CC
+if test -n "$CC"; then
+  { echo "$as_me:$LINENO: result: $CC" >&5
+echo "${ECHO_T}$CC" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+fi
+if test -z "$ac_cv_prog_CC"; then
+  ac_ct_CC=$CC
+  # Extract the first word of "gcc", so it can be a program name with args.
+set dummy gcc; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_ac_ct_CC+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$ac_ct_CC"; then
+  ac_cv_prog_ac_ct_CC="$ac_ct_CC" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_ac_ct_CC="gcc"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+ac_ct_CC=$ac_cv_prog_ac_ct_CC
+if test -n "$ac_ct_CC"; then
+  { echo "$as_me:$LINENO: result: $ac_ct_CC" >&5
+echo "${ECHO_T}$ac_ct_CC" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+  if test "x$ac_ct_CC" = x; then
+    CC=""
+  else
+    case $cross_compiling:$ac_tool_warned in
+yes:)
+{ echo "$as_me:$LINENO: WARNING: In the future, Autoconf will not detect cross-tools
+whose name does not start with the host triplet.  If you think this
+configuration is useful to you, please write to autoconf@gnu.org." >&5
+echo "$as_me: WARNING: In the future, Autoconf will not detect cross-tools
+whose name does not start with the host triplet.  If you think this
+configuration is useful to you, please write to autoconf@gnu.org." >&2;}
+ac_tool_warned=yes ;;
+esac
+    CC=$ac_ct_CC
+  fi
+else
+  CC="$ac_cv_prog_CC"
+fi
+
+if test -z "$CC"; then
+          if test -n "$ac_tool_prefix"; then
+    # Extract the first word of "${ac_tool_prefix}cc", so it can be a program name with args.
+set dummy ${ac_tool_prefix}cc; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_CC+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$CC"; then
+  ac_cv_prog_CC="$CC" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_CC="${ac_tool_prefix}cc"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+CC=$ac_cv_prog_CC
+if test -n "$CC"; then
+  { echo "$as_me:$LINENO: result: $CC" >&5
+echo "${ECHO_T}$CC" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+  fi
+fi
+if test -z "$CC"; then
+  # CC is still empty: search $PATH for "cc" ("set dummy cc" leaves the bare program name in $2).
+set dummy cc; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_CC+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$CC"; then
+  ac_cv_prog_CC="$CC" # Let the user override the test.
+else
+  ac_prog_rejected=no
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    if test "$as_dir/$ac_word$ac_exec_ext" = "/usr/ucb/cc"; then
+       ac_prog_rejected=yes
+       continue
+     fi
+    ac_cv_prog_CC="cc"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+if test $ac_prog_rejected = yes; then
+  # /usr/ucb/cc was seen (and skipped) during the search, so make sure we never use it.
+  set dummy $ac_cv_prog_CC
+  shift
+  if test $# != 0; then
+    # A cc other than /usr/ucb/cc was selected.  It has the same basename,
+    # so the rejected one would be found first if CC were just "cc";
+    # store the full file name of the accepted program instead.
+    shift
+    ac_cv_prog_CC="$as_dir/$ac_word${1+' '}$@"
+  fi
+fi
+fi
+fi
+CC=$ac_cv_prog_CC
+if test -n "$CC"; then
+  { echo "$as_me:$LINENO: result: $CC" >&5
+echo "${ECHO_T}$CC" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+fi
+if test -z "$CC"; then
+  if test -n "$ac_tool_prefix"; then
+  for ac_prog in cl.exe
+  do
+    # Extract the first word of "$ac_tool_prefix$ac_prog", so it can be a program name with args.
+set dummy $ac_tool_prefix$ac_prog; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_CC+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$CC"; then
+  ac_cv_prog_CC="$CC" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_CC="$ac_tool_prefix$ac_prog"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+CC=$ac_cv_prog_CC
+if test -n "$CC"; then
+  { echo "$as_me:$LINENO: result: $CC" >&5
+echo "${ECHO_T}$CC" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+    test -n "$CC" && break
+  done
+fi
+if test -z "$CC"; then
+  ac_ct_CC=$CC
+  for ac_prog in cl.exe
+do
+  # Extract the first word of "$ac_prog", so it can be a program name with args.
+set dummy $ac_prog; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_ac_ct_CC+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$ac_ct_CC"; then
+  ac_cv_prog_ac_ct_CC="$ac_ct_CC" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_ac_ct_CC="$ac_prog"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+ac_ct_CC=$ac_cv_prog_ac_ct_CC
+if test -n "$ac_ct_CC"; then
+  { echo "$as_me:$LINENO: result: $ac_ct_CC" >&5
+echo "${ECHO_T}$ac_ct_CC" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+  test -n "$ac_ct_CC" && break
+done
+
+  if test "x$ac_ct_CC" = x; then
+    CC=""
+  else
+    case $cross_compiling:$ac_tool_warned in
+yes:)
+{ echo "$as_me:$LINENO: WARNING: In the future, Autoconf will not detect cross-tools
+whose name does not start with the host triplet.  If you think this
+configuration is useful to you, please write to autoconf@gnu.org." >&5
+echo "$as_me: WARNING: In the future, Autoconf will not detect cross-tools
+whose name does not start with the host triplet.  If you think this
+configuration is useful to you, please write to autoconf@gnu.org." >&2;}
+ac_tool_warned=yes ;;
+esac
+    CC=$ac_ct_CC
+  fi
+fi
+
+fi
+
+
+test -z "$CC" && { { echo "$as_me:$LINENO: error: no acceptable C compiler found in \$PATH
+See \`config.log' for more details." >&5
+echo "$as_me: error: no acceptable C compiler found in \$PATH
+See \`config.log' for more details." >&2;}
+   { (exit 1); exit 1; }; }
+
+# Log what the compiler reports for --version, -v and -V on fd 5; the exit statuses are not acted upon.
+echo "$as_me:$LINENO: checking for C compiler version" >&5
+ac_compiler=`set X $ac_compile; echo $2`
+{ (ac_try="$ac_compiler --version >&5"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compiler --version >&5") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }
+{ (ac_try="$ac_compiler -v >&5"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compiler -v >&5") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }
+{ (ac_try="$ac_compiler -V >&5"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compiler -V >&5") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }
+
+cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+ac_clean_files_save=$ac_clean_files
+ac_clean_files="$ac_clean_files a.out a.exe b.out"
+# First link without -o (ac_link_default is ac_link with its -o option
+# stripped), disregarding a.out.  This helps diagnose a broken compiler and
+# gives a first guess at the executable suffix (exeext).
+{ echo "$as_me:$LINENO: checking for C compiler default output file name" >&5
+echo $ECHO_N "checking for C compiler default output file name... $ECHO_C" >&6; }
+ac_link_default=`echo "$ac_link" | sed 's/ -o *conftest[^ ]*//'`
+#
+# Candidate output file names, most likely first.
+# The algorithm is not robust to junk in `.', so the wildcards (a.*,
+# conftest.*) come late in the list.  b.out is created by i960 compilers.
+ac_files='a_out.exe a.exe conftest.exe a.out conftest a.* conftest.* b.out'
+#
+# The IRIX 6 linker writes into existing files which may not be
+# executable, retaining their permissions.  Remove the candidates first
+# (except names matching the skipped suffixes) so a later execution test works.
+ac_rmfiles=
+for ac_file in $ac_files
+do
+  case $ac_file in
+    *.$ac_ext | *.xcoff | *.tds | *.d | *.pdb | *.xSYM | *.bb | *.bbg | *.map | *.inf | *.o | *.obj ) ;;
+    * ) ac_rmfiles="$ac_rmfiles $ac_file";;
+  esac
+done
+rm -f $ac_rmfiles
+
+if { (ac_try="$ac_link_default"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_link_default") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }; then
+  # Autoconf-2.13 could set the ac_cv_exeext variable to `no'.
+# So ignore a value of `no', otherwise this would lead to `EXEEXT = no'
+# in a Makefile.  We should not override ac_cv_exeext if it was cached,
+# so that the user can short-circuit this test for compilers unknown to
+# Autoconf.
+for ac_file in $ac_files ''
+do
+  test -f "$ac_file" || continue
+  case $ac_file in
+    *.$ac_ext | *.xcoff | *.tds | *.d | *.pdb | *.xSYM | *.bb | *.bbg | *.map | *.inf | *.o | *.obj )
+	;;
+    [ab].out )
+	# We found the default executable, but exeext='' is most
+	# certainly right.
+	break;;
+    *.* )
+        if test "${ac_cv_exeext+set}" = set && test "$ac_cv_exeext" != no;
+	then :; else
+	   ac_cv_exeext=`expr "$ac_file" : '[^.]*\(\..*\)'`
+	fi
+	# We set ac_cv_exeext here because the later test for it is not
+	# safe: cross compilers may not add the suffix if given an `-o'
+	# argument, so we may need to know it at that point already.
+	# Even if this section looks crufty: it has the advantage of
+	# actually working.
+	break;;
+    * )
+	break;;
+  esac
+done
+test "$ac_cv_exeext" = no && ac_cv_exeext=
+
+else
+  ac_file=''
+fi
+
+{ echo "$as_me:$LINENO: result: $ac_file" >&5
+echo "${ECHO_T}$ac_file" >&6; }
+if test -z "$ac_file"; then
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+{ { echo "$as_me:$LINENO: error: C compiler cannot create executables
+See \`config.log' for more details." >&5
+echo "$as_me: error: C compiler cannot create executables
+See \`config.log' for more details." >&2;}
+   { (exit 77); exit 77; }; }
+fi
+
+ac_exeext=$ac_cv_exeext
+
+# Check that the compiler produces executables we can run.  If it does not,
+# either the compiler is broken or we are cross compiling.
+{ echo "$as_me:$LINENO: checking whether the C compiler works" >&5
+echo $ECHO_N "checking whether the C compiler works... $ECHO_C" >&6; }
+# FIXME: These cross compiler hacks should be removed for Autoconf 3.0
+# Unless cross_compiling is already "yes", run ./$ac_file: success sets "no", failure turns "maybe" into "yes" and is fatal otherwise.
+if test "$cross_compiling" != yes; then
+  if { ac_try='./$ac_file'
+  { (case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_try") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }; }; then
+    cross_compiling=no
+  else
+    if test "$cross_compiling" = maybe; then
+	cross_compiling=yes
+    else
+	{ { echo "$as_me:$LINENO: error: cannot run C compiled programs.
+If you meant to cross compile, use \`--host'.
+See \`config.log' for more details." >&5
+echo "$as_me: error: cannot run C compiled programs.
+If you meant to cross compile, use \`--host'.
+See \`config.log' for more details." >&2;}
+   { (exit 1); exit 1; }; }
+    fi
+  fi
+fi
+{ echo "$as_me:$LINENO: result: yes" >&5
+echo "${ECHO_T}yes" >&6; }
+
+rm -f a.out a.exe conftest$ac_cv_exeext b.out
+ac_clean_files=$ac_clean_files_save
+# Report the cross_compiling value settled by the run test above;
+# nothing further is compiled or executed for this message.
+{ echo "$as_me:$LINENO: checking whether we are cross compiling" >&5
+echo $ECHO_N "checking whether we are cross compiling... $ECHO_C" >&6; }
+{ echo "$as_me:$LINENO: result: $cross_compiling" >&5
+echo "${ECHO_T}$cross_compiling" >&6; }
+
+{ echo "$as_me:$LINENO: checking for suffix of executables" >&5
+echo $ECHO_N "checking for suffix of executables... $ECHO_C" >&6; }
+if { (ac_try="$ac_link"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_link") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }; then
+  # `conftest.exe' is listed before `conftest': if both are `present' (well,
+# observable) the suffixed name is the one to record.  For instance with
+# Cygwin, `ls conftest' works (it refers to `conftest.exe') while
+# `rm conftest' does not.
+for ac_file in conftest.exe conftest conftest.*; do
+  test -f "$ac_file" || continue
+  case $ac_file in
+    *.$ac_ext | *.xcoff | *.tds | *.d | *.pdb | *.xSYM | *.bb | *.bbg | *.map | *.inf | *.o | *.obj ) ;;
+    *.* ) ac_cv_exeext=`expr "$ac_file" : '[^.]*\(\..*\)'`
+	  break;;
+    * ) break;;
+  esac
+done
+else
+  { { echo "$as_me:$LINENO: error: cannot compute suffix of executables: cannot compile and link
+See \`config.log' for more details." >&5
+echo "$as_me: error: cannot compute suffix of executables: cannot compile and link
+See \`config.log' for more details." >&2;}
+   { (exit 1); exit 1; }; }
+fi
+
+rm -f conftest$ac_cv_exeext
+{ echo "$as_me:$LINENO: result: $ac_cv_exeext" >&5
+echo "${ECHO_T}$ac_cv_exeext" >&6; }
+
+rm -f conftest.$ac_ext
+EXEEXT=$ac_cv_exeext
+ac_exeext=$EXEEXT
+{ echo "$as_me:$LINENO: checking for suffix of object files" >&5
+echo $ECHO_N "checking for suffix of object files... $ECHO_C" >&6; }
+if test "${ac_cv_objext+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.o conftest.obj
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }; then
+  for ac_file in conftest.o conftest.obj conftest.*; do
+  test -f "$ac_file" || continue;
+  case $ac_file in
+    *.$ac_ext | *.xcoff | *.tds | *.d | *.pdb | *.xSYM | *.bb | *.bbg | *.map | *.inf ) ;;
+    *) ac_cv_objext=`expr "$ac_file" : '.*\.\(.*\)'`
+       break;;
+  esac
+done
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+{ { echo "$as_me:$LINENO: error: cannot compute suffix of object files: cannot compile
+See \`config.log' for more details." >&5
+echo "$as_me: error: cannot compute suffix of object files: cannot compile
+See \`config.log' for more details." >&2;}
+   { (exit 1); exit 1; }; }
+fi
+
+rm -f conftest.$ac_cv_objext conftest.$ac_ext
+fi
+{ echo "$as_me:$LINENO: result: $ac_cv_objext" >&5
+echo "${ECHO_T}$ac_cv_objext" >&6; }
+OBJEXT=$ac_cv_objext
+ac_objext=$OBJEXT
+{ echo "$as_me:$LINENO: checking whether we are using the GNU C compiler" >&5
+echo $ECHO_N "checking whether we are using the GNU C compiler... $ECHO_C" >&6; }
+if test "${ac_cv_c_compiler_gnu+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+#ifndef __GNUC__
+       choke me
+#endif
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_c_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  ac_compiler_gnu=yes
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+	ac_compiler_gnu=no
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+ac_cv_c_compiler_gnu=$ac_compiler_gnu
+
+fi
+{ echo "$as_me:$LINENO: result: $ac_cv_c_compiler_gnu" >&5
+echo "${ECHO_T}$ac_cv_c_compiler_gnu" >&6; }
+GCC=`test $ac_compiler_gnu = yes && echo yes`
+ac_test_CFLAGS=${CFLAGS+set}
+ac_save_CFLAGS=$CFLAGS
+{ echo "$as_me:$LINENO: checking whether $CC accepts -g" >&5
+echo $ECHO_N "checking whether $CC accepts -g... $ECHO_C" >&6; }
+if test "${ac_cv_prog_cc_g+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  ac_save_c_werror_flag=$ac_c_werror_flag
+   ac_c_werror_flag=yes
+   ac_cv_prog_cc_g=no
+   CFLAGS="-g"
+   cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_c_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  ac_cv_prog_cc_g=yes
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+	CFLAGS=""
+      cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_c_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  :
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+	ac_c_werror_flag=$ac_save_c_werror_flag
+	 CFLAGS="-g"
+	 cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_c_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  ac_cv_prog_cc_g=yes
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+   ac_c_werror_flag=$ac_save_c_werror_flag
+fi
+{ echo "$as_me:$LINENO: result: $ac_cv_prog_cc_g" >&5
+echo "${ECHO_T}$ac_cv_prog_cc_g" >&6; }
+if test "$ac_test_CFLAGS" = set; then
+  CFLAGS=$ac_save_CFLAGS
+elif test $ac_cv_prog_cc_g = yes; then
+  if test "$GCC" = yes; then
+    CFLAGS="-g -O2"
+  else
+    CFLAGS="-g"
+  fi
+else
+  if test "$GCC" = yes; then
+    CFLAGS="-O2"
+  else
+    CFLAGS=
+  fi
+fi
+{ echo "$as_me:$LINENO: checking for $CC option to accept ISO C89" >&5
+echo $ECHO_N "checking for $CC option to accept ISO C89... $ECHO_C" >&6; }
+if test "${ac_cv_prog_cc_c89+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  ac_cv_prog_cc_c89=no
+ac_save_CC=$CC
+cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+#include <stdarg.h>
+#include <stdio.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+/* Most of the following tests are stolen from RCS 5.7's src/conf.sh.  */
+struct buf { int x; };
+FILE * (*rcsopen) (struct buf *, struct stat *, int);
+static char *e (p, i)
+     char **p;
+     int i;
+{
+  return p[i];
+}
+static char *f (char * (*g) (char **, int), char **p, ...)
+{
+  char *s;
+  va_list v;
+  va_start (v,p);
+  s = g (p, va_arg (v,int));
+  va_end (v);
+  return s;
+}
+
+/* OSF 4.0 Compaq cc is some sort of almost-ANSI by default.  It has
+   function prototypes and stuff, but not '\xHH' hex character constants.
+   These don't provoke an error unfortunately, instead are silently treated
+   as 'x'.  The following induces an error, until -std is added to get
+   proper ANSI mode.  Curiously '\x00'!='x' always comes out true, for an
+   array size at least.  It's necessary to write '\x00'==0 to get something
+   that's true only with -std.  */
+int osf4_cc_array ['\x00' == 0 ? 1 : -1];
+
+/* IBM C 6 for AIX is almost-ANSI by default, but it replaces macro parameters
+   inside strings and character constants.  */
+#define FOO(x) 'x'
+int xlc6_cc_array[FOO(a) == 'x' ? 1 : -1];
+
+int test (int i, double x);
+struct s1 {int (*f) (int a);};
+struct s2 {int (*f) (double a);};
+int pairnames (int, char **, FILE *(*)(struct buf *, struct stat *, int), int, int);
+int argc;
+char **argv;
+int
+main ()
+{
+return f (e, argv, 0) != argv[0]  ||  f (e, argv, 1) != argv[1];
+  ;
+  return 0;
+}
+_ACEOF
+for ac_arg in '' -qlanglvl=extc89 -qlanglvl=ansi -std \
+	-Ae "-Aa -D_HPUX_SOURCE" "-Xc -D__EXTENSIONS__"
+do
+  CC="$ac_save_CC $ac_arg"
+  rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_c_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  ac_cv_prog_cc_c89=$ac_arg
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+
+fi
+
+rm -f core conftest.err conftest.$ac_objext
+  test "x$ac_cv_prog_cc_c89" != "xno" && break
+done
+rm -f conftest.$ac_ext
+CC=$ac_save_CC
+
+fi
+# AC_CACHE_VAL
+case "x$ac_cv_prog_cc_c89" in
+  x)
+    { echo "$as_me:$LINENO: result: none needed" >&5
+echo "${ECHO_T}none needed" >&6; } ;;
+  xno)
+    { echo "$as_me:$LINENO: result: unsupported" >&5
+echo "${ECHO_T}unsupported" >&6; } ;;
+  *)
+    CC="$CC $ac_cv_prog_cc_c89"
+    { echo "$as_me:$LINENO: result: $ac_cv_prog_cc_c89" >&5
+echo "${ECHO_T}$ac_cv_prog_cc_c89" >&6; } ;;
+esac
+
+
+ac_ext=c
+ac_cpp='$CPP $CPPFLAGS'
+ac_compile='$CC -c $CFLAGS $CPPFLAGS conftest.$ac_ext >&5'
+ac_link='$CC -o conftest$ac_exeext $CFLAGS $CPPFLAGS $LDFLAGS conftest.$ac_ext $LIBS >&5'
+ac_compiler_gnu=$ac_cv_c_compiler_gnu
+
+cat >>confdefs.h <<_ACEOF
+#define CC $CC
+_ACEOF
+
+
+ac_ext=cpp
+ac_cpp='$CXXCPP $CPPFLAGS'
+ac_compile='$CXX -c $CXXFLAGS $CPPFLAGS conftest.$ac_ext >&5'
+ac_link='$CXX -o conftest$ac_exeext $CXXFLAGS $CPPFLAGS $LDFLAGS conftest.$ac_ext $LIBS >&5'
+ac_compiler_gnu=$ac_cv_cxx_compiler_gnu
+if test -z "$CXX"; then
+  if test -n "$CCC"; then
+    CXX=$CCC
+  else
+    if test -n "$ac_tool_prefix"; then
+  for ac_prog in g++ c++ gpp aCC CC cxx cc++ cl.exe FCC KCC RCC xlC_r xlC
+  do
+    # Extract the first word of "$ac_tool_prefix$ac_prog", so it can be a program name with args.
+set dummy $ac_tool_prefix$ac_prog; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_CXX+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$CXX"; then
+  ac_cv_prog_CXX="$CXX" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_CXX="$ac_tool_prefix$ac_prog"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+CXX=$ac_cv_prog_CXX
+if test -n "$CXX"; then
+  { echo "$as_me:$LINENO: result: $CXX" >&5
+echo "${ECHO_T}$CXX" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+    test -n "$CXX" && break
+  done
+fi
+if test -z "$CXX"; then
+  ac_ct_CXX=$CXX
+  for ac_prog in g++ c++ gpp aCC CC cxx cc++ cl.exe FCC KCC RCC xlC_r xlC
+do
+  # Extract the first word of "$ac_prog", so it can be a program name with args.
+set dummy $ac_prog; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_ac_ct_CXX+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$ac_ct_CXX"; then
+  ac_cv_prog_ac_ct_CXX="$ac_ct_CXX" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_ac_ct_CXX="$ac_prog"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+ac_ct_CXX=$ac_cv_prog_ac_ct_CXX
+if test -n "$ac_ct_CXX"; then
+  { echo "$as_me:$LINENO: result: $ac_ct_CXX" >&5
+echo "${ECHO_T}$ac_ct_CXX" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+  test -n "$ac_ct_CXX" && break
+done
+
+  if test "x$ac_ct_CXX" = x; then
+    CXX="g++"
+  else
+    case $cross_compiling:$ac_tool_warned in
+yes:)
+{ echo "$as_me:$LINENO: WARNING: In the future, Autoconf will not detect cross-tools
+whose name does not start with the host triplet.  If you think this
+configuration is useful to you, please write to autoconf@gnu.org." >&5
+echo "$as_me: WARNING: In the future, Autoconf will not detect cross-tools
+whose name does not start with the host triplet.  If you think this
+configuration is useful to you, please write to autoconf@gnu.org." >&2;}
+ac_tool_warned=yes ;;
+esac
+    CXX=$ac_ct_CXX
+  fi
+fi
+
+  fi
+fi
+# Log what the compiler reports for --version, -v and -V on fd 5; the exit statuses are not acted upon.
+echo "$as_me:$LINENO: checking for C++ compiler version" >&5
+ac_compiler=`set X $ac_compile; echo $2`
+{ (ac_try="$ac_compiler --version >&5"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compiler --version >&5") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }
+{ (ac_try="$ac_compiler -v >&5"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compiler -v >&5") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }
+{ (ac_try="$ac_compiler -V >&5"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compiler -V >&5") 2>&5
+  ac_status=$?
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); }
+
+{ echo "$as_me:$LINENO: checking whether we are using the GNU C++ compiler" >&5
+echo $ECHO_N "checking whether we are using the GNU C++ compiler... $ECHO_C" >&6; }
+if test "${ac_cv_cxx_compiler_gnu+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+#ifndef __GNUC__
+       choke me
+#endif
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_cxx_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  ac_compiler_gnu=yes
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+	ac_compiler_gnu=no
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+ac_cv_cxx_compiler_gnu=$ac_compiler_gnu
+
+fi
+{ echo "$as_me:$LINENO: result: $ac_cv_cxx_compiler_gnu" >&5
+echo "${ECHO_T}$ac_cv_cxx_compiler_gnu" >&6; }
+GXX=`test $ac_compiler_gnu = yes && echo yes`
+ac_test_CXXFLAGS=${CXXFLAGS+set}
+ac_save_CXXFLAGS=$CXXFLAGS
+{ echo "$as_me:$LINENO: checking whether $CXX accepts -g" >&5
+echo $ECHO_N "checking whether $CXX accepts -g... $ECHO_C" >&6; }
+if test "${ac_cv_prog_cxx_g+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  ac_save_cxx_werror_flag=$ac_cxx_werror_flag
+   ac_cxx_werror_flag=yes
+   ac_cv_prog_cxx_g=no
+   CXXFLAGS="-g"
+   cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_cxx_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  ac_cv_prog_cxx_g=yes
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+	CXXFLAGS=""
+      cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_cxx_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  :
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+	ac_cxx_werror_flag=$ac_save_cxx_werror_flag
+	 CXXFLAGS="-g"
+	 cat >conftest.$ac_ext <<_ACEOF
+/* confdefs.h.  */
+_ACEOF
+cat confdefs.h >>conftest.$ac_ext
+cat >>conftest.$ac_ext <<_ACEOF
+/* end confdefs.h.  */
+
+int
+main ()
+{
+
+  ;
+  return 0;
+}
+_ACEOF
+rm -f conftest.$ac_objext
+if { (ac_try="$ac_compile"
+case "(($ac_try" in
+  *\"* | *\`* | *\\*) ac_try_echo=\$ac_try;;
+  *) ac_try_echo=$ac_try;;
+esac
+eval "echo \"\$as_me:$LINENO: $ac_try_echo\"") >&5
+  (eval "$ac_compile") 2>conftest.er1
+  ac_status=$?
+  grep -v '^ *+' conftest.er1 >conftest.err
+  rm -f conftest.er1
+  cat conftest.err >&5
+  echo "$as_me:$LINENO: \$? = $ac_status" >&5
+  (exit $ac_status); } && {
+	 test -z "$ac_cxx_werror_flag" ||
+	 test ! -s conftest.err
+       } && test -s conftest.$ac_objext; then
+  ac_cv_prog_cxx_g=yes
+else
+  echo "$as_me: failed program was:" >&5
+sed 's/^/| /' conftest.$ac_ext >&5
+
+
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+fi
+
+rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
+   ac_cxx_werror_flag=$ac_save_cxx_werror_flag
+fi
+{ echo "$as_me:$LINENO: result: $ac_cv_prog_cxx_g" >&5
+echo "${ECHO_T}$ac_cv_prog_cxx_g" >&6; }
+if test "$ac_test_CXXFLAGS" = set; then
+  CXXFLAGS=$ac_save_CXXFLAGS
+elif test $ac_cv_prog_cxx_g = yes; then
+  if test "$GXX" = yes; then
+    CXXFLAGS="-g -O2"
+  else
+    CXXFLAGS="-g"
+  fi
+else
+  if test "$GXX" = yes; then
+    CXXFLAGS="-O2"
+  else
+    CXXFLAGS=
+  fi
+fi
+ac_ext=c
+ac_cpp='$CPP $CPPFLAGS'
+ac_compile='$CC -c $CFLAGS $CPPFLAGS conftest.$ac_ext >&5'
+ac_link='$CC -o conftest$ac_exeext $CFLAGS $CPPFLAGS $LDFLAGS conftest.$ac_ext $LIBS >&5'
+ac_compiler_gnu=$ac_cv_c_compiler_gnu
+
+cat >>confdefs.h <<_ACEOF
+#define CXX $CXX
+_ACEOF
+
+
+ac_ext=cpp
+ac_cpp='$CXXCPP $CPPFLAGS'
+ac_compile='$CXX -c $CXXFLAGS $CPPFLAGS conftest.$ac_ext >&5'
+ac_link='$CXX -o conftest$ac_exeext $CXXFLAGS $CPPFLAGS $LDFLAGS conftest.$ac_ext $LIBS >&5'
+ac_compiler_gnu=$ac_cv_cxx_compiler_gnu
+
+
+{ echo "$as_me:$LINENO: checking whether ${MAKE-make} sets \$(MAKE)" >&5
+echo $ECHO_N "checking whether ${MAKE-make} sets \$(MAKE)... $ECHO_C" >&6; }
+set x ${MAKE-make}; ac_make=`echo "$2" | sed 's/+/p/g; s/[^a-zA-Z0-9_]/_/g'`
+if { as_var=ac_cv_prog_make_${ac_make}_set; eval "test \"\${$as_var+set}\" = set"; }; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  cat >conftest.make <<\_ACEOF
+SHELL = /bin/sh
+all:
+	@echo '@@@%%%=$(MAKE)=@@@%%%'
+_ACEOF
+# GNU make sometimes prints "make[1]: Entering...", so the marker is matched anywhere in the output; ?* demands a non-empty $(MAKE).
+case `${MAKE-make} -f conftest.make 2>/dev/null` in
+  *@@@%%%=?*=@@@%%%*)
+    eval ac_cv_prog_make_${ac_make}_set=yes;;
+  *)
+    eval ac_cv_prog_make_${ac_make}_set=no;;
+esac
+rm -f conftest.make
+fi
+if eval test \$ac_cv_prog_make_${ac_make}_set = yes; then
+  { echo "$as_me:$LINENO: result: yes" >&5
+echo "${ECHO_T}yes" >&6; }
+  SET_MAKE=
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+  SET_MAKE="MAKE=${MAKE-make}"
+fi
+
+
+# Logging features (--disable-X or --enable-X=no leaves the feature off).
+# Check whether --enable-log was given.
+if test "${enable_log+set}" = set; then
+  enableval=$enable_log; test "x$enableval" = xno || cat >>confdefs.h <<\_ACEOF
+#define COLM_LOG 1
+_ACEOF
+
+fi
+
+# Check whether --enable-log-bytecode was given.
+if test "${enable_log_bytecode+set}" = set; then
+  enableval=$enable_log_bytecode; test "x$enableval" = xno || cat >>confdefs.h <<\_ACEOF
+#define COLM_LOG_BYTECODE 1
+_ACEOF
+
+fi
+
+# Check whether --enable-log-parse was given.
+if test "${enable_log_parse+set}" = set; then
+  enableval=$enable_log_parse; test "x$enableval" = xno || cat >>confdefs.h <<\_ACEOF
+#define COLM_LOG_PARSE 1
+_ACEOF
+
+fi
+
+# Check whether --enable-log-match was given.
+if test "${enable_log_match+set}" = set; then
+  enableval=$enable_log_match; test "x$enableval" = xno || cat >>confdefs.h <<\_ACEOF
+#define COLM_LOG_MATCH 1
+_ACEOF
+
+fi
+
+# Check whether --enable-log-compile was given.
+if test "${enable_log_compile+set}" = set; then
+  enableval=$enable_log_compile; test "x$enableval" = xno || cat >>confdefs.h <<\_ACEOF
+#define COLM_LOG_COMPILE 1
+_ACEOF
+
+fi
+
+
+if test $BUILD_PARSERS = true; then
+
+# Extract the first word of "ragel", so it can be a program name with args.
+set dummy ragel; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_RAGEL+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$RAGEL"; then
+  ac_cv_prog_RAGEL="$RAGEL" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_RAGEL="ragel"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+RAGEL=$ac_cv_prog_RAGEL
+if test -n "$RAGEL"; then
+  { echo "$as_me:$LINENO: result: $RAGEL" >&5
+echo "${ECHO_T}$RAGEL" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+if test -z "$RAGEL"; then
+	echo
+	echo "error: ragel is required to build the parsers"
+	echo
+	exit 1
+fi
+
+# Extract the first word of "kelbt", so it can be a program name with args.
+set dummy kelbt; ac_word=$2
+{ echo "$as_me:$LINENO: checking for $ac_word" >&5
+echo $ECHO_N "checking for $ac_word... $ECHO_C" >&6; }
+if test "${ac_cv_prog_KELBT+set}" = set; then
+  echo $ECHO_N "(cached) $ECHO_C" >&6
+else
+  if test -n "$KELBT"; then
+  ac_cv_prog_KELBT="$KELBT" # Let the user override the test.
+else
+as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  for ac_exec_ext in '' $ac_executable_extensions; do
+  if { test -f "$as_dir/$ac_word$ac_exec_ext" && $as_test_x "$as_dir/$ac_word$ac_exec_ext"; }; then
+    ac_cv_prog_KELBT="kelbt"
+    echo "$as_me:$LINENO: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+done
+IFS=$as_save_IFS
+
+fi
+fi
+KELBT=$ac_cv_prog_KELBT
+if test -n "$KELBT"; then
+  { echo "$as_me:$LINENO: result: $KELBT" >&5
+echo "${ECHO_T}$KELBT" >&6; }
+else
+  { echo "$as_me:$LINENO: result: no" >&5
+echo "${ECHO_T}no" >&6; }
+fi
+
+
+if test -z "$KELBT"; then
+	echo
+	echo "error: kelbt is required to build the parsers"
+	echo
+	exit 1
+fi
+
+fi # BUILD_PARSERS
+
+ac_config_files="$ac_config_files Makefile common/Makefile colm/Makefile"
+
+cat >confcache <<\_ACEOF
+# This file is a shell script that caches the results of configure
+# tests run on this system so they can be shared between configure
+# scripts and configure runs, see configure's option --config-cache.
+# It is not useful on other systems.  If it contains results you don't
+# want to keep, you may remove or edit it.
+#
+# config.status only pays attention to the cache file if you give it
+# the --recheck option to rerun configure.
+#
+# `ac_cv_env_foo' variables (set or unset) will be overridden when
+# loading this file, other *unset* `ac_cv_foo' will be assigned the
+# following values.
+
+_ACEOF
+
+# The following way of writing the cache mishandles newlines in values,
+# but we know of no workaround that is simple, portable, and efficient.
+# So, we kill variables containing newlines.
+# Ultrix sh set writes to stderr and can't be redirected directly,
+# and sets the high bit in the cache file unless we assign to the vars.
+(
+  for ac_var in `(set) 2>&1 | sed -n 's/^\([a-zA-Z_][a-zA-Z0-9_]*\)=.*/\1/p'`; do
+    eval ac_val=\$$ac_var
+    case $ac_val in #(
+    *${as_nl}*)
+      case $ac_var in #(
+      *_cv_*) { echo "$as_me:$LINENO: WARNING: Cache variable $ac_var contains a newline." >&5
+echo "$as_me: WARNING: Cache variable $ac_var contains a newline." >&2;} ;;
+      esac
+      case $ac_var in #(
+      _ | IFS | as_nl) ;; #(
+      *) $as_unset $ac_var ;;
+      esac ;;
+    esac
+  done
+
+  (set) 2>&1 |
+    case $as_nl`(ac_space=' '; set) 2>&1` in #(
+    *${as_nl}ac_space=\ *)
+      # `set' does not quote correctly, so add quotes (double-quote
+      # substitution turns \\\\ into \\, and sed turns \\ into \).
+      sed -n \
+	"s/'/'\\\\''/g;
+	  s/^\\([_$as_cr_alnum]*_cv_[_$as_cr_alnum]*\\)=\\(.*\\)/\\1='\\2'/p"
+      ;; #(
+    *)
+      # `set' quotes correctly as required by POSIX, so do not add quotes.
+      sed -n "/^[_$as_cr_alnum]*_cv_[_$as_cr_alnum]*=/p"
+      ;;
+    esac |
+    sort
+) |
+  sed '
+     /^ac_cv_env_/b end
+     t clear
+     :clear
+     s/^\([^=]*\)=\(.*[{}].*\)$/test "${\1+set}" = set || &/
+     t end
+     s/^\([^=]*\)=\(.*\)$/\1=${\1=\2}/
+     :end' >>confcache
+if diff "$cache_file" confcache >/dev/null 2>&1; then :; else
+  if test -w "$cache_file"; then
+    test "x$cache_file" != "x/dev/null" &&
+      { echo "$as_me:$LINENO: updating cache $cache_file" >&5
+echo "$as_me: updating cache $cache_file" >&6;}
+    cat confcache >$cache_file
+  else
+    { echo "$as_me:$LINENO: not updating unwritable cache $cache_file" >&5
+echo "$as_me: not updating unwritable cache $cache_file" >&6;}
+  fi
+fi
+rm -f confcache
+
+test "x$prefix" = xNONE && prefix=$ac_default_prefix
+# Let make expand exec_prefix.
+test "x$exec_prefix" = xNONE && exec_prefix='${prefix}'
+
+DEFS=-DHAVE_CONFIG_H
+
+ac_libobjs=
+ac_ltlibobjs=
+for ac_i in : $LIBOBJS; do test "x$ac_i" = x: && continue
+  # 1. Remove the extension, and $U if already installed.
+  ac_script='s/\$U\././;s/\.o$//;s/\.obj$//'
+  ac_i=`echo "$ac_i" | sed "$ac_script"`
+  # 2. Prepend LIBOBJDIR.  When used with automake>=1.10 LIBOBJDIR
+  #    will be set to the directory where LIBOBJS objects are built.
+  ac_libobjs="$ac_libobjs \${LIBOBJDIR}$ac_i\$U.$ac_objext"
+  ac_ltlibobjs="$ac_ltlibobjs \${LIBOBJDIR}$ac_i"'$U.lo'
+done
+LIBOBJS=$ac_libobjs
+
+LTLIBOBJS=$ac_ltlibobjs
+
+
+
+: ${CONFIG_STATUS=./config.status}
+ac_clean_files_save=$ac_clean_files
+ac_clean_files="$ac_clean_files $CONFIG_STATUS"
+{ echo "$as_me:$LINENO: creating $CONFIG_STATUS" >&5
+echo "$as_me: creating $CONFIG_STATUS" >&6;}
+cat >$CONFIG_STATUS <<_ACEOF
+#! $SHELL
+# Generated by $as_me.
+# Run this file to recreate the current configuration.
+# Compiler output produced by configure, useful for debugging
+# configure, is in config.log if it exists.
+
+debug=false
+ac_cs_recheck=false
+ac_cs_silent=false
+SHELL=\${CONFIG_SHELL-$SHELL}
+_ACEOF
+
+cat >>$CONFIG_STATUS <<\_ACEOF
+## --------------------- ##
+## M4sh Initialization.  ##
+## --------------------- ##
+
+# Be more Bourne compatible
+DUALCASE=1; export DUALCASE # for MKS sh
+if test -n "${ZSH_VERSION+set}" && (emulate sh) >/dev/null 2>&1; then
+  emulate sh
+  NULLCMD=:
+  # Zsh 3.x and 4.x performs word splitting on ${1+"$@"}, which
+  # is contrary to our usage.  Disable this feature.
+  alias -g '${1+"$@"}'='"$@"'
+  setopt NO_GLOB_SUBST
+else
+  case `(set -o) 2>/dev/null` in
+  *posix*) set -o posix ;;
+esac
+
+fi
+
+
+
+
+# PATH needs CR
+# Avoid depending upon Character Ranges.
+as_cr_letters='abcdefghijklmnopqrstuvwxyz'
+as_cr_LETTERS='ABCDEFGHIJKLMNOPQRSTUVWXYZ'
+as_cr_Letters=$as_cr_letters$as_cr_LETTERS
+as_cr_digits='0123456789'
+as_cr_alnum=$as_cr_Letters$as_cr_digits
+
+# The user is always right.
+if test "${PATH_SEPARATOR+set}" != set; then
+  echo "#! /bin/sh" >conf$$.sh
+  echo  "exit 0"   >>conf$$.sh
+  chmod +x conf$$.sh
+  if (PATH="/nonexistent;."; conf$$.sh) >/dev/null 2>&1; then
+    PATH_SEPARATOR=';'
+  else
+    PATH_SEPARATOR=:
+  fi
+  rm -f conf$$.sh
+fi
+
+# Support unset when possible.
+if ( (MAIL=60; unset MAIL) || exit) >/dev/null 2>&1; then
+  as_unset=unset
+else
+  as_unset=false
+fi
+
+
+# IFS
+# We need space, tab and new line, in precisely that order.  Quoting is
+# there to prevent editors from complaining about space-tab.
+# (If _AS_PATH_WALK were called with IFS unset, it would disable word
+# splitting by setting IFS to empty value.)
+as_nl='
+'
+IFS=" ""	$as_nl"
+
+# Find who we are.  Look in the path if we contain no directory separator.
+case $0 in
+  *[\\/]* ) as_myself=$0 ;;
+  *) as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+  test -r "$as_dir/$0" && as_myself=$as_dir/$0 && break
+done
+IFS=$as_save_IFS
+
+     ;;
+esac
+# We did not find ourselves, most probably we were run as `sh COMMAND'
+# in which case we are not to be found in the path.
+if test "x$as_myself" = x; then
+  as_myself=$0
+fi
+if test ! -f "$as_myself"; then
+  echo "$as_myself: error: cannot find myself; rerun with an absolute file name" >&2
+  { (exit 1); exit 1; }
+fi
+
+# Work around bugs in pre-3.0 UWIN ksh.
+for as_var in ENV MAIL MAILPATH
+do ($as_unset $as_var) >/dev/null 2>&1 && $as_unset $as_var
+done
+PS1='$ '
+PS2='> '
+PS4='+ '
+
+# NLS nuisances.
+for as_var in \
+  LANG LANGUAGE LC_ADDRESS LC_ALL LC_COLLATE LC_CTYPE LC_IDENTIFICATION \
+  LC_MEASUREMENT LC_MESSAGES LC_MONETARY LC_NAME LC_NUMERIC LC_PAPER \
+  LC_TELEPHONE LC_TIME
+do
+  if (set +x; test -z "`(eval $as_var=C; export $as_var) 2>&1`"); then
+    eval $as_var=C; export $as_var
+  else
+    ($as_unset $as_var) >/dev/null 2>&1 && $as_unset $as_var
+  fi
+done
+
+# Required to use basename.
+if expr a : '\(a\)' >/dev/null 2>&1 &&
+   test "X`expr 00001 : '.*\(...\)'`" = X001; then
+  as_expr=expr
+else
+  as_expr=false
+fi
+
+if (basename -- /) >/dev/null 2>&1 && test "X`basename -- / 2>&1`" = "X/"; then
+  as_basename=basename
+else
+  as_basename=false
+fi
+
+
+# Name of the executable.
+as_me=`$as_basename -- "$0" ||
+$as_expr X/"$0" : '.*/\([^/][^/]*\)/*$' \| \
+	 X"$0" : 'X\(//\)$' \| \
+	 X"$0" : 'X\(/\)' \| . 2>/dev/null ||
+echo X/"$0" |
+    sed '/^.*\/\([^/][^/]*\)\/*$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\/\(\/\/\)$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\/\(\/\).*/{
+	    s//\1/
+	    q
+	  }
+	  s/.*/./; q'`
+
+# CDPATH.
+$as_unset CDPATH
+
+
+
+  as_lineno_1=$LINENO
+  as_lineno_2=$LINENO
+  test "x$as_lineno_1" != "x$as_lineno_2" &&
+  test "x`expr $as_lineno_1 + 1`" = "x$as_lineno_2" || {
+
+  # Create $as_me.lineno as a copy of $as_myself, but with $LINENO
+  # uniformly replaced by the line number.  The first 'sed' inserts a
+  # line-number line after each line using $LINENO; the second 'sed'
+  # does the real work.  The second script uses 'N' to pair each
+  # line-number line with the line containing $LINENO, and appends
+  # trailing '-' during substitution so that $LINENO is not a special
+  # case at line end.
+  # (Raja R Harinath suggested sed '=', and Paul Eggert wrote the
+  # scripts with optimization help from Paolo Bonzini.  Blame Lee
+  # E. McMahon (1931-1989) for sed's syntax.  :-)
+  sed -n '
+    p
+    /[$]LINENO/=
+  ' <$as_myself |
+    sed '
+      s/[$]LINENO.*/&-/
+      t lineno
+      b
+      :lineno
+      N
+      :loop
+      s/[$]LINENO\([^'$as_cr_alnum'_].*\n\)\(.*\)/\2\1\2/
+      t loop
+      s/-\n.*//
+    ' >$as_me.lineno &&
+  chmod +x "$as_me.lineno" ||
+    { echo "$as_me: error: cannot create $as_me.lineno; rerun with a POSIX shell" >&2
+   { (exit 1); exit 1; }; }
+
+  # Don't try to exec as it changes $[0], causing all sort of problems
+  # (the dirname of $[0] is not the place where we might find the
+  # original and so on.  Autoconf is especially sensitive to this).
+  . "./$as_me.lineno"
+  # Exit status is that of the last command.
+  exit
+}
+
+
+if (as_dir=`dirname -- /` && test "X$as_dir" = X/) >/dev/null 2>&1; then
+  as_dirname=dirname
+else
+  as_dirname=false
+fi
+
+ECHO_C= ECHO_N= ECHO_T=
+case `echo -n x` in
+-n*)
+  case `echo 'x\c'` in
+  *c*) ECHO_T='	';;	# ECHO_T is single tab character.
+  *)   ECHO_C='\c';;
+  esac;;
+*)
+  ECHO_N='-n';;
+esac
+
+if expr a : '\(a\)' >/dev/null 2>&1 &&
+   test "X`expr 00001 : '.*\(...\)'`" = X001; then
+  as_expr=expr
+else
+  as_expr=false
+fi
+
+rm -f conf$$ conf$$.exe conf$$.file
+if test -d conf$$.dir; then
+  rm -f conf$$.dir/conf$$.file
+else
+  rm -f conf$$.dir
+  mkdir conf$$.dir
+fi
+echo >conf$$.file
+if ln -s conf$$.file conf$$ 2>/dev/null; then
+  as_ln_s='ln -s'
+  # ... but there are two gotchas:
+  # 1) On MSYS, both `ln -s file dir' and `ln file dir' fail.
+  # 2) DJGPP < 2.04 has no symlinks; `ln -s' creates a wrapper executable.
+  # In both cases, we have to default to `cp -p'.
+  ln -s conf$$.file conf$$.dir 2>/dev/null && test ! -f conf$$.exe ||
+    as_ln_s='cp -p'
+elif ln conf$$.file conf$$ 2>/dev/null; then
+  as_ln_s=ln
+else
+  as_ln_s='cp -p'
+fi
+rm -f conf$$ conf$$.exe conf$$.dir/conf$$.file conf$$.file
+rmdir conf$$.dir 2>/dev/null
+
+if mkdir -p . 2>/dev/null; then
+  as_mkdir_p=:
+else
+  test -d ./-p && rmdir ./-p
+  as_mkdir_p=false
+fi
+
+if test -x / >/dev/null 2>&1; then
+  as_test_x='test -x'
+else
+  if ls -dL / >/dev/null 2>&1; then
+    as_ls_L_option=L
+  else
+    as_ls_L_option=
+  fi
+  as_test_x='
+    eval sh -c '\''
+      if test -d "$1"; then
+        test -d "$1/.";
+      else
+	case $1 in
+        -*)set "./$1";;
+	esac;
+	case `ls -ld'$as_ls_L_option' "$1" 2>/dev/null` in
+	???[sx]*):;;*)false;;esac;fi
+    '\'' sh
+  '
+fi
+as_executable_p=$as_test_x
+
+# Sed expression to map a string onto a valid CPP name.
+as_tr_cpp="eval sed 'y%*$as_cr_letters%P$as_cr_LETTERS%;s%[^_$as_cr_alnum]%_%g'"
+
+# Sed expression to map a string onto a valid variable name.
+as_tr_sh="eval sed 'y%*+%pp%;s%[^_$as_cr_alnum]%_%g'"
+
+
+exec 6>&1
+
+# Save the log message, to keep $[0] and so on meaningful, and to
+# report actual input values of CONFIG_FILES etc. instead of their
+# values after options handling.
+ac_log="
+This file was extended by $as_me, which was
+generated by GNU Autoconf 2.61.  Invocation command line was
+
+  CONFIG_FILES    = $CONFIG_FILES
+  CONFIG_HEADERS  = $CONFIG_HEADERS
+  CONFIG_LINKS    = $CONFIG_LINKS
+  CONFIG_COMMANDS = $CONFIG_COMMANDS
+  $ $0 $@
+
+on `(hostname || uname -n) 2>/dev/null | sed 1q`
+"
+
+_ACEOF
+
+cat >>$CONFIG_STATUS <<_ACEOF
+# Files that config.status was made for.
+config_files="$ac_config_files"
+config_headers="$ac_config_headers"
+
+_ACEOF
+
+cat >>$CONFIG_STATUS <<\_ACEOF
+ac_cs_usage="\
+\`$as_me' instantiates files from templates according to the
+current configuration.
+
+Usage: $0 [OPTIONS] [FILE]...
+
+  -h, --help       print this help, then exit
+  -V, --version    print version number and configuration settings, then exit
+  -q, --quiet      do not print progress messages
+  -d, --debug      don't remove temporary files
+      --recheck    update $as_me by reconfiguring in the same conditions
+  --file=FILE[:TEMPLATE]
+		   instantiate the configuration file FILE
+  --header=FILE[:TEMPLATE]
+		   instantiate the configuration header FILE
+
+Configuration files:
+$config_files
+
+Configuration headers:
+$config_headers
+
+Report bugs to <bug-autoconf@gnu.org>."
+
+_ACEOF
+cat >>$CONFIG_STATUS <<_ACEOF
+ac_cs_version="\\
+config.status
+configured by $0, generated by GNU Autoconf 2.61,
+  with options \\"`echo "$ac_configure_args" | sed 's/^ //; s/[\\""\`\$]/\\\\&/g'`\\"
+
+Copyright (C) 2006 Free Software Foundation, Inc.
+This config.status script is free software; the Free Software Foundation
+gives unlimited permission to copy, distribute and modify it."
+
+ac_pwd='$ac_pwd'
+srcdir='$srcdir'
+_ACEOF
+
+cat >>$CONFIG_STATUS <<\_ACEOF
+# If no file are specified by the user, then we need to provide default
+# value.  By we need to know if files were specified by the user.
+ac_need_defaults=:
+while test $# != 0
+do
+  case $1 in
+  --*=*)
+    ac_option=`expr "X$1" : 'X\([^=]*\)='`
+    ac_optarg=`expr "X$1" : 'X[^=]*=\(.*\)'`
+    ac_shift=:
+    ;;
+  *)
+    ac_option=$1
+    ac_optarg=$2
+    ac_shift=shift
+    ;;
+  esac
+
+  case $ac_option in
+  # Handling of the options.
+  -recheck | --recheck | --rechec | --reche | --rech | --rec | --re | --r)
+    ac_cs_recheck=: ;;
+  --version | --versio | --versi | --vers | --ver | --ve | --v | -V )
+    echo "$ac_cs_version"; exit ;;
+  --debug | --debu | --deb | --de | --d | -d )
+    debug=: ;;
+  --file | --fil | --fi | --f )
+    $ac_shift
+    CONFIG_FILES="$CONFIG_FILES $ac_optarg"
+    ac_need_defaults=false;;
+  --header | --heade | --head | --hea )
+    $ac_shift
+    CONFIG_HEADERS="$CONFIG_HEADERS $ac_optarg"
+    ac_need_defaults=false;;
+  --he | --h)
+    # Conflict between --help and --header
+    { echo "$as_me: error: ambiguous option: $1
+Try \`$0 --help' for more information." >&2
+   { (exit 1); exit 1; }; };;
+  --help | --hel | -h )
+    echo "$ac_cs_usage"; exit ;;
+  -q | -quiet | --quiet | --quie | --qui | --qu | --q \
+  | -silent | --silent | --silen | --sile | --sil | --si | --s)
+    ac_cs_silent=: ;;
+
+  # This is an error.
+  -*) { echo "$as_me: error: unrecognized option: $1
+Try \`$0 --help' for more information." >&2
+   { (exit 1); exit 1; }; } ;;
+
+  *) ac_config_targets="$ac_config_targets $1"
+     ac_need_defaults=false ;;
+
+  esac
+  shift
+done
+
+ac_configure_extra_args=
+
+if $ac_cs_silent; then
+  exec 6>/dev/null
+  ac_configure_extra_args="$ac_configure_extra_args --silent"
+fi
+
+_ACEOF
+cat >>$CONFIG_STATUS <<_ACEOF
+if \$ac_cs_recheck; then
+  echo "running CONFIG_SHELL=$SHELL $SHELL $0 "$ac_configure_args \$ac_configure_extra_args " --no-create --no-recursion" >&6
+  CONFIG_SHELL=$SHELL
+  export CONFIG_SHELL
+  exec $SHELL "$0"$ac_configure_args \$ac_configure_extra_args --no-create --no-recursion
+fi
+
+_ACEOF
+cat >>$CONFIG_STATUS <<\_ACEOF
+exec 5>>config.log
+{
+  echo
+  sed 'h;s/./-/g;s/^.../## /;s/...$/ ##/;p;x;p;x' <<_ASBOX
+## Running $as_me. ##
+_ASBOX
+  echo "$ac_log"
+} >&5
+
+_ACEOF
+cat >>$CONFIG_STATUS <<_ACEOF
+_ACEOF
+
+cat >>$CONFIG_STATUS <<\_ACEOF
+
+# Handling of arguments.
+for ac_config_target in $ac_config_targets
+do
+  case $ac_config_target in
+    "common/config.h") CONFIG_HEADERS="$CONFIG_HEADERS common/config.h" ;;
+    "Makefile") CONFIG_FILES="$CONFIG_FILES Makefile" ;;
+    "common/Makefile") CONFIG_FILES="$CONFIG_FILES common/Makefile" ;;
+    "colm/Makefile") CONFIG_FILES="$CONFIG_FILES colm/Makefile" ;;
+
+  *) { { echo "$as_me:$LINENO: error: invalid argument: $ac_config_target" >&5
+echo "$as_me: error: invalid argument: $ac_config_target" >&2;}
+   { (exit 1); exit 1; }; };;
+  esac
+done
+
+
+# If the user did not use the arguments to specify the items to instantiate,
+# then the envvar interface is used.  Set only those that are not.
+# We use the long form for the default assignment because of an extremely
+# bizarre bug on SunOS 4.1.3.
+if $ac_need_defaults; then
+  test "${CONFIG_FILES+set}" = set || CONFIG_FILES=$config_files
+  test "${CONFIG_HEADERS+set}" = set || CONFIG_HEADERS=$config_headers
+fi
+
+# Have a temporary directory for convenience.  Make it in the build tree
+# simply because there is no reason against having it here, and in addition,
+# creating and moving files from /tmp can sometimes cause problems.
+# Hook for its removal unless debugging.
+# Note that there is a small window in which the directory will not be cleaned:
+# after its creation but before its name has been assigned to `$tmp'.
+$debug ||
+{
+  tmp=
+  trap 'exit_status=$?
+  { test -z "$tmp" || test ! -d "$tmp" || rm -fr "$tmp"; } && exit $exit_status
+' 0
+  trap '{ (exit 1); exit 1; }' 1 2 13 15
+}
+# Create a (secure) tmp directory for tmp files: try mktemp -d first, then
+# fall back to mkdir with a PID/$RANDOM name; both run under umask 077.
+{
+  tmp=`(umask 077 && mktemp -d "./confXXXXXX") 2>/dev/null` &&
+  test -n "$tmp" && test -d "$tmp"
+}  ||
+{
+  tmp=./conf$$-$RANDOM
+  (umask 077 && mkdir "$tmp")
+} ||
+{
+   echo "$as_me: cannot create a temporary directory in ." >&2
+   { (exit 1); exit 1; }
+}
+
+#
+# Set up the sed scripts for CONFIG_FILES section.
+#
+
+# No need to generate the scripts if there are no CONFIG_FILES.
+# This happens for instance when ./config.status config.h
+if test -n "$CONFIG_FILES"; then
+
+_ACEOF
+
+
+
+ac_delim='%!_!# '
+for ac_last_try in false false false false false :; do
+  cat >conf$$subs.sed <<_ACEOF
+SHELL!$SHELL$ac_delim
+PATH_SEPARATOR!$PATH_SEPARATOR$ac_delim
+PACKAGE_NAME!$PACKAGE_NAME$ac_delim
+PACKAGE_TARNAME!$PACKAGE_TARNAME$ac_delim
+PACKAGE_VERSION!$PACKAGE_VERSION$ac_delim
+PACKAGE_STRING!$PACKAGE_STRING$ac_delim
+PACKAGE_BUGREPORT!$PACKAGE_BUGREPORT$ac_delim
+exec_prefix!$exec_prefix$ac_delim
+prefix!$prefix$ac_delim
+program_transform_name!$program_transform_name$ac_delim
+bindir!$bindir$ac_delim
+sbindir!$sbindir$ac_delim
+libexecdir!$libexecdir$ac_delim
+datarootdir!$datarootdir$ac_delim
+datadir!$datadir$ac_delim
+sysconfdir!$sysconfdir$ac_delim
+sharedstatedir!$sharedstatedir$ac_delim
+localstatedir!$localstatedir$ac_delim
+includedir!$includedir$ac_delim
+oldincludedir!$oldincludedir$ac_delim
+docdir!$docdir$ac_delim
+infodir!$infodir$ac_delim
+htmldir!$htmldir$ac_delim
+dvidir!$dvidir$ac_delim
+pdfdir!$pdfdir$ac_delim
+psdir!$psdir$ac_delim
+libdir!$libdir$ac_delim
+localedir!$localedir$ac_delim
+mandir!$mandir$ac_delim
+DEFS!$DEFS$ac_delim
+ECHO_C!$ECHO_C$ac_delim
+ECHO_N!$ECHO_N$ac_delim
+ECHO_T!$ECHO_T$ac_delim
+LIBS!$LIBS$ac_delim
+build_alias!$build_alias$ac_delim
+host_alias!$host_alias$ac_delim
+target_alias!$target_alias$ac_delim
+BUILD_PARSERS!$BUILD_PARSERS$ac_delim
+CC!$CC$ac_delim
+CFLAGS!$CFLAGS$ac_delim
+LDFLAGS!$LDFLAGS$ac_delim
+CPPFLAGS!$CPPFLAGS$ac_delim
+ac_ct_CC!$ac_ct_CC$ac_delim
+EXEEXT!$EXEEXT$ac_delim
+OBJEXT!$OBJEXT$ac_delim
+CXX!$CXX$ac_delim
+CXXFLAGS!$CXXFLAGS$ac_delim
+ac_ct_CXX!$ac_ct_CXX$ac_delim
+SET_MAKE!$SET_MAKE$ac_delim
+RAGEL!$RAGEL$ac_delim
+KELBT!$KELBT$ac_delim
+LIBOBJS!$LIBOBJS$ac_delim
+LTLIBOBJS!$LTLIBOBJS$ac_delim
+_ACEOF
+
+  if test `sed -n "s/.*$ac_delim\$/X/p" conf$$subs.sed | grep -c X` = 53; then
+    break
+  elif $ac_last_try; then
+    { { echo "$as_me:$LINENO: error: could not make $CONFIG_STATUS" >&5
+echo "$as_me: error: could not make $CONFIG_STATUS" >&2;}
+   { (exit 1); exit 1; }; }
+  else
+    ac_delim="$ac_delim!$ac_delim _$ac_delim!! "
+  fi
+done
+
+ac_eof=`sed -n '/^CEOF[0-9]*$/s/CEOF/0/p' conf$$subs.sed`
+if test -n "$ac_eof"; then
+  ac_eof=`echo "$ac_eof" | sort -nru | sed 1q`
+  ac_eof=`expr $ac_eof + 1`
+fi
+
+cat >>$CONFIG_STATUS <<_ACEOF
+cat >"\$tmp/subs-1.sed" <<\CEOF$ac_eof
+/@[a-zA-Z_][a-zA-Z_0-9]*@/!b end
+_ACEOF
+sed '
+s/[,\\&]/\\&/g; s/@/@|#_!!_#|/g
+s/^/s,@/; s/!/@,|#_!!_#|/
+:n
+t n
+s/'"$ac_delim"'$/,g/; t
+s/$/\\/; p
+N; s/^.*\n//; s/[,\\&]/\\&/g; s/@/@|#_!!_#|/g; b n
+' >>$CONFIG_STATUS <conf$$subs.sed
+rm -f conf$$subs.sed
+cat >>$CONFIG_STATUS <<_ACEOF
+:end
+s/|#_!!_#|//g
+CEOF$ac_eof
+_ACEOF
+
+
+# VPATH may cause trouble with some makes, so we remove $(srcdir),
+# ${srcdir} and @srcdir@ from VPATH if srcdir is ".", strip leading and
+# trailing colons and then remove the whole line if VPATH becomes empty
+# (actually we leave an empty line to preserve line numbers).
+if test "x$srcdir" = x.; then
+  ac_vpsub='/^[	 ]*VPATH[	 ]*=/{
+s/:*\$(srcdir):*/:/
+s/:*\${srcdir}:*/:/
+s/:*@srcdir@:*/:/
+s/^\([^=]*=[	 ]*\):*/\1/
+s/:*$//
+s/^[^=]*=[	 ]*$//
+}'
+fi
+
+cat >>$CONFIG_STATUS <<\_ACEOF
+fi # test -n "$CONFIG_FILES"
+
+
+for ac_tag in  :F $CONFIG_FILES  :H $CONFIG_HEADERS
+do
+  case $ac_tag in
+  :[FHLC]) ac_mode=$ac_tag; continue;;
+  esac
+  case $ac_mode$ac_tag in
+  :[FHL]*:*);;
+  :L* | :C*:*) { { echo "$as_me:$LINENO: error: Invalid tag $ac_tag." >&5
+echo "$as_me: error: Invalid tag $ac_tag." >&2;}
+   { (exit 1); exit 1; }; };;
+  :[FH]-) ac_tag=-:-;;
+  :[FH]*) ac_tag=$ac_tag:$ac_tag.in;;
+  esac
+  ac_save_IFS=$IFS
+  IFS=:
+  set x $ac_tag
+  IFS=$ac_save_IFS
+  shift
+  ac_file=$1
+  shift
+
+  case $ac_mode in
+  :L) ac_source=$1;;
+  :[FH])
+    ac_file_inputs=
+    for ac_f
+    do
+      case $ac_f in
+      -) ac_f="$tmp/stdin";;
+      *) # Look for the file first in the build tree, then in the source tree
+	 # (if the path is not absolute).  The absolute path cannot be DOS-style,
+	 # because $ac_f cannot contain `:'.
+	 test -f "$ac_f" ||
+	   case $ac_f in
+	   [\\/$]*) false;;
+	   *) test -f "$srcdir/$ac_f" && ac_f="$srcdir/$ac_f";;
+	   esac ||
+	   { { echo "$as_me:$LINENO: error: cannot find input file: $ac_f" >&5
+echo "$as_me: error: cannot find input file: $ac_f" >&2;}
+   { (exit 1); exit 1; }; };;
+      esac
+      ac_file_inputs="$ac_file_inputs $ac_f"
+    done
+
+    # Let's still pretend it is `configure' which instantiates (i.e., don't
+    # use $as_me), people would be surprised to read:
+    #    /* config.h.  Generated by config.status.  */
+    configure_input="Generated from "`IFS=:
+	  echo $* | sed 's|^[^:]*/||;s|:[^:]*/|, |g'`" by configure."
+    if test x"$ac_file" != x-; then
+      configure_input="$ac_file.  $configure_input"
+      { echo "$as_me:$LINENO: creating $ac_file" >&5
+echo "$as_me: creating $ac_file" >&6;}
+    fi
+
+    case $ac_tag in
+    *:-:* | *:-) cat >"$tmp/stdin";;
+    esac
+    ;;
+  esac
+
+  ac_dir=`$as_dirname -- "$ac_file" ||
+$as_expr X"$ac_file" : 'X\(.*[^/]\)//*[^/][^/]*/*$' \| \
+	 X"$ac_file" : 'X\(//\)[^/]' \| \
+	 X"$ac_file" : 'X\(//\)$' \| \
+	 X"$ac_file" : 'X\(/\)' \| . 2>/dev/null ||
+echo X"$ac_file" |
+    sed '/^X\(.*[^/]\)\/\/*[^/][^/]*\/*$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\/\)[^/].*/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\/\)$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\).*/{
+	    s//\1/
+	    q
+	  }
+	  s/.*/./; q'`
+  { as_dir="$ac_dir"
+  case $as_dir in #(
+  -*) as_dir=./$as_dir;;
+  esac
+  test -d "$as_dir" || { $as_mkdir_p && mkdir -p "$as_dir"; } || {
+    as_dirs=
+    while :; do
+      case $as_dir in #(
+      *\'*) as_qdir=`echo "$as_dir" | sed "s/'/'\\\\\\\\''/g"`;; #(
+      *) as_qdir=$as_dir;;
+      esac
+      as_dirs="'$as_qdir' $as_dirs"
+      as_dir=`$as_dirname -- "$as_dir" ||
+$as_expr X"$as_dir" : 'X\(.*[^/]\)//*[^/][^/]*/*$' \| \
+	 X"$as_dir" : 'X\(//\)[^/]' \| \
+	 X"$as_dir" : 'X\(//\)$' \| \
+	 X"$as_dir" : 'X\(/\)' \| . 2>/dev/null ||
+echo X"$as_dir" |
+    sed '/^X\(.*[^/]\)\/\/*[^/][^/]*\/*$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\/\)[^/].*/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\/\)$/{
+	    s//\1/
+	    q
+	  }
+	  /^X\(\/\).*/{
+	    s//\1/
+	    q
+	  }
+	  s/.*/./; q'`
+      test -d "$as_dir" && break
+    done
+    test -z "$as_dirs" || eval "mkdir $as_dirs"
+  } || test -d "$as_dir" || { { echo "$as_me:$LINENO: error: cannot create directory $as_dir" >&5
+echo "$as_me: error: cannot create directory $as_dir" >&2;}
+   { (exit 1); exit 1; }; }; }
+  ac_builddir=.
+
+case "$ac_dir" in
+.) ac_dir_suffix= ac_top_builddir_sub=. ac_top_build_prefix= ;;
+*)
+  ac_dir_suffix=/`echo "$ac_dir" | sed 's,^\.[\\/],,'`
+  # A ".." for each directory in $ac_dir_suffix.
+  ac_top_builddir_sub=`echo "$ac_dir_suffix" | sed 's,/[^\\/]*,/..,g;s,/,,'`
+  case $ac_top_builddir_sub in
+  "") ac_top_builddir_sub=. ac_top_build_prefix= ;;
+  *)  ac_top_build_prefix=$ac_top_builddir_sub/ ;;
+  esac ;;
+esac
+ac_abs_top_builddir=$ac_pwd
+ac_abs_builddir=$ac_pwd$ac_dir_suffix
+# for backward compatibility:
+ac_top_builddir=$ac_top_build_prefix
+
+case $srcdir in
+  .)  # We are building in place.
+    ac_srcdir=.
+    ac_top_srcdir=$ac_top_builddir_sub
+    ac_abs_top_srcdir=$ac_pwd ;;
+  [\\/]* | ?:[\\/]* )  # Absolute name.
+    ac_srcdir=$srcdir$ac_dir_suffix;
+    ac_top_srcdir=$srcdir
+    ac_abs_top_srcdir=$srcdir ;;
+  *) # Relative name.
+    ac_srcdir=$ac_top_build_prefix$srcdir$ac_dir_suffix
+    ac_top_srcdir=$ac_top_build_prefix$srcdir
+    ac_abs_top_srcdir=$ac_pwd/$srcdir ;;
+esac
+ac_abs_srcdir=$ac_abs_top_srcdir$ac_dir_suffix
+
+
+  case $ac_mode in
+  :F)
+  #
+  # CONFIG_FILE
+  #
+
+_ACEOF
+
+cat >>$CONFIG_STATUS <<\_ACEOF
+# If the template does not know about datarootdir, expand it.
+# FIXME: This hack should be removed a few years after 2.60.
+ac_datarootdir_hack=; ac_datarootdir_seen=
+
+case `sed -n '/datarootdir/ {
+  p
+  q
+}
+/@datadir@/p
+/@docdir@/p
+/@infodir@/p
+/@localedir@/p
+/@mandir@/p
+' $ac_file_inputs` in
+*datarootdir*) ac_datarootdir_seen=yes;;
+*@datadir@*|*@docdir@*|*@infodir@*|*@localedir@*|*@mandir@*)
+  { echo "$as_me:$LINENO: WARNING: $ac_file_inputs seems to ignore the --datarootdir setting" >&5
+echo "$as_me: WARNING: $ac_file_inputs seems to ignore the --datarootdir setting" >&2;}
+_ACEOF
+cat >>$CONFIG_STATUS <<_ACEOF
+  ac_datarootdir_hack='
+  s&@datadir@&$datadir&g
+  s&@docdir@&$docdir&g
+  s&@infodir@&$infodir&g
+  s&@localedir@&$localedir&g
+  s&@mandir@&$mandir&g
+    s&\\\${datarootdir}&$datarootdir&g' ;;
+esac
+_ACEOF
+
+# Neutralize VPATH when `$srcdir' = `.'.
+# Shell code in configure.ac might set extrasub.
+# FIXME: do we really want to maintain this feature?
+cat >>$CONFIG_STATUS <<_ACEOF
+  sed "$ac_vpsub
+$extrasub
+_ACEOF
+cat >>$CONFIG_STATUS <<\_ACEOF
+:t
+/@[a-zA-Z_][a-zA-Z_0-9]*@/!b
+s&@configure_input@&$configure_input&;t t
+s&@top_builddir@&$ac_top_builddir_sub&;t t
+s&@srcdir@&$ac_srcdir&;t t
+s&@abs_srcdir@&$ac_abs_srcdir&;t t
+s&@top_srcdir@&$ac_top_srcdir&;t t
+s&@abs_top_srcdir@&$ac_abs_top_srcdir&;t t
+s&@builddir@&$ac_builddir&;t t
+s&@abs_builddir@&$ac_abs_builddir&;t t
+s&@abs_top_builddir@&$ac_abs_top_builddir&;t t
+$ac_datarootdir_hack
+" $ac_file_inputs | sed -f "$tmp/subs-1.sed" >$tmp/out
+
+test -z "$ac_datarootdir_hack$ac_datarootdir_seen" &&
+  { ac_out=`sed -n '/\${datarootdir}/p' "$tmp/out"`; test -n "$ac_out"; } &&
+  { ac_out=`sed -n '/^[	 ]*datarootdir[	 ]*:*=/p' "$tmp/out"`; test -z "$ac_out"; } &&
+  { echo "$as_me:$LINENO: WARNING: $ac_file contains a reference to the variable \`datarootdir'
+which seems to be undefined.  Please make sure it is defined." >&5
+echo "$as_me: WARNING: $ac_file contains a reference to the variable \`datarootdir'
+which seems to be undefined.  Please make sure it is defined." >&2;}
+
+  rm -f "$tmp/stdin"
+  case $ac_file in
+  -) cat "$tmp/out"; rm -f "$tmp/out";;
+  *) rm -f "$ac_file"; mv "$tmp/out" $ac_file;;
+  esac
+ ;;
+  :H)
+  #
+  # CONFIG_HEADER
+  #
+_ACEOF
+
+# Transform confdefs.h into a sed script `conftest.defines', that
+# substitutes the proper values into config.h.in to produce config.h.
+rm -f conftest.defines conftest.tail
+# First, append a space to every undef/define line, to ease matching.
+echo 's/$/ /' >conftest.defines
+# Then, protect against being on the right side of a sed subst, or in
+# an unquoted here document, in config.status.  If some macros were
+# called several times there might be several #defines for the same
+# symbol, which is useless.  But do not sort them, since the last
+# AC_DEFINE must be honored.
+ac_word_re=[_$as_cr_Letters][_$as_cr_alnum]*
+# These sed commands are passed to sed as "A NAME B PARAMS C VALUE D", where
+# NAME is the cpp macro being defined, VALUE is the value it is being given.
+# PARAMS is the parameter list in the macro definition--in most cases, it's
+# just an empty string.
+ac_dA='s,^\\([	 #]*\\)[^	 ]*\\([	 ]*'
+ac_dB='\\)[	 (].*,\\1define\\2'
+ac_dC=' '
+ac_dD=' ,'
+
+uniq confdefs.h |
+  sed -n '
+	t rset
+	:rset
+	s/^[	 ]*#[	 ]*define[	 ][	 ]*//
+	t ok
+	d
+	:ok
+	s/[\\&,]/\\&/g
+	s/^\('"$ac_word_re"'\)\(([^()]*)\)[	 ]*\(.*\)/ '"$ac_dA"'\1'"$ac_dB"'\2'"${ac_dC}"'\3'"$ac_dD"'/p
+	s/^\('"$ac_word_re"'\)[	 ]*\(.*\)/'"$ac_dA"'\1'"$ac_dB$ac_dC"'\2'"$ac_dD"'/p
+  ' >>conftest.defines
+
+# Remove the space that was appended to ease matching.
+# Then replace #undef with comments.  This is necessary, for
+# example, in the case of _POSIX_SOURCE, which is predefined and required
+# on some systems where configure will not decide to define it.
+# (The regexp can be short, since the line contains either #define or #undef.)
+echo 's/ $//
+s,^[	 #]*u.*,/* & */,' >>conftest.defines
+
+# Break up conftest.defines:
+ac_max_sed_lines=50
+
+# First sed command is:	 sed -f defines.sed $ac_file_inputs >"$tmp/out1"
+# Second one is:	 sed -f defines.sed "$tmp/out1" >"$tmp/out2"
+# Third one will be:	 sed -f defines.sed "$tmp/out2" >"$tmp/out1"
+# et cetera.
+ac_in='$ac_file_inputs'
+ac_out='"$tmp/out1"'
+ac_nxt='"$tmp/out2"'
+
+while :
+do
+  # Write a here document:
+    cat >>$CONFIG_STATUS <<_ACEOF
+    # First, check the format of the line:
+    cat >"\$tmp/defines.sed" <<\\CEOF
+/^[	 ]*#[	 ]*undef[	 ][	 ]*$ac_word_re[	 ]*\$/b def
+/^[	 ]*#[	 ]*define[	 ][	 ]*$ac_word_re[(	 ]/b def
+b
+:def
+_ACEOF
+  sed ${ac_max_sed_lines}q conftest.defines >>$CONFIG_STATUS
+  echo 'CEOF
+    sed -f "$tmp/defines.sed"' "$ac_in >$ac_out" >>$CONFIG_STATUS
+  ac_in=$ac_out; ac_out=$ac_nxt; ac_nxt=$ac_in
+  sed 1,${ac_max_sed_lines}d conftest.defines >conftest.tail
+  grep . conftest.tail >/dev/null || break
+  rm -f conftest.defines
+  mv conftest.tail conftest.defines
+done
+rm -f conftest.defines conftest.tail
+
+echo "ac_result=$ac_in" >>$CONFIG_STATUS
+cat >>$CONFIG_STATUS <<\_ACEOF
+  if test x"$ac_file" != x-; then
+    echo "/* $configure_input  */" >"$tmp/config.h"
+    cat "$ac_result" >>"$tmp/config.h"
+    if diff "$ac_file" "$tmp/config.h" >/dev/null 2>&1; then
+      { echo "$as_me:$LINENO: $ac_file is unchanged" >&5
+echo "$as_me: $ac_file is unchanged" >&6;}
+    else
+      rm -f "$ac_file"
+      mv "$tmp/config.h" "$ac_file"
+    fi
+  else
+    echo "/* $configure_input  */"
+    cat "$ac_result"
+  fi
+  rm -f "$tmp/out1" "$tmp/out2"  # both intermediate sed outputs, not "out12"
+ ;;
+
+
+  esac
+
+done # for ac_tag
+
+
+{ (exit 0); exit 0; }
+_ACEOF
+chmod +x $CONFIG_STATUS
+ac_clean_files=$ac_clean_files_save
+
+
+# configure is writing to config.log, and then calls config.status.
+# config.status does its own redirection, appending to config.log.
+# Unfortunately, on DOS this fails, as config.log is still kept open
+# by configure, so config.status won't be able to write to it; its
+# output is simply discarded.  So we exec the FD to /dev/null,
+# effectively closing config.log, so it can be properly (re)opened and
+# appended to by config.status.  When coming back to configure, we
+# need to make the FD available again.
+if test "$no_create" != yes; then
+  ac_cs_success=:
+  ac_config_status_args=
+  test "$silent" = yes &&
+    ac_config_status_args="$ac_config_status_args --quiet"
+  exec 5>/dev/null
+  $SHELL $CONFIG_STATUS $ac_config_status_args || ac_cs_success=false
+  exec 5>>config.log
+  # Use ||, not &&, to avoid exiting from the if with $? = 1, which
+  # would make configure fail if this is the last instruction.
+  $ac_cs_success || { (exit 1); exit 1; }
+fi
+
+
+echo "configuration of colm complete"
diff --git a/configure.in b/configure.in
new file mode 100644
index 00000000..9a4d827d
--- /dev/null
+++ b/configure.in
@@ -0,0 +1,79 @@
+dnl 
+dnl   Copyright 2001-2008 Adrian Thurston <thurston@cs.queensu.ca>
+dnl
+
+dnl   This file is part of Colm.
+dnl  
+dnl   Colm is free software; you can redistribute it and/or modify
+dnl   it under the terms of the GNU General Public License as published by
+dnl   the Free Software Foundation; either version 2 of the License, or
+dnl   (at your option) any later version.
+dnl   
+dnl   Colm is distributed in the hope that it will be useful,
+dnl   but WITHOUT ANY WARRANTY; without even the implied warranty of
+dnl   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+dnl   GNU General Public License for more details.
+dnl   
+dnl   You should have received a copy of the GNU General Public License
+dnl   along with Colm; if not, write to the Free Software
+dnl   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+  
+AC_INIT(colm/main.cpp)
+AC_CONFIG_HEADER(common/config.h)
+
+dnl Set to true if build system should generate parsers from ragel, kelbt, and
+dnl gperf sources. Set to false if generated files are included and not to be
+dnl built (production).
+AC_SUBST(BUILD_PARSERS,true)
+
+dnl Checks for programs.
+AC_PROG_CC
+AC_DEFINE_UNQUOTED(CC,$CC)
+
+dnl Checks for programs.
+AC_PROG_CXX
+AC_DEFINE_UNQUOTED(CXX,$CXX)
+
+dnl Set test on c++ compiler.
+AC_LANG_CPLUSPLUS
+
+dnl Check for definition of MAKE.
+AC_PROG_MAKE_SET
+
+# Logging features. The action also runs for --disable-*, so test $enableval.
+AC_ARG_ENABLE(log, "turn on logging", [test "x$enableval" = xno || AC_DEFINE(COLM_LOG)])
+AC_ARG_ENABLE(log-bytecode, "turns on bytecode logging",
+		[test "x$enableval" = xno || AC_DEFINE(COLM_LOG_BYTECODE)])
+AC_ARG_ENABLE(log-parse, "turns on parse logging",
+		[test "x$enableval" = xno || AC_DEFINE(COLM_LOG_PARSE)])
+AC_ARG_ENABLE(log-match, "turns on match logging",
+		[test "x$enableval" = xno || AC_DEFINE(COLM_LOG_MATCH)])
+AC_ARG_ENABLE(log-compile, "turns on compile logging",
+		[test "x$enableval" = xno || AC_DEFINE(COLM_LOG_COMPILE)])
+
+if test $BUILD_PARSERS = true; then
+
+dnl Check for Ragel
+AC_CHECK_PROG(RAGEL, ragel, ragel)
+if test -z "$RAGEL"; then
+	echo
+	echo "error: ragel is required to build the parsers"
+	echo
+	exit 1
+fi
+
+dnl Check for Kelbt
+AC_CHECK_PROG(KELBT, kelbt, kelbt)
+if test -z "$KELBT"; then
+	echo
+	echo "error: kelbt is required to build the parsers"
+	echo
+	exit 1
+fi
+
+fi # BUILD_PARSERS
+
+dnl write output files
+AC_OUTPUT(Makefile common/Makefile colm/Makefile)
+
+echo "configuration of colm complete"
diff --git a/test/Makefile b/test/Makefile
new file mode 100644
index 00000000..8e420541
--- /dev/null
+++ b/test/Makefile
@@ -0,0 +1,46 @@
+#
+#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+SUBDIRS = xml python http dns diff html cxx ruby
+
+all: $(BIN) $(SUBDIRS)
+
+# 'all' and the subdirectory names are commands here, not files to be built.
+.PHONY: all $(SUBDIRS)
+$(SUBDIRS):
+	@cd $@ && $(MAKE)
+
+$(BIN): %.bin: %.lm
+	../colm/colm $<
+
+# clean targets: one <dir>-clean per subdirectory, driven by 'clean'.
+
+CLEAN_SUBDIRS = $(SUBDIRS:%=%-clean)
+
+.PHONY: clean $(CLEAN_SUBDIRS)
+
+$(CLEAN_SUBDIRS):
+	@cd $(@:%-clean=%) && $(MAKE) clean
+
+clean: $(CLEAN_SUBDIRS)
+	rm -f *.cpp *.bin
diff --git a/test/backtrack1.lm b/test/backtrack1.lm
new file mode 100644
index 00000000..0f3d8e88
--- /dev/null
+++ b/test/backtrack1.lm
@@ -0,0 +1,24 @@
+# Token names.
+
+lex start
+{
+	literal '+', '*'
+	token number /[0-9]+/
+	ignore ws / [ \t\n]+ /
+}
+
+def F
+	[number '+']
+|	[number]
+|	[F '*' number]
+
+def E
+	[E '+' F]
+|	[F]
+
+def start 
+	[E]
+
+start S = parse start( stdin )
+start R = match S ~ 9 + 9
+print_xml( R )
diff --git a/test/backtrack2.lm b/test/backtrack2.lm
new file mode 100644
index 00000000..fc63c7a6
--- /dev/null
+++ b/test/backtrack2.lm
@@ -0,0 +1,24 @@
+
+# Token names.
+lex start
+{
+	token id /[a-z]+/
+	ignore ws /[ \t\n]+/
+}
+
+token bang1 /'!'/
+token bang2 /'!'/
+
+def one [bang1 id id id]
+
+def two [bang2 id id id id]
+
+def prods 
+	[one]
+|	[two]
+
+def start
+	[prods]
+
+start S = parse start( stdin )
+match S "!aa bb cc dd"
diff --git a/test/backtrack3.lm b/test/backtrack3.lm
new file mode 100644
index 00000000..1f5e6e81
--- /dev/null
+++ b/test/backtrack3.lm
@@ -0,0 +1,27 @@
+
+# Token names.
+lex start
+{
+	token number /[0-9]+/
+	token id /[a-z]+/
+	token string /'"' [^"]* '"'/
+	ignore ws / [ \t\n]+ /
+}
+
+def prefix [id]
+
+def choice1
+	[number number]
+|	[number]
+
+def choice2 
+	[string id]
+|	[number number]
+|	[id number]
+|	[number]
+
+def start 
+	[prefix choice1 choice2 string id id]
+	{
+		match lhs "id 77 88 \"hello\" dude dude"
+	}
diff --git a/test/btscan.in b/test/btscan.in
new file mode 100644
index 00000000..88cec9d5
--- /dev/null
+++ b/test/btscan.in
@@ -0,0 +1,2 @@
+!abb !abba !aab
+
diff --git a/test/btscan.lm b/test/btscan.lm
new file mode 100644
index 00000000..ac7914c2
--- /dev/null
+++ b/test/btscan.lm
@@ -0,0 +1,34 @@
+namespace r1
+{
+	lex r1
+	{
+		literal '!', 'a', 'b'
+		ignore /[ \n\t]+/
+	}
+
+	def line [ '!' 'a' 'b' 'b' 'a']
+}
+
+namespace r2
+{
+	lex r2
+	{
+		literal '!'
+		token id /[a-zA-Z_]+/
+		ignore /[ \n\t]+/
+	}
+
+	def line [ '!' id ]
+}
+
+def item 
+	[r1::line]
+|	[r2::line]
+
+def btscan 
+	[item*]
+
+btscan P = parse btscan( stdin )
+
+match P ~!abb !abba !aab
+print_xml(P)
diff --git a/test/constructex.in b/test/constructex.in
new file mode 100644
index 00000000..f458f2ad
--- /dev/null
+++ b/test/constructex.in
@@ -0,0 +1,3 @@
+<person name=adrian hometown=kingston>
+	<t1 foo=bar2 e=f></t2>
+</person>
\ No newline at end of file
diff --git a/test/constructex.lm b/test/constructex.lm
new file mode 100644
index 00000000..01d71f37
--- /dev/null
+++ b/test/constructex.lm
@@ -0,0 +1,37 @@
+lex start
+{
+	token id /[a-zA-Z_][a-zA-Z0-9_]*/
+	literal '=', '<', '>', '/'
+	ignore /[ \t\n\r\v]+/
+}
+
+def attr 
+	[id '=' id]
+
+def open_tag 
+	['<' id attr* '>']
+
+def close_tag
+	['<' '/' id '>']
+
+def tag 
+	[open_tag item* close_tag]
+
+def item
+	[tag]
+|	[id]
+
+tag PersonTag = parse tag( stdin )
+
+match PersonTag 
+	["<person name=" Val:id attr*">" item* "</person>"]
+
+tag NameTag1 = construct tag 
+	["<name type=person>" Val "</name>"]
+
+tag NameTag2 = construct tag 
+	"<name type=person>[Val]</name>"
+
+print( NameTag1, '\n' )
+print( NameTag2, '\n' )
+
diff --git a/test/counting1.in b/test/counting1.in
new file mode 100644
index 00000000..45eeecde
--- /dev/null
+++ b/test/counting1.in
@@ -0,0 +1 @@
+3 1 b c 1 1 0 3 a b c
diff --git a/test/counting1.lm b/test/counting1.lm
new file mode 100644
index 00000000..bd0154ec
--- /dev/null
+++ b/test/counting1.lm
@@ -0,0 +1,91 @@
+
+#
+# Regular Definitions
+#
+rl rl_ws /[ \t\n\r\v]+/
+rl rl_id /[a-zA-Z_][a-zA-Z0-9_]*/
+rl rl_num /[0-9]+/
+
+#
+# Tokens
+#
+
+lex start
+{
+	# Ignore whitespace.
+	ignore /rl_ws/
+
+	# Tokens. 
+	token id /rl_id/
+	token number /rl_num/
+}
+
+#
+# Global Data
+#
+
+global int target
+
+#
+# Productions
+#
+
+
+def get_target 
+	[number]
+	{
+		match lhs [Number:number]
+		target = Number.data.atoi()
+	}
+
+# Arbitrary item.
+def item 
+	[number]
+|	[id]
+
+# Type definition for the count_items nonterminal.
+def count_items
+	int count
+
+	# List production one. The condition stops the 
+	# greedy list when it has gone too far.
+	[count_items item]
+	{
+		# Pass up the data
+		lhs.count = r1.count + 1
+		if lhs.count > target {
+			reject
+		}
+	}
+
+	# List production two, the base.
+|	[]
+	{
+		lhs.count = 0
+	}
+
+# Wrapper which prevents short lists from getting through if the parser
+# encounters an error and needs to backtrack over a counted list.
+def counted_list
+	[get_target count_items]
+	{
+		if r2.count < target {
+			reject
+		}
+	}
+
+
+def start 
+	[counted_list*]
+	{
+		for List:counted_list in lhs {
+			match List [Count:number Items:count_items]
+			print( 'num items: ', Count.data.atoi(), '\n' )
+
+			int i = 1
+			for Item:item in Items {
+				print( '  item ', i,  ': ', Item, '\n' )
+				i = i + 1
+			}
+		}
+	}
diff --git a/test/counting2.lm b/test/counting2.lm
new file mode 100644
index 00000000..1044e5cb
--- /dev/null
+++ b/test/counting2.lm
@@ -0,0 +1,82 @@
+
+#
+# Regular Definitions
+#
+
+rl rl_ws /[ \t\n\r\v]+/
+rl rl_id /[a-zA-Z_][a-zA-Z0-9_]*/
+rl rl_num /[0-9]+/
+
+#
+# Tokens
+#
+
+lex start
+{
+	# Ignore whitespace.
+	ignore /rl_ws/
+
+	# Tokens. 
+	token id /rl_id/
+	token number /rl_num/
+}
+
+#
+# Productions
+#
+
+# Arbitrary item.
+def item
+	[id]
+|	[number]
+
+# List production one. The condition stops the 
+# greedy list when it has gone too far.
+def count_items
+	int target
+	int count
+
+	[count_items item]
+	{
+		# Pass up the data
+		lhs.target = r1.target
+		lhs.count = r1.count + 1
+
+		if lhs.count > lhs.target {
+			reject
+		}
+	}
+
+	# List production two, the base.
+|	[number]
+	{
+		match lhs [Number:number]
+		lhs.target = Number.data.atoi()
+		lhs.count = 0
+	}
+		
+
+# Wrapper which prevents short lists from getting through if the parser
+# encounters an error and needs to backtrack over a counted list.
+def counted_list
+	[count_items]
+	{
+		if r1.count < r1.target {
+			reject
+		}
+	}
+
+def start 
+	[counted_list*]
+	{
+		for List:counted_list in lhs {
+			match List [CountItems:count_items]
+			print( 'num items: ', CountItems.target, '\n' )
+
+			int i = 1
+			for Item:item in CountItems {
+				print( '  item ', i, ': ', Item, '\n' )
+				i = i + 1
+			}
+		}
+	}
diff --git a/test/counting3.lm b/test/counting3.lm
new file mode 100644
index 00000000..d925b732
--- /dev/null
+++ b/test/counting3.lm
@@ -0,0 +1,92 @@
+
+#
+# Regular Definitions
+#
+rl rl_ws /[ \t\n\r\v]+/
+rl rl_id /[a-zA-Z_][a-zA-Z0-9_]*/
+rl rl_num /[0-9]+/
+
+#
+# Tokens
+#
+
+lex start
+{
+	# Ignore whitespace.
+	ignore /rl_ws/
+
+	literal ';'
+
+	# Tokens. 
+	token id /rl_id/
+	token number /rl_num/
+}
+
+#
+# Global Data
+#
+
+global int target
+global int count
+
+#
+# Productions
+#
+
+
+def get_target 
+	[number]
+	{
+		count = 0
+		target = r1.data.atoi()
+		print( 'target: ', target, '\n' )
+	}
+
+# Arbitrary item.
+def item 
+	[number]
+|	[id]
+
+def count_items 
+	[one_item count_items]
+|	[]
+
+def one_item 
+	[item]
+	{
+		count = count + 1
+		if count > target {
+			reject
+		} 
+		print( 'ITEM\n' )
+	}
+
+
+# Wrapper which prevents short lists from getting through if the parser
+# encounters an error and needs to backtrack over a counted list.
+def counted_list 
+	[get_target count_items]
+	{
+		print( 'trying: ', count, ' for: ', target, '\n' )
+		if count < target {
+			reject
+		}
+	}
+
+
+def start 
+	[counted_list*]
+	{
+
+		for List:counted_list in lhs {
+			match List [Count:number Items:count_items]
+			print( 'num items: ', Count.data.atoi(), '\n' )
+
+			int i = 1
+			for Item:item in Items {
+				print( '  item ', i, ': ', Item, '\n' )
+				i = i + 1
+			}
+		}
+		print( '*** SUCCESS ***\n' )
+	}
diff --git a/test/counting4.lm b/test/counting4.lm
new file mode 100644
index 00000000..b1a75130
--- /dev/null
+++ b/test/counting4.lm
@@ -0,0 +1,89 @@
+
+#
+# Regular Definitions
+#
+rl rl_ws /[ \t\n\r\v]+/
+rl rl_id /[a-zA-Z_][a-zA-Z0-9_]*/
+rl rl_num /[0-9]+/
+
+#
+# Tokens
+#
+
+lex start
+{
+	# Ignore whitespace.
+	ignore /rl_ws/
+
+	literal ';'
+
+	# Tokens. 
+	token id /rl_id/
+	token number /rl_num/
+}
+
+#
+# Global Data
+#
+
+global int target
+global int count
+
+#
+# Productions
+#
+
+
+def get_target 
+	[number]
+	{
+		count = 0
+		target = r1.data.atoi()
+		print( 'target: ', target, '\n' )
+	}
+
+# Arbitrary item.
+def item 
+	[number]
+|	[id]
+
+def count_items 
+	[count_inc item count_items]
+|	[count_end]
+
+def count_inc 
+	[]
+	{
+		if count < target
+			count = count + 1
+		else
+			reject
+	}
+
+def count_end
+	[]
+	{
+		if count < target
+			reject
+	}
+
+def counted_list 
+	[get_target count_items]
+
+def start 
+	[counted_list*]
+	{
+		for List:counted_list in lhs {
+			match List [Count:number Items:count_items]
+			print( 'num items: ', Count.data.atoi(), '\n' )
+
+			int i = 1
+			for Item:item in Items {
+				print( '  item ', i, ': ', Item, '\n' )
+				i = i + 1
+			}
+		}
+		print( '*** SUCCESS ***\n' )
+	}
+
+parse start(stdin)
diff --git a/test/cxx/Makefile b/test/cxx/Makefile
new file mode 100644
index 00000000..a775f8c7
--- /dev/null
+++ b/test/cxx/Makefile
@@ -0,0 +1,34 @@
+#
+#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+.PHONY: all clean
+all: $(BIN)
+
+$(BIN): $(COLM)
+$(BIN): %.bin: %.lm
+	$(COLM) $<
+
+clean:
+	rm -f cxx.cpp *.bin
diff --git a/test/cxx/cxx.lm b/test/cxx/cxx.lm
new file mode 100644
index 00000000..560bfde2
--- /dev/null
+++ b/test/cxx/cxx.lm
@@ -0,0 +1,2163 @@
+#
+# Data types for global data.
+#
+
+# Map definition
+map object_map [str object_list]
+
+# Language objects. 
+def lang_object
+	int typeId
+	str name
+
+	# If the object is a typedef, this points to the real object.
+	ptr lang_object typedefOf
+
+	object_map objectMap
+	object_list inherited
+	ptr lang_object lookupParent
+	ptr lang_object specializationOf
+	[]
+
+# This structure is used to keep track of information necessary to make a
+# declaration. While parsing a declaration it records the declaration's
+# attributes.
+def declaration_data
+	int isTypedef
+	int isFriend
+	int isTemplate
+
+	ptr lang_object typeObj
+	[]
+
+def declarator_data
+	ptr lang_object qualObj
+	ptr lang_object pdcScope
+	ptr lang_object lookupObj
+	[]
+
+list declaration_data_list [declaration_data]
+list declarator_data_list [declarator_data]
+
+# Constants for language object types.
+global int NamespaceType = typeid namespace_id
+global int ClassType = typeid class_id
+global int TemplateClassType = typeid templ_class_id
+global int EnumType = typeid enum_id
+global int IdType = typeid identifier
+global int TypedefType = typeid typedef_id
+global int TemplateIdType = typeid template_id
+
+# Object stack definition. Uses references to objects.
+list object_list [ptr lang_object]
+
+# Stack of integers.
+list int_stack [int]
+
+#
+# Global data declarations
+#
+
+# Object stacks.
+global object_list curNamespace = construct object_list []
+global object_list declNs = construct object_list []
+global object_list lookupNs = construct object_list []
+global object_list qualNs = construct object_list []
+global object_list templateParamNs = construct object_list []
+
+# Declaration, declarator data.
+global declaration_data_list declarationData = construct declaration_data_list []
+global declarator_data_list declaratorData = construct declarator_data_list []
+
+# Template declarations
+global int_stack templDecl = construct int_stack []
+
+# Root namespace object
+global ptr lang_object rootNamespace = createLangObject( NamespaceType, 
+		'<root_namespace>', nil )
+
+# Initialize the namespace and declaration stacks with the root namespace
+curNamespace.push( rootNamespace )
+declNs.push( rootNamespace )
+lookupNs.push( rootNamespace )
+
+# Start with no qualification (note variables are initialized to zero)
+qualNs.push( nil )
+
+templDecl.push( 0 )
+declarationData.push( construct declaration_data( 
+		isTypedef: 0, isFriend: 0, isTemplate: 0 ) [] )
+
+#
+# Identifier lookup.
+#
+
+# Lookup the token in the members of an object.
+ptr lang_object lookupInObject( ptr lang_object obj, str name )
+{
+	# LOG print( '  looking in ', obj->name, '\n' )
+
+	# The object map files a list of objects under each name; use its head.
+	object_list declared = obj->objectMap.find( name )
+	if !declared
+		return nil
+
+	# LOG print( '  * found an object: ', declared.head, '\n' )
+	return declared.head
+}
+
+# Lookup in an object and all the objects beneath it in the inheritance
+# tree.
+ptr lang_object lookupWithInheritance( ptr lang_object obj, str name )
+{
+	# Names declared directly in obj win over anything inherited.
+	ptr lang_object result = lookupInObject( obj, name )
+	if result
+		return result
+
+	# Visit each inherited object in list order, recursing into it.
+	object_list inheritedObjs = obj->inherited
+	for InhIter: ptr lang_object in inheritedObjs {
+		ptr lang_object inhObj = InhIter
+		# The name may denote the inherited class itself.
+		if inhObj->typeId == ClassType && inhObj->name == name {
+			# LOG print( '  * found a class name\n' )
+			return inhObj
+		}
+
+		# Failing that, search what the inherited object declares or inherits.
+		result = lookupWithInheritance( inhObj, name )
+		if result
+			return result
+	}
+
+	return nil
+}
+
+ptr lang_object unqualifiedLookup( str name )
+{
+	ptr lang_object result
+
+	# The template parameter scopes are consulted first, via rev_child.
+	object_list paramScopes = templateParamNs
+	for ScopeIter: ptr lang_object in rev_child(paramScopes) {
+		result = lookupWithInheritance( ScopeIter, name )
+		if result
+			break
+	}
+	if result
+		return result
+
+	# Otherwise begin at the top of the lookup stack and climb through the
+	# lookup parents until the name resolves or the chain runs out.
+	ptr lang_object curScope = lookupNs.top
+	while curScope {
+		result = lookupWithInheritance( curScope, name )
+		if result
+			break
+		curScope = curScope->lookupParent
+	}
+
+	return result
+}
+
+# The C++ scanner.
+lex start
+{
+	rl fract_const / digit* '.' digit+ | digit+ '.' /
+	rl exponent / [eE] [+\-]? digit+ /
+	rl float_suffix / [flFL] /
+
+	# Single and double literals.
+	token TK_SingleLit /( 'L'? "'" ( [^'\\\n] | '\\' any )* "'" )/
+	token TK_DoubleLit /( 'L'? '"' ( [^"\\\n] | '\\' any )* '"' )/
+
+	literal 'extern', 'namespace', 'friend', 'typedef', 'auto', 'register',
+			'static', 'mutable', 'inline', 'virtual', 'explicit', 'const',
+			'volatile', 'restrict', 'class', 'struct', 'union', 'template',
+			'private', 'protected', 'public', 'using', 'void', 'char',
+			'wchar_t', 'bool', 'int', 'float', 'double', 'short', 'long',
+			'signed', 'unsigned', 'enum', 'new', 'delete', 'operator',
+			'typename', 'export', 'throw', 'try', 'catch', 'sizeof',
+			'dynamic_cast', 'static_cast', 'reinterpret_cast', 'const_cast',
+			'typeid', 'this', 'true', 'false', 'switch', 'case', 'default',
+			'if', 'else', 'while', 'do', 'for', 'break', 'continue',
+			'return', 'goto'
+
+	literal '__typeof'
+
+	literal '{', '}', ';', ',', '=', '(', ')', ':', '&', '*', '[', ']', '~', '+', '-',
+		'/', '<', '>', '|', '^', '%', '!', '?', '.'
+
+	literal '::', '==', '!=', '&&', '||', '*=', '/=', '%=', '+=', '-=', '&=',
+		'^=', '|=', '++', '--', '->', '->*', '.*', '...', '<<=', '>>='
+
+	# Token translation targets.
+	def unknown_id [lookup_id]
+	def class_id [lookup_id]
+	def namespace_id [lookup_id]
+	def templ_class_id [lookup_id]
+	def enum_id [lookup_id]
+	def typedef_id [lookup_id]
+	def identifier [lookup_id]
+	def template_id [lookup_id]
+
+	# Identifiers
+	token lookup_id 
+		ptr lang_object obj
+		ptr lang_object qualObj
+
+		/( [a-zA-Z_] [a-zA-Z0-9_]* )/
+		{
+			str name = match_text
+			ptr lang_object found = nil
+			ptr lang_object qualObj = nil
+			if qualNs.top {
+				# LOG print( 'qualified lookup of ', name, '\n' )
+
+				# Transfer the qualification to the token and reset it.
+				qualObj = qualNs.top
+				qualNs.top = nil
+
+				# Look up using the qualification.
+				found = lookupWithInheritance( qualObj, name )
+			}
+			else {
+				# No qualification, full search.
+				# LOG print( 'unqualified lookup of ', name, '\n' )
+				found = unqualifiedLookup( name )
+			}
+
+			# With no match the token is sent as an unknown_id.
+			int id = typeid unknown_id
+			if found
+				id = found->typeId
+			# Build the lookup_id token (presumably filling obj and qualObj) and send it typed as id.
+			any LookupId = make_token( typeid lookup_id, 
+					pull(stdin, match_length), found, qualObj )
+			send( make_tree( id, LookupId ) )
+
+		}
+
+	# Floats.
+	token TK_Float /( fract_const exponent? float_suffix? |
+		digit+ exponent float_suffix? )/
+
+	# Integer decimal. Leading part buffered by float.
+	token TK_IntegerDecimal /( ( '0' | [1-9] [0-9]* ) [ulUL]{0,3} )/
+
+	# Integer octal. Leading part buffered by float.
+	token TK_IntegerOctal /( '0' [0-9]+ [ulUL]{0,2} )/
+
+	# Integer hex. Leading 0 buffered by float.
+	token TK_IntegerHex /( '0x' [0-9a-fA-F]+ [ulUL]{0,2} )/
+
+	# Preprocessor line.
+	ignore /'#' [^\n]* '\n'/
+
+	# Comments and whitespace.
+	ignore /( '/*' (any | '\n')* :>> '*/' )/
+	ignore /( '//' any* :> '\n' )/
+	ignore /( any - 33..126 )+/
+}
+
+#
+# Support functions
+#
+
+ptr lang_object createLangObject( int typeId, str name, ptr lang_object lookupParent )
+{
+	ptr lang_object obj = new construct lang_object(
+			typeId: typeId, 
+			name: name,
+			objectMap: construct object_map [],
+			inherited: construct object_list [],
+			lookupParent: lookupParent ) []
+	return obj
+}
+
+# Building the language object tree.
+int insertObject( ptr lang_object definedIn, str name, ptr lang_object obj )
+{
+	# Append obj to the list filed under name in definedIn, starting a new
+	# list on first use, then store the extended list back under that name.
+	object_list declared = definedIn->objectMap.find( name )
+	if !declared
+		declared = construct object_list []
+	declared.append( obj )
+	definedIn->objectMap.store( name, declared )
+}
+
+ptr lang_object findClass( ptr lang_object inObj, str name )
+{
+	# Return the first object filed under name whose type is ClassType.
+	object_list declared = inObj->objectMap.find( name )
+	if !declared
+		return nil
+	for DeclIter: ptr lang_object in declared {
+		ptr lang_object candidate = DeclIter
+		if candidate->typeId == ClassType
+			return candidate
+	}
+	return nil
+}
+
+ptr lang_object findTemplateClass( ptr lang_object inObj, str name )
+{
+	object_list declared = inObj->objectMap.find( name )
+	if !declared
+		return nil
+	for DeclIter: ptr lang_object in declared {
+		ptr lang_object candidate = DeclIter
+		if candidate->typeId == TemplateClassType
+			return candidate
+	}
+	return nil
+}
+
+def root_qual_opt 
+	[]
+|	['::']
+
+def nested_name_specifier_opt 
+	[nested_name_specifier_opt qualifying_name '::' designated_qualifying_name '::']
+|	[nested_name_specifier_opt qualifying_name '::']
+|	[]
+
+def nested_name_specifier 
+	[nested_name_specifier designated_qualifying_name '::']
+|	[nested_name_specifier qualifying_name '::']
+|	[qualifying_name '::']
+
+def qualifying_name 
+	[class_name]
+	{
+		qualNs.top = r1.lookupId.obj
+	}
+
+|	[namespace_id]
+	{
+		match r1 [Id: lookup_id]
+		qualNs.top = Id.obj
+	}
+
+|	[typedef_id]
+	{
+		match r1 [Id: lookup_id]
+		qualNs.top = Id.obj->typedefOf
+	}
+
+def designated_qualifying_name 
+	['template' any_id]
+	{
+		# FIXME: nulling qualNs is not the right thing to do here.
+		qualNs.top = nil
+	}
+
+|	['template' any_id 
+		templ_arg_open template_argument_list_opt templ_arg_close]
+	{
+		# FIXME: nulling qualNs is not the right thing to do here.
+		qualNs.top = nil
+	}
+
+#
+# Id Expression
+#
+
+def id_expression 
+	lookup_id lookupId
+
+	[root_qual_opt nested_name_specifier_opt unknown_id]
+	{
+		lhs.lookupId = lookup_id in r3
+	}
+
+|	[root_qual_opt nested_name_specifier_opt identifier]
+	{
+		lhs.lookupId = lookup_id in r3
+	}
+
+|	[root_qual_opt nested_name_specifier_opt operator_function_id]
+	{
+		# Normally the token translation transfers the qualification. Since
+		# the operator_function_id does not end in a lookup we must do it ourselves.
+		ptr lang_object qualObj = qualNs.top
+		qualNs.top = nil
+
+		lhs.lookupId = construct lookup_id ["x"]
+		lhs.lookupId.data = '<operator_function_id>'
+		lhs.lookupId.qualObj = qualObj
+	}
+
+|	[root_qual_opt nested_name_specifier_opt conversion_function_id]
+	{
+		# Normally the token translation transfers the qualification. Since
+		# the conversion_function_id does not end in a lookup we must do it ourselves.
+		ptr lang_object qualObj = qualNs.top
+		qualNs.top = nil
+
+		# Do we need qual reset here because operator_function_id does not do it?
+		lhs.lookupId = construct lookup_id ["x"]
+		lhs.lookupId.data = '<conversion_function_id>'
+		lhs.lookupId.qualObj = qualObj
+	}
+
+|	[root_qual_opt nested_name_specifier_opt '~' class_name]
+	{
+		lhs.lookupId = r4.lookupId
+	}
+
+|	[root_qual_opt nested_name_specifier_opt template_name]
+	{
+		lhs.lookupId = r3.lookupId
+	}
+		
+def template_name 
+	lookup_id lookupId
+
+	[template_id templ_arg_open template_argument_list_opt templ_arg_close]
+	{
+		lhs.lookupId = lookup_id in r1
+	}
+
+|	[template_id]
+	{
+		lhs.lookupId = lookup_id in r1
+	}
+
+
+#
+# Class Names
+#
+
+def class_name 
+	lookup_id lookupId
+
+	[class_id]
+	{
+		lhs.lookupId = lookup_id in r1
+	}
+
+|	[templ_class_id]
+	{
+		lhs.lookupId = lookup_id in r1
+	}
+
+|	[templ_class_id templ_arg_open template_argument_list_opt templ_arg_close]
+	{
+		# TODO: Look for a specialization.
+		lhs.lookupId = lookup_id in r1
+	}
+
+def templ_arg_open 
+	['<']
+	{
+		qualNs.push( nil )
+	}
+
+def templ_arg_close
+	['>']
+	{
+		qualNs.pop()
+	}
+
+def declaration 
+	[block_declaration] commit
+|	[function_definition] commit
+|	[template_declaration] commit
+|	[explicit_instantiation] commit
+|	[explicit_specialization] commit
+|	[linkage_specification] commit
+|	[namespace_definition] commit
+
+#
+# Declarations
+#
+
+def block_declaration 
+	[simple_declaration]
+|	[using_declaration]
+|	[using_directive]
+
+def simple_declaration 
+	[declaration_start simple_declaration_forms declaration_end ';']
+
+# Ordering is important for optimization. The form with the optional
+# decl_specifier_sing should go second.
+def simple_declaration_forms
+	[decl_specifier_mult_seq_opt decl_specifier_sing 
+		decl_specifier_mult_seq_opt init_declarator_list_opt]
+
+|	[decl_specifier_mult_seq_opt init_declarator_list_opt]
+
+def declaration_start 
+	[]
+	{
+		# LOG print( 'opening new declaration_data with templDecl: ', templDecl.top, '\n' )
+		declarationData.push( construct declaration_data (
+				isTypedef: 0, isFriend: 0, isTemplate: 0 ) [] )
+
+		# Transfer the template flag and reset it.
+		declarationData.top.isTemplate = templDecl.top
+		templDecl.push( 0 )
+	}
+
+def declaration_end 
+	[]
+	{
+		# LOG print( 'closing declaration_data\n' )
+		declarationData.pop()
+		templDecl.pop()
+	}
+
+def decl_specifier_sing 
+	[type_specifier_sing]
+	{
+		# Store the object type of the declaration (if any) for use
+		# by typedefs. 
+		declarationData.top.typeObj = r1.lookupId.obj
+	}
+
+def type_specifier_seq
+	lookup_id lookupId
+
+	[type_specifier_mult_seq_opt type_specifier_sing type_specifier_mult_seq_opt]
+	{
+		lhs.lookupId = r2.lookupId
+	}
+
+def type_specifier_sing
+	lookup_id lookupId
+
+	[simple_type_specifier]
+	{
+		lhs.lookupId = r1.lookupId
+	}
+		
+|	[class_specifier]
+	{
+		lhs.lookupId = construct lookup_id ["x"]
+		lhs.lookupId.data = '<class_specifier>'
+	}
+
+|	[enum_specifier]
+	{
+		lhs.lookupId = construct lookup_id ["x"]
+		lhs.lookupId.data = '<enum_specifier>'
+	}
+
+|	[elaborated_type_specifier]
+	{
+		lhs.lookupId = construct lookup_id ["x"]
+		lhs.lookupId.data = '<elaborated_type_specifier>'
+	}
+
+# Type specifier sequence without enum specifier or class specifier.
+def necs_type_specifier_seq
+	[type_specifier_mult_seq_opt necs_type_specifier_sing type_specifier_mult_seq_opt]
+
+# Type specifier singular without enum specifier or class specifier.
+def necs_type_specifier_sing 
+	[simple_type_specifier]
+|	[elaborated_type_specifier]
+
+def type_specifier_mult_seq_opt 
+	[type_specifier_mult_seq_opt type_specifier_mult]
+|	[]
+
+def type_specifier_mult_seq 
+	[type_specifier_mult_seq type_specifier_mult]
+|	[type_specifier_mult]
+
+def simple_type_specifier
+	lookup_id lookupId
+
+	[simple_type_specifier_name]
+	{
+		lhs.lookupId = r1.lookupId
+	}
+
+|	[simple_type_specifier_kw_seq]
+	{
+		lhs.lookupId = construct lookup_id ["x"]
+		lhs.lookupId.data = '<simple_type_specifier_kw_seq>'
+	}
+
+|	['typename' root_qual_opt nested_name_specifier type_name]
+	{
+		lhs.lookupId = r4.lookupId
+	}
+
+|	['typename' root_qual_opt nested_name_specifier identifier]
+	{
+		lhs.lookupId = lookup_id in r4
+	}
+
+|	['typename' root_qual_opt nested_name_specifier unknown_id]
+	{
+		lhs.lookupId = lookup_id in r4
+	}
+
+	# Extension.
+|	['__typeof' '(' identifier ')']
+	{
+		lhs.lookupId = construct lookup_id ["x"]
+		lhs.lookupId.data = '<simple_type_specifier_kw_seq>'
+	}
+
+def simple_type_specifier_name
+	lookup_id lookupId
+
+	[qual_type_name]
+	{
+		lhs.lookupId = r1.lookupId
+	}
+
+def simple_type_specifier_kw_seq 
+	[simple_type_specifier_kw_seq simple_type_specifier_kw]
+|	[simple_type_specifier_kw]
+
+def simple_type_specifier_kw 
+	['void']
+|	['char']
+|	['wchar_t']
+|	['bool']
+|	['int']
+|	['float']
+|	['double']
+|	['short']
+|	['long']
+|	['signed']
+|	['unsigned']
+
+def qual_type_name
+	lookup_id lookupId
+
+	[root_qual_opt nested_name_specifier_opt type_name]
+	{
+		lhs.lookupId = r3.lookupId
+	}
+
+def type_name
+	lookup_id lookupId
+
+	[class_name]
+	{
+		lhs.lookupId = r1.lookupId
+	}
+
+|	[enum_id]
+	{
+		lhs.lookupId = lookup_id in r1
+	}
+
+|	[typedef_id]
+	{
+		lhs.lookupId = lookup_id in r1
+	}
+
+# NOTE: the typename case is moved to simple type specifier
+# to take advantage of its conflict resolution.
+def elaborated_type_specifier
+	[class_key nested_name_specifier_opt class_head_name]
+	{
+		lookup_id Id = lookup_id in r3
+		str name = Id.data
+
+		# Get the ns the class is declared in.
+		ptr lang_object parentObj = declNs.top
+		if Id.qualObj
+			parentObj = Id.qualObj
+
+		# Look for the class in the given scope.
+		ptr lang_object declaredClass = findClass( parentObj, name )
+		if !declaredClass
+			declaredClass = findTemplateClass( parentObj, name )
+
+		if !declaredClass {
+			# LOG print( 'creating new class: ', name, '\n' )
+
+			# Class does not exist in the parent scope, create it.
+			int nsType = declaredClassType()
+
+			declaredClass = createLangObject( nsType, name, lookupNs.top )
+
+			# FIXME: handle friends. Make the class visible only if we are NOT
+			# in a friend declaration.  The new class object is necessary to
+			# properly process the body of the class.
+			if declarationData.top.isFriend == 0
+				insertObject( parentObj, name, declaredClass )
+		}
+	}
+
+	# TODO: Lookup type specialization.
+|	[class_key nested_name_specifier_opt templ_class_id
+		templ_arg_open template_argument_list_opt templ_arg_close]
+
+|	['enum' nested_name_specifier_opt enum_head_name]
+	{
+		# TODO: should look for existing enums of the same name.
+		lookup_id Id = lookup_id in r3
+		# LOG print( 'creating enumeration ', Id.data, '\n' )
+		ptr lang_object enum = createLangObject( EnumType, Id.data, lookupNs.top )
+		insertObject( declNs.top, Id.data, enum )
+	}
+
+def decl_specifier_mult_seq_opt 
+	[decl_specifier_mult_seq_opt decl_specifier_mult]
+|	[]
+
+def decl_specifier_mult_seq 
+	[decl_specifier_mult_seq decl_specifier_mult]
+|	[decl_specifier_mult]
+
+def decl_specifier_mult 
+	[type_specifier_mult]
+|	[storage_class_specifier]
+|	[function_specifier]
+
+|	['friend']
+	{
+		declarationData.top.isFriend = 1
+	}
+
+|	['typedef']
+	{
+		declarationData.top.isTypedef = 1
+	}
+
+def storage_class_specifier 
+	['auto']
+|	['register']
+|	['static']
+|	['extern']
+|	['mutable']
+
+def function_specifier 
+	['inline']
+|	['virtual']
+|	['explicit']
+
+def type_specifier_mult 
+	[cv_qualifier]
+
+def cv_qualifier 
+	['const']
+|	['volatile']
+|	['restrict']
+
+def cv_qualifier_rep 
+	[cv_qualifier_rep cv_qualifier]
+|	[]
+
+def namespace_definition 
+	[named_namespace_definition]
+|	[unnamed_namespace_definition]
+
+def named_namespace_definition
+	[original_namespace_definition]
+|	[extension_namespace_definition]
+
+#
+# Enumerations
+#
+
+def enum_specifier 
+	['enum' nested_name_specifier_opt 
+			enum_head_name '{' enumerator_list_opt '}']
+	{
+		# TODO: should look for existing enums of the same name.
+		lookup_id Id = lookup_id in r3
+		# LOG print( 'creating enumeration ', Id.data, '\n' )
+		ptr lang_object enum = createLangObject( EnumType, Id.data, lookupNs.top )
+		insertObject( declNs.top, Id.data, enum )
+	}
+
+|	['enum' '{' enumerator_list_opt '}']
+
+def enum_head_name
+	[class_id] 
+|	[templ_class_id]
+|	[namespace_id]
+|	[typedef_id]
+|	[enum_id]
+|	[identifier]
+|	[template_id]
+|	[unknown_id]
+
+def enumerator_list_opt 
+	[enumerator_list]
+|	[enumerator_list ',']
+|	[]
+
+def enumerator_list 
+	[enumerator_list ',' enumerator_definition]
+|	[enumerator_definition]
+
+def enumerator_definition 
+	[enumerator_id]
+	{
+		lookup_id Id = lookup_id in r1
+		ptr lang_object enumId = createLangObject( IdType, Id.data, lookupNs.top )
+		insertObject( declNs.top, Id.data, enumId )
+	}
+
+|	[enumerator_id '=' constant_expression]
+	{
+		lookup_id Id = lookup_id in r1
+		ptr lang_object enumId = createLangObject( IdType, Id.data, lookupNs.top )
+		insertObject( declNs.top, Id.data, enumId )
+	}
+
+def enumerator_id
+	[namespace_id] 
+|	[typedef_id]
+|	[enum_id]
+|	[class_id] 
+|	[templ_class_id]
+|	[template_id]
+|	[identifier]
+|	[unknown_id]
+
+#
+# Declarators
+#
+
+def init_declarator_list_opt 
+	[init_declarator_list]
+|	[]
+
+def init_declarator_list
+	[init_declarator_list ',' init_declarator]
+|	[init_declarator]
+
+def init_declarator
+	[declarator initializer_opt]
+
+def initializer_opt
+	['=' initializer_clause]
+|	['(' expression ')']
+|	[]
+
+def initializer_clause 
+	[assignment_expression]
+|	['{' initializer_list '}']
+|	['{' initializer_list ',' '}']
+|	['{' '}']
+
+def initializer_list
+	[initializer_list ',' initializer_clause]
+|	[initializer_clause]
+
+#
+# Expressions
+#
+
+def expression 
+	[expression ',' assignment_expression]
+|	[assignment_expression]
+
+def expression_opt
+	[expression]
+|	[]
+
+def constant_expression
+	[conditional_expression]
+
+def constant_expression_opt 
+	[constant_expression]
+|	[]
+
+def assignment_expression 
+	[conditional_expression]
+|	[logical_or_expression assignment_op assignment_expression]
+|	[throw_expression]
+
+def assignment_op 
+	['=']
+|	['*=']
+|	['/=']
+|	['%=']
+|	['+=']
+|	['-=']
+|	['>>=']
+|	['<<=']
+|	['&=']
+|	['^=']
+|	['|=']
+
+def conditional_expression 
+	[logical_or_expression]
+|	[logical_or_expression '?' expression ':' assignment_expression]
+
+def logical_or_expression 
+	[logical_or_expression '||' logical_and_expression]
+|	[logical_and_expression]
+
+def logical_and_expression 
+	[logical_and_expression '&&' inclusive_or_expression]
+|	[inclusive_or_expression]
+
+def inclusive_or_expression 
+	[inclusive_or_expression '|' exclusive_or_expression]
+|	[exclusive_or_expression]
+
+def exclusive_or_expression 
+	[exclusive_or_expression '^' and_expression]
+|	[and_expression]
+
+def and_expression 
+	[and_expression '&' equality_expression]
+|	[equality_expression]
+
+def equality_expression 
+	[equality_expression '==' relational_expression]
+|	[equality_expression '!=' relational_expression]
+|	[relational_expression]
+
+def relational_expression 
+	[relational_expression '<' shift_expression]
+|	[relational_expression '>' shift_expression]
+|	[relational_expression lt_eq shift_expression]
+|	[relational_expression gt_eq shift_expression]
+|	[shift_expression]
+
+def shift_expression 
+	[shift_expression shift_left additive_expression]
+|	[shift_expression shift_right additive_expression]
+|	[additive_expression]
+
+def additive_expression 
+	[additive_expression '+' multiplicative_expression]
+|	[additive_expression '-' multiplicative_expression]
+|	[multiplicative_expression]
+
+def multiplicative_expression 
+	[multiplicative_expression '*' pm_expression]
+|	[multiplicative_expression '/' pm_expression]
+|	[multiplicative_expression '%' pm_expression]
+|	[pm_expression]
+
+def pm_expression 
+	[pm_expression '->*' cast_expression]
+|	[pm_expression '.*' cast_expression]
+|	[cast_expression]
+
+def cast_expression 
+	[unary_expression]
+|	['(' type_id ')' cast_expression]
+
+def delete_expression 
+	[root_qual_opt 'delete' cast_expression]
+|	[root_qual_opt 'delete' '[' ']' cast_expression]
+
+def new_initializer_opt 
+	[new_initializer]
+|	[]
+
+def new_initializer 
+	['(' expression_opt ')']
+
+def direct_new_declarator 
+	['[' expression ']']
+|	[direct_new_declarator '[' constant_expression ']']
+
+def new_declarator_opt 
+	[new_declarator]
+|	[]
+
+def new_declarator 
+	[direct_new_declarator]
+|	[ptr_operator_seq direct_new_declarator]
+|	[ptr_operator_seq]
+
+def new_type_id 
+	[necs_type_specifier_seq new_declarator_opt]
+
+def new_placement 
+	['(' expression ')']
+
+def new_expression 
+	[root_qual_opt 'new' new_type_id new_initializer_opt]
+|	[root_qual_opt 'new' new_placement new_type_id new_initializer_opt]
+|	[root_qual_opt 'new' '(' type_id ')' new_initializer_opt]
+|	[root_qual_opt 'new' new_placement '(' type_id ')' new_initializer_opt]
+
+def unary_operator 
+	['*']
+|	['&']
+|	['+']
+|	['-']
+|	['!']
+|	['~']
+
+def unary_expression 
+	[postfix_expression]
+|	['++' cast_expression]
+|	['--' cast_expression]
+|	[unary_operator cast_expression]
+|	['sizeof' '(' type_id ')']
+|	['sizeof' unary_expression]
+|	[new_expression]
+|	[delete_expression]
+
+def function_style_type_conv 
+	[simple_type_specifier]
+
+
+def postfix_expression 
+	[primary_expression]
+|	[postfix_expression '[' expression ']']
+|	[postfix_expression '(' expression_opt ')']
+|	[function_style_type_conv '(' expression_opt ')']
+|	[member_request_expr dot_arrow id_expression]
+|	[member_request_expr dot_arrow pseudo_destructor_call]
+|	[postfix_expression '++']
+|	[postfix_expression '--']
+|	['dynamic_cast' templ_arg_open type_id templ_arg_close '(' expression ')']
+|	['static_cast' templ_arg_open type_id templ_arg_close '(' expression ')']
+|	['reinterpret_cast' templ_arg_open type_id templ_arg_close '(' expression ')']
+|	['const_cast' templ_arg_open type_id templ_arg_close '(' expression ')']
+|	['typeid' '(' expression ')']
+|	['typeid' '(' type_id ')']
+
+def pseudo_destructor_call
+	[root_qual_opt nested_name_specifier_opt '~' pdc_type_name]
+
+def primary_expression 
+	[expr_lit]
+|	['this']
+|	['(' expression ')']
+|	[id_expression]
+
+# This is a GNU extension (statement expression).
+def primary_expression 
+	['(' '{' statement_rep '}' ')']
+
+def expr_lit 
+	[TK_IntegerDecimal]
+|	[TK_IntegerOctal]
+|	[TK_IntegerHex]
+|	[TK_SingleLit]
+|	[TK_Float]
+|	[double_lit_list]
+|	['true']
+|	['false']
+
+def double_lit_list 
+	[TK_DoubleLit double_lit_list]
+|	[TK_DoubleLit]
+
+def member_request_expr 
+	[postfix_expression]
+#	{
+#		# FIXME: If no proper type is found, we must fail.
+#		# LOG print( 'setting member request scope\n' )
+#		# qualNs.set( $1->type != 0 ? $1->type->getObject() : 0 );
+#	}
+
+def dot_arrow 
+	['->']
+|	['.']
+
+def pdc_type_name 
+	[enum_id]
+|	[typedef_id]
+
+#
+# Statements
+#
+
+def statement_rep 
+	[statement_rep statement]
+|	[]
+
+def statement 
+	[declaration_statement]
+|	[labeled_statement]
+|	[expression_statement]
+|	[compound_statement]
+|	[selection_statement]
+|	[iteration_statement]
+|	[jump_statement]
+|	[try_block]
+
+def labeled_statement 
+	[label_id ':' statement]
+|	['case' constant_expression ':' statement]
+|	['default' ':' statement]
+
+def label_id 
+	[unknown_id]
+|	[identifier]
+|	[class_id]
+|	[templ_class_id]
+|	[namespace_id]
+|	[typedef_id]
+|	[enum_id]
+|	[template_id]
+
+def compound_statement
+	['{' compound_begin statement_rep compound_end '}']
+
+def compound_begin 
+	[]
+	{
+		ptr lang_object newCompound = createLangObject( 0, '<compound_begin>', lookupNs.top  )
+		lookupNs.push( newCompound )
+		declNs.push( newCompound )
+		# LOG print( 'opening <compound>\n' )
+	}
+
+def compound_end 
+	[]
+	{
+		lookupNs.pop()
+		declNs.pop()
+		# LOG print( 'closing <compound>\n' )
+	}
+
+def selection_statement 
+	['if' '(' condition ')' statement elseif_clauses else_clause]
+|	['switch' '(' condition ')' statement]
+
+def elseif_clauses 
+	[elseif_clauses 'else' 'if' '(' condition ')' statement]
+|	[]
+
+def else_clause 
+	['else' statement]
+|	[]
+
+def iteration_statement
+	['while' '(' condition ')' statement]
+|	['do' statement 'while' '(' expression ')' ';']
+|	['for' '(' for_init_statement condition_opt ';' expression_opt ')' statement]
+
+def jump_statement 
+	['break' ';']
+|	['continue' ';']
+|	['return' expression_opt ';']
+|	['goto' any_id ';']
+
+def any_id
+	[unknown_id]
+|	[class_id]
+|	[namespace_id]
+|	[templ_class_id]
+|	[enum_id]
+|	[typedef_id]
+|	[identifier]
+|	[template_id]
+	
+
+def for_init_statement 
+	[expression_statement]
+|	[stmt_block_declaration_forms ';']
+
+def condition 
+	[expression]
+|	[type_specifier_seq declarator '=' assignment_expression]
+
+def condition_opt 
+	[condition]
+|	[]
+
+def expression_statement 
+	[expression ';']
+|	[';']
+
+def declaration_statement 
+	[stmt_block_declaration]
+
+def stmt_block_declaration 
+	[declaration_start stmt_block_declaration_forms declaration_end ';']
+|	[using_declaration]
+|	[using_directive]
+
+def stmt_block_declaration_forms
+	[decl_specifier_mult_seq_opt decl_specifier_sing decl_specifier_mult_seq_opt 
+		init_declarator_list_opt]
+|	[decl_specifier_mult_seq init_declarator_list_opt]
+
+#
+# Declarators
+#
+
+def declarator
+	ptr lang_object lookupObj
+
+	[ptr_operator_seq_opt declarator_id decl_array_or_param_rep declarator_end]
+	{
+		lhs.lookupObj = r4.lookupObj
+	}
+
+|	[ptr_operator_seq_opt '(' sub_declarator ')' decl_array_or_param_rep declarator_end]
+	{
+		lhs.lookupObj = r6.lookupObj
+	}
+
+def sub_declarator 
+	[ptr_operator_seq declarator_id decl_array_or_param_rep]
+|	[ptr_operator_seq '(' sub_declarator ')' decl_array_or_param_rep]
+|	['(' sub_declarator ')' decl_array_or_param_rep]
+|	[declarator_id decl_array_or_param_rep]
+
+def decl_array_or_param_rep 
+	[decl_array_or_param_rep decl_array_or_param]
+|	[]
+
+def decl_array_or_param 
+	['[' constant_expression_opt ']']
+|	['(' parameter_declaration_clause ')' cv_qualifier_rep exception_specification_opt]
+
+def declarator_id
+	[declarator_id_forms]
+	{
+		str name = r1.lookupId.data
+		ptr lang_object qualObj = r1.lookupId.qualObj
+
+		ptr lang_object parentObj = declNs.top
+		if qualObj {
+			parentObj = qualObj
+		}
+
+		# Decide if we are declaring a constructor/destructor.
+		bool isConstructor
+		if parentObj == r1.lookupId.obj {
+			isConstructor = true
+			# LOG print( 'making declarator ', name, ' a constructor/destructor\n' )
+		}
+
+		if parentObj->specializationOf && 
+				parentObj->specializationOf == r1.lookupId.obj
+		{
+			isConstructor = true
+			# LOG print( 'making declarator ', name, ' a constructor/destructor\n' )
+		}
+
+		ptr lang_object obj = nil
+		if name && !isConstructor && declarationData.top.isFriend == 0 {
+			if declarationData.top.isTypedef {
+				obj = createLangObject( TypedefType, name, lookupNs.top )
+				obj->typedefOf = declarationData.top.typeObj
+				insertObject( parentObj, name, obj )
+
+				# LOG print( 'making declarator ', name, ' a typedef\n' )
+			}
+			else {
+				if !qualObj {
+					if declarationData.top.isTemplate {
+						# If in a template declaration and the name is not qualified then
+						# create the template id.
+						obj = createLangObject( TemplateIdType, name, lookupNs.top )
+						#object->objType = declarationData.top.type
+						insertObject( declNs.top, name, obj )
+
+						# LOG print( 'making declarator ', name, ' a template id\n' )
+					}
+					else {
+						obj = createLangObject( IdType, name, lookupNs.top )
+						#object->objType = declarationData.top().type;
+						insertObject( declNs.top, name, obj )
+
+						# LOG print( 'making declarator ', name, ' an id\n' ) 
+					}
+				}
+			}
+		}
+
+		declaratorData.push( construct declarator_data (
+				qualObj: qualObj, lookupObj: lookupNs.top ) [] )
+
+		# If the declarator is qualified, push the qualification to the lookup
+		# stack. Also save it in the declarator data so it can be passed to a
+		# function body if needed.
+		if qualObj {
+			lookupNs.push( qualObj )
+			declaratorData.top.lookupObj = qualObj
+		}
+
+		# LOG print( 'reduced declarator_id: ', name, '\n' )
+	}
+
+# Undoes the setup done by declarator_id (or abstract_noid) and pdc_start.
+def declarator_end
+	ptr lang_object lookupObj
+
+	[]
+	{
+		# Get the lookupObject from the scope and pass it up. If we are about to
+		# parse a function body it will be needed.
+		lhs.lookupObj = declaratorData.top.lookupObj
+
+		ptr lang_object pdcScope = declaratorData.top.pdcScope
+		ptr lang_object qualObj = declaratorData.top.qualObj
+
+		declaratorData.pop()
+
+		if pdcScope {
+			# LOG print( 'closing <pdc_scope>\n' )
+			lookupNs.pop()
+			declNs.pop()
+		}
+
+		if qualObj {
+			# LOG print( 'popping lookupNs\n' )
+			lookupNs.pop()
+		}
+	}
+
+def declarator_id_forms
+	lookup_id lookupId
+
+	[id_expression]
+	{
+		lhs.lookupId = r1.lookupId
+	}
+
+|	[root_qual_opt nested_name_specifier_opt type_name]
+	{
+		lhs.lookupId = r3.lookupId
+	}
+
+|	[root_qual_opt nested_name_specifier_opt '~' class_id]
+	{
+		lhs.lookupId = lookup_id in r4
+	}
+
+|	[root_qual_opt nested_name_specifier_opt '~' templ_class_id]
+	{
+		lhs.lookupId = lookup_id in r4
+	}
+
+def type_id
+	lookup_id lookupId
+
+	[type_specifier_seq abstract_declarator_opt]
+	{
+		lhs.lookupId = r1.lookupId
+	}
+
+def abstract_declarator_opt 
+	[abstract_declarator]
+|	[]
+
+def abstract_declarator
+	[ptr_operator_seq abstract_noid abstract_decl_array_or_param_seq_opt declarator_end]
+|	[ptr_operator_seq '(' sub_abstract_declarator ')' 
+		abstract_decl_array_or_param_seq_opt declarator_end]
+|	[abstract_noid abstract_decl_array_or_param_seq declarator_end]
+|	['(' sub_abstract_declarator ')' abstract_decl_array_or_param_seq_opt declarator_end]
+
+def sub_abstract_declarator
+	[ptr_operator_seq abstract_noid abstract_decl_array_or_param_seq_opt]
+
+|	[ptr_operator_seq '(' sub_abstract_declarator ')' 
+		abstract_decl_array_or_param_seq_opt]
+	
+|	['(' sub_abstract_declarator ')' abstract_decl_array_or_param_seq_opt]
+
+def abstract_noid 
+	[]
+	{
+		#  Make scope for declarator.
+		declaratorData.push( construct declarator_data [] )
+	}
+
+def abstract_decl_array_or_param_seq_opt
+	[abstract_decl_array_or_param_seq_opt abstract_decl_array_or_param]
+|	[]
+
+def abstract_decl_array_or_param_seq
+	[abstract_decl_array_or_param_seq abstract_decl_array_or_param]
+|	[abstract_decl_array_or_param]
+
+def abstract_decl_array_or_param
+	['[' constant_expression_opt ']']
+|	['(' parameter_declaration_clause ')' cv_qualifier_rep 
+		exception_specification_opt]
+
+def parameter_declaration_clause
+	[pdc_start parameter_declaration_list]
+|	[pdc_start parameter_declaration_list '...']
+|	[pdc_start parameter_declaration_list ',' '...']
+|	[pdc_start '...']
+|	[pdc_start]
+
+def pdc_start 
+	[]
+	{
+		if !declaratorData.top.pdcScope {
+			# We are going to need a scope for the declarator.
+			ptr lang_object pdcScope = createLangObject( 0, '<pdc_scope>', lookupNs.top )
+			lookupNs.push( pdcScope )
+			declNs.push( pdcScope )
+
+			declaratorData.top.pdcScope = pdcScope
+			declaratorData.top.lookupObj = pdcScope
+			# LOG print( 'opening <pdc_scope>\n' )
+		}
+	}
+
+def parameter_declaration_list 
+	[parameter_declaration_list ',' parameter_declaration]
+|	[parameter_declaration]
+
+def parameter_declaration 
+	[declaration_start parameter_declaration_forms declaration_end]
+
+# Ordering the productions such that decl_specifier_sing is tried first is good
+# for performance.
+def parameter_declaration_forms
+	[decl_specifier_mult_seq_opt decl_specifier_sing decl_specifier_mult_seq_opt 
+		param_maybe_declarator maybe_parameter_init]
+
+|	[decl_specifier_mult_seq param_maybe_declarator maybe_parameter_init]
+
+def param_maybe_declarator 
+	[abstract_declarator]
+|	[declarator]
+|	[]
+
+def maybe_parameter_init 
+	['=' constant_expression]
+|	[]
+
+def ptr_operator 
+	['&']
+|	[root_qual_opt nested_name_specifier_opt '*' cv_qualifier_rep]
+
+def ptr_operator_seq 
+	[ptr_operator_seq ptr_operator]
+|	[ptr_operator]
+
+def ptr_operator_seq_opt 
+	[ptr_operator_seq_opt ptr_operator]
+|	[]
+
+#
+# Functions
+#
+
+def function_definition
+	[function_def_declaration ctor_initializer_opt function_body function_def_end]
+
+def function_def_declaration
+	[declaration_start function_def_declaration_forms declaration_end]
+
+def function_def_declaration_forms 
+	[decl_specifier_mult_seq_opt decl_specifier_sing 
+		decl_specifier_mult_seq_opt function_def_declarator]
+|	[decl_specifier_mult_seq function_def_declarator]
+|	[function_def_declarator]
+
+def function_def_declarator 
+	[declarator]
+	{
+		# The lookupObj from the declarator is the deepest lookup object found
+		# while parsing the declarator. Make it visible in the function body.
+		# This could be the args, the qualObj, or the parent to the function.
+		lookupNs.push( r1.lookupObj )
+	}
+
+def function_def_end 
+	[]
+	{
+		# Pop the lookup object.
+		lookupNs.pop()
+	}
+
+def function_body
+	[function_body_begin '{' statement_rep function_body_end '}']
+
+def function_body_begin 
+	[]
+	{
+		ptr lang_object newFunctionBody = createLangObject( 0, 
+				'<function_body_begin>', lookupNs.top )
+		lookupNs.push( newFunctionBody )
+		declNs.push( newFunctionBody )
+		templDecl.push( 0 )
+		# LOG print( 'opening <function_body>\n' )
+	}
+
+def function_body_end 
+	[]
+	{
+		# Undoes the function body begin work. The setup in
+		# function_def_declarator is undone separately by function_def_end.
+		declNs.pop()
+		lookupNs.pop()
+		templDecl.pop()
+		# LOG print( 'closing <function_body>\n' )
+	}
+
+
+
+#
+# Classes
+#
+
+int declaredClassType()
+{
+	# Declarations flagged isTemplate declare template classes.
+	int classType = ClassType
+	if declarationData.top.isTemplate
+		classType = TemplateClassType
+	return classType
+}
+
+def class_specifier 
+	[class_head base_clause_opt '{' class_member_rep class_body_end '}']
+	{
+# FIXME: reparse not implemented yet
+#		# Visit class function bodies, but skip nested classes.
+#		for CFB: class_function_body in lhs {
+#			skipping class_specifier
+#
+#			# Reparse the text of the class function body as a function body
+#			function_body FB = reparse function_body( CFB )
+#
+#			# Replace the class function body with the parsed function body.
+#			CFB = construct class_function_body 
+#				[FB]
+#		}
+	}
+
+def class_head 
+	[class_key]
+	{
+		int nsType = declaredClassType()
+
+		# LOG print( 'creating new anonymous class\n' )
+		ptr lang_object newClass = createLangObject( nsType, 
+				'<anon_class>', lookupNs.top )
+		lookupNs.push( newClass )
+		declNs.push( newClass )
+	}
+
+|	[class_key nested_name_specifier_opt class_head_name]
+	{
+		lookup_id Id = lookup_id in r3
+		str name = Id.data
+
+		# Get the ns the class is declared in.
+		ptr lang_object parentObj = declNs.top
+		if Id.qualObj
+			parentObj = Id.qualObj
+
+		# Look for the class in the given scope.
+		ptr lang_object declaredClass = findClass( parentObj, name )
+		if !declaredClass
+			declaredClass = findTemplateClass( parentObj, name )
+
+		if !declaredClass {
+			# LOG print( 'creating new class: ', name, '\n' )
+
+			# Class does not exist in the parent scope, create it.
+			int nsType = declaredClassType()
+
+			declaredClass = createLangObject( nsType, name, lookupNs.top )
+
+			# FIXME: handle friends. Make the class visible only if we are NOT
+			# in a friend declaration.  The new class object is necessary to
+			# properly process the body of the class.
+			if declarationData.top.isFriend == 0
+				insertObject( parentObj, name, declaredClass )
+		}
+
+		# Push the found/new class.
+		lookupNs.push( declaredClass )
+		declNs.push( declaredClass )
+	}
+
+|	[class_key nested_name_specifier_opt templ_class_id
+		templ_arg_open template_argument_list_opt templ_arg_close]
+	{
+		match r3 [Id: lookup_id]
+		str id = Id.data
+		ptr lang_object classObj = Id.obj
+
+		# TODO: Try to find the specialization in the template class object.
+		# TypeList typeList;
+		# makeTypeList( typeList, $6->last );
+
+		ptr lang_object declaredClass
+		#declaredClass = classObj->findSpecExact( typeList );
+		if !declaredClass {
+			# LOG print( 'making new template specialization\n' )
+			int nsType = declaredClassType()
+			declaredClass = createLangObject( nsType, id, lookupNs.top )
+			# LOG print( 'declaredClass: ', declaredClass, '\n' )
+			declaredClass->specializationOf = classObj
+			# $$->typeListMapEl = classObj->typeListMap.insert( typeList, declaredClass );
+		}
+
+		# Push the found/new class.
+		lookupNs.push( declaredClass )
+		declNs.push( declaredClass )
+	}
+
+def class_body_end 
+	[]
+	{
+		# Pop the class ns.
+		lookupNs.pop()
+		declNs.pop()
+
+		# LOG print( 'closing off class\n' )
+	}
+
+def class_head_name
+	[class_id]
+|	[templ_class_id]
+|	[namespace_id]
+|	[typedef_id]
+|	[enum_id]
+|	[unknown_id]
+|	[identifier]
+|	[template_id]
+
+def class_key 
+	['class']
+|	['struct']
+|	['union']
+
+def class_member_rep 
+	[class_member_rep class_member]
+|	[]
+
+def class_member 
+	[member_declaration]
+|	[access_specifier ':']
+
+def member_declaration 
+	[declaration_start member_declaration_forms declaration_end ';']
+|	[class_function_definition]
+|	[using_declaration]
+|	[template_declaration]
+
+def class_function_definition
+	[function_def_declaration ctor_initializer_opt class_function_body function_def_end]
+
+lex cfb_conts
+{
+	token cfb_open /'{'/
+	token cfb_close /'}'/
+	token cfb_string /
+				"'" ( [^'\\\n] | '\\' any )* "'" |
+				'"' ( [^"\\\n] | '\\' any )* '"'/
+	token cfb_comment /
+				( '/*' (any | '\n')* :>> '*/' ) |
+				( '//' any* :> '\n' )/
+	token cfb_data /[^{}'"/]+ | '/'/
+}
+
+def cfb_item
+	[cfb_data]
+|	[cfb_string]
+|	[cfb_comment]
+|	[cfb_open cfb_item* cfb_close]
+
+def cfb_conts
+	[cfb_item* cfb_close]
+
+
+
+def class_function_body
+#	['{' cfb_conts]
+#|	[function_body]
+	[function_body]
+
+# Get better performance if the form with decl_specifier_sing comes first.
+def member_declaration_forms
+	[decl_specifier_mult_seq_opt decl_specifier_sing 
+		decl_specifier_mult_seq_opt member_declarator_list_opt]
+
+def member_declaration_forms
+	[decl_specifier_mult_seq_opt member_declarator_list_opt]
+
+def member_declarator_list_opt 
+	[member_declarator_list]
+|	[]
+
+def member_declarator_list 
+	[member_declarator_list ',' member_declarator]
+|	[member_declarator]
+
+def member_declarator 
+	[declarator]
+|	[declarator '=' constant_expression]
+|	[declarator ':' constant_expression]
+|	[':' constant_expression]
+
+def access_specifier 
+	['private']
+|	['protected']
+|	['public']
+
+def access_specifier_opt 
+	[access_specifier]
+|	[]
+
+def using_declaration
+	['using' id_expression ';']
+	{
+		ptr lang_object obj = r2.lookupId.obj
+		if obj
+			insertObject( declNs.top, obj->name, obj )
+	}
+
+|	['using' type_id ';']
+	{
+		ptr lang_object obj = r2.lookupId.obj
+		if obj
+			insertObject( declNs.top, obj->name, obj )
+	}
+
+def using_directive
+	['using' 'namespace' root_qual_opt nested_name_specifier_opt 
+		namespace_id ';']
+	{
+		# This uses a simple, incomplete guard against cycles in the graph of
+		# using namespaces. A more sophisticated and complete guard would look
+		# for longer cycles as well. Note that even gcc 3.3.5 does not bother.
+		match r5 [Id: lookup_id]
+		ptr lang_object usingObject = Id.obj
+		ptr lang_object inObject = declNs.top
+		if usingObject != inObject
+			inObject->inherited.append( usingObject )
+	}
+
+
+#
+# Derived classes
+#
+
+def base_clause_opt 
+	[base_clause]
+|	[]
+
+def base_clause 
+	[':' base_specifier_list]
+
+def base_specifier_list 
+	[base_specifier_list ',' base_specifier]
+|	[base_specifier]
+
+int addBaseSpecifier( ptr lang_object inObject, ptr lang_object inheritedObject )
+{
+	# A typedef base is replaced by its typedefOf target (one level only).
+	if inheritedObject->typeId == TypedefType
+		inheritedObject = inheritedObject->typedefOf
+	# Append the (possibly resolved) base to inObject's inherited list.
+	inObject->inherited.append( inheritedObject )
+}
+
+def base_specifier 
+	[root_qual_opt nested_name_specifier_opt type_name]
+	{
+		addBaseSpecifier( declNs.top, r3.lookupId.obj )
+	}
+
+|	['virtual' access_specifier_opt root_qual_opt nested_name_specifier_opt type_name]
+	{
+		addBaseSpecifier( declNs.top, r5.lookupId.obj )
+	}
+
+|	[access_specifier virtual_opt root_qual_opt nested_name_specifier_opt type_name]
+	{
+		addBaseSpecifier( declNs.top, r5.lookupId.obj )
+	}
+
+def virtual_opt 
+	['virtual']
+|	[]
+
+#
+# Special member functions
+#
+
+def conversion_function_id 
+	['operator' conversion_type_id]
+
+def conversion_type_id 
+	[necs_type_specifier_seq ptr_operator_seq_opt]
+
+def ctor_initializer_opt 
+	[ctor_initializer]
+|	[]
+
+def ctor_initializer
+	[':' mem_initializer_list]
+
+def mem_initializer_list 
+	[mem_initializer_list ',' mem_initializer]
+|	[mem_initializer]
+
+def mem_initializer 
+	[mem_initializer_id '(' expression_opt ')']
+
+def mem_initializer_id 
+	[root_qual_opt nested_name_specifier_opt unknown_id]
+|	[root_qual_opt nested_name_specifier_opt identifier]
+|	[root_qual_opt nested_name_specifier_opt type_name]
+|	[root_qual_opt nested_name_specifier_opt template_name]
+
+
+#
+# Overloading
+#
+def operator_function_id 
+	['operator' operator]
+
+def operator 
+	['+'] | ['-'] | ['*'] | ['/'] | ['='] | ['<'] | ['>'] | ['&'] | ['|'] |
+	['^'] | ['%'] | ['~'] |	['!'] | ['(' ')'] | ['[' ']'] | ['new'] |
+	['delete'] | ['->'] | ['++'] | ['--'] | ['*='] | ['/='] | ['%='] |
+	['+='] | ['-='] | ['>>='] | ['<<='] | ['&='] | ['^='] | ['|='] | ['=='] |
+	['!='] | ['&&'] | ['||'] | [lt_eq] | [gt_eq] | [shift_left] | [shift_right]
+
+def lt_eq 
+	['<' '=']
+#	try {
+#		if ( $2->leader != 0 ) {
+#			#ifdef LOG_REDUCE
+#			cerr << "rejecting less-than equals-to" << endl;
+#			#endif
+#			reject();
+#		}
+#	};
+
+def gt_eq 
+	['>' '=']
+#	try {
+#		if ( $2->leader != 0 ) {
+#			#ifdef LOG_REDUCE
+#			cerr << "rejecting greater-than equals-to" << endl;
+#			#endif
+#			reject();
+#		}
+#	};
+
+def shift_left 
+	['<' '<']
+#	try {
+#		if ( $2->leader != 0 ) {
+#			#ifdef LOG_REDUCE
+#			cerr << "rejecting shift left" << endl;
+#			#endif
+#			reject();
+#		}
+#	};
+
+def shift_right 
+	['>' '>']
+#	try {
+#		if ( $2->leader != 0 ) {
+#			#ifdef LOG_REDUCE
+#			cerr << "rejecting shift right" << endl;
+#			#endif
+#			reject();
+#		}
+#	};
+
+#
+# Templates
+#
+
+def template_declaration 
+	[template_declaration_params declaration]
+	{
+		templDecl.pop()
+		templateParamNs.pop()
+	}
+
+def template_declaration_params
+	['template' '<' tpl_start template_parameter_list '>']
+	{
+		templDecl.push( 1 )
+	}
+
+|	['export' 'template' '<' tpl_start template_parameter_list '>']
+	{
+		templDecl.push( 1 )
+	}
+
+def tpl_start 
+	[]
+	{
+		# Create a new scope for the template parameters.
+		ptr lang_object newTemplateParamScope = 
+			createLangObject( 0, '<tpl_start>', lookupNs.top )
+		templateParamNs.push( newTemplateParamScope )
+	}
+
+def template_parameter_list 
+	[template_parameter_list ',' template_parameter]
+|	[template_parameter]
+
+def template_parameter 
+	[type_parameter]
+|	[template_parameter_declaration]
+
+def template_parameter_declaration
+	[declaration_start template_parameter_declaration_forms declaration_end]
+
+def template_parameter_declaration_forms
+	[decl_specifier_mult_seq param_maybe_declarator maybe_parameter_init]
+
+|	[temp_param_decl_specifier_sing decl_specifier_mult_seq_opt 
+		param_maybe_declarator maybe_parameter_init]
+
+|	[decl_specifier_mult_seq temp_param_decl_specifier_sing 
+		decl_specifier_mult_seq_opt param_maybe_declarator maybe_parameter_init]
+
+def temp_param_decl_specifier_sing 
+	[temp_param_type_specifier_sing]
+
+# Template parameters cannot support elaborated type specifier or class specifier.
+def temp_param_type_specifier_sing 
+	[templ_simple_type_specifier]
+|	[enum_specifier]
+
+def templ_simple_type_specifier 
+	[simple_type_specifier_name]
+|	[simple_type_specifier_kw_seq]
+
+# Declares the name of a template type parameter in the template parameter scope.
+def type_parameter
+	['class' type_param_id type_param_init_opt]
+	{
+		lookup_id Id = lookup_id in r2
+		if Id {
+			# The lookup ns should be a template param scope.
+			ptr lang_object newClass = createLangObject( ClassType, Id.data, lookupNs.top )
+			insertObject( templateParamNs.top, Id.data, newClass )
+		}
+	}
+
+|	['typename' type_param_id type_param_init_opt]
+	{
+		lookup_id Id = lookup_id in r2
+		if Id {
+			# The lookup ns should be a template param scope.
+			ptr lang_object newClass = createLangObject( ClassType, Id.data, lookupNs.top )
+			insertObject( templateParamNs.top, Id.data, newClass )
+		}
+	}
+
+|	['template' '<' tpl_start template_parameter_list '>' 'class' type_param_id templ_type_param_init_opt]
+	{
+		# The tpl_start in this production pushed a nested parameter scope. Pop
+		# it so the stack stays balanced and the name lands in the outer scope.
+		templateParamNs.pop()
+		lookup_id Id = lookup_id in r7
+		if Id {
+			ptr lang_object newClass = createLangObject( TemplateClassType, Id.data, lookupNs.top )
+			insertObject( templateParamNs.top, Id.data, newClass )
+		}
+	}
+
+def templ_type_param_init_opt 
+	['=' id_expression]
+|	[]
+
+def type_param_init_opt 
+	['=' type_id]
+|	[]
+
+def type_param_id 
+	[namespace_id]
+|	[typedef_id]
+|	[enum_id]
+|	[class_id] 
+|	[templ_class_id]
+|	[identifier]
+|	[template_id]
+|	[unknown_id]
+|	[] 
+
+def template_argument_list_opt 
+	[template_argument_list]
+|	[]
+
+def template_argument_list 
+	[template_argument_list ',' template_argument]
+|	[template_argument]
+
+def template_argument 
+	[type_id]
+|	[assignment_expression]
+
+def explicit_instantiation 
+	['template' declaration]
+|	[declaration_start decl_specifier_mult_seq 'template' declaration declaration_end]
+
+def explicit_specialization 
+	['template' '<' '>' declaration]
+
+## Not sure what this one is about?
+#explicit_specialization: 
+#	declaration_start decl_specifier_mult_seq KW_Template '<' '>' 
+#	declaration declaration_end;
+
+
+#
+# Original namespace definition
+#
+
+def original_namespace_definition
+	[orig_namespace_def_name '{' declaration* namespace_end '}']
+
+def orig_namespace_def_name ['namespace' unknown_id]
+	{
+		match r2 [Id: lookup_id]
+		ptr lang_object nspace = createLangObject(
+				NamespaceType, Id.data, lookupNs.top )
+
+		# Insert the new object into the dictionary of the parent.
+		insertObject( curNamespace.top, Id.data, nspace )
+
+		# Push the namespace 
+		curNamespace.push( nspace )
+		declNs.push( nspace )
+		lookupNs.push( nspace )
+
+		# LOG print( 'created original namespace: ', Id.data, '\n' )
+	}
+
+def namespace_end []
+	{
+		# Pop the namespace.
+		curNamespace.pop()
+		declNs.pop()
+		lookupNs.pop()
+
+		# LOG print( 'closed namespace\n' )
+	}
+
+#
+# Extension namespace definition
+#
+
+def extension_namespace_definition
+	[ext_namespace_def_name '{' declaration* namespace_end '}']
+
+def ext_namespace_def_name ['namespace' namespace_id]
+	{
+		match r2 [Id: lookup_id]
+		ptr lang_object nspace = Id.obj
+
+		# Push the namespace 
+		curNamespace.push( nspace )
+		declNs.push( nspace )
+		lookupNs.push( nspace )
+
+		# LOG print( 'found extended namespace: ', Id.data, '\n' )
+	}
+
+#
+# Unnamed namespace definition
+#
+def unnamed_namespace_definition
+	[unnamed_namespace_def_name '{' declaration* namespace_end '}']
+
+def unnamed_namespace_def_name ['namespace']
+	{
+		ptr lang_object nspace = createLangObject(
+				NamespaceType, '<unnamed_namespace>',
+				lookupNs.top )
+
+		# Push the namespace 
+		curNamespace.push( nspace )
+		declNs.push( nspace )
+		lookupNs.push( nspace )
+
+		# LOG print( 'parsed unnamed namespace\n' )
+	}
+
+#
+# linkage_specification
+#
+def linkage_specification 
+	['extern' TK_DoubleLit '{' declaration* '}']
+|	['extern' TK_DoubleLit declaration]
+
+#
+# Exception Handling.
+#
+
+def try_block 
+	['try' compound_statement handler_seq]
+
+def handler_seq 
+	[handler_seq handler]
+|	[handler]
+
+def handler 
+	['catch' '(' exception_declaration ')' compound_statement]
+
+def exception_declaration 
+	[type_specifier_seq declarator]
+|	[type_specifier_seq abstract_declarator]
+|	[type_specifier_seq]
+
+def exception_declaration 
+	['...']
+
+def throw_expression 
+	['throw' assignment_expression]
+|	['throw']
+
+def exception_specification_opt 
+	[exception_specification]
+|	[]
+
+def exception_specification 
+	['throw' '(' type_id_list_opt ')']
+
+def type_id_list_opt 
+	[type_id_list]
+|	[]
+
+def type_id_list 
+	[type_id_list ',' type_id]
+|	[type_id]
+
+def start
+	[declaration*]
+
+#
+# Grammar done.
+#
+
+int printObject( str indent, ptr lang_object obj )
+{
+	print( indent, obj->name )
+	# Objects with entries in objectMap get a braced, indented child list.
+	if obj->objectMap.length > 0
+		print( ' {\n' )
+	# Each map element is a list of objects; recurse with a deeper indent.
+	object_map ChildNames = obj->objectMap
+	for MapEl: object_list in child( ChildNames ) {
+		for Obj: ptr lang_object in MapEl
+			printObject( indent + '  ', Obj )
+	}
+
+	if obj->objectMap.length > 0
+		print( indent, '}' )
+
+	print( '\n' )
+}
+
+int printNamespace()
+{
+	printObject( '', rootNamespace )
+}
+
+start S = parse start( stdin )
+#printNamespace()
+#print( '***** SUCCESS *****\n' )
+#print_xml( S )
diff --git a/test/cxx/input01.cpp b/test/cxx/input01.cpp
new file mode 100644
index 00000000..e2b125f4
--- /dev/null
+++ b/test/cxx/input01.cpp
@@ -0,0 +1,17 @@
+namespace ns1
+{
+	namespace sub1 { class A {}; }
+	namespace sub2 { class B {}; }
+}
+
+namespace ns2
+{
+//	int i = b;
+	class C
+	{
+	};
+
+	using namespace ns1;
+}
+
+ns2::sub1::A a;
diff --git a/test/cxx/input02.cpp b/test/cxx/input02.cpp
new file mode 100644
index 00000000..65ebe0db
--- /dev/null
+++ b/test/cxx/input02.cpp
@@ -0,0 +1,16 @@
+
+struct A
+{
+	struct B {};
+};
+
+struct C
+{
+	struct D : virtual public A {};
+};
+
+C::D::A d;
+
+C c;
+
+
diff --git a/test/cxx/input03.cpp b/test/cxx/input03.cpp
new file mode 100644
index 00000000..bccfbf0e
--- /dev/null
+++ b/test/cxx/input03.cpp
@@ -0,0 +1,19 @@
+
+struct C
+{
+
+};
+
+enum E
+{
+	C,
+	b
+};
+
+E e;
+
+enum E
+{
+	C,
+	b
+};
diff --git a/test/cxx/input04.cpp b/test/cxx/input04.cpp
new file mode 100644
index 00000000..9741a82b
--- /dev/null
+++ b/test/cxx/input04.cpp
@@ -0,0 +1,17 @@
+
+
+int i;
+class C
+{
+	int j;
+};
+
+class D
+{
+	int ~D();
+};
+
+int C::k;
+int C::~C;
+
+typedef int Int;
diff --git a/test/cxx/input05.cpp b/test/cxx/input05.cpp
new file mode 100644
index 00000000..7936ce09
--- /dev/null
+++ b/test/cxx/input05.cpp
@@ -0,0 +1,8 @@
+
+class C {};
+void ~C( );
+void C::operator +( int i );
+
+int i;
+
+//void operator C( void k );
diff --git a/test/cxx/input06.cpp b/test/cxx/input06.cpp
new file mode 100644
index 00000000..008edd4b
--- /dev/null
+++ b/test/cxx/input06.cpp
@@ -0,0 +1,7 @@
+
+class C
+{
+	
+};
+
+int C::f( int i, int j( void v ) );
diff --git a/test/cxx/input07.cpp b/test/cxx/input07.cpp
new file mode 100644
index 00000000..474ba9a1
--- /dev/null
+++ b/test/cxx/input07.cpp
@@ -0,0 +1,18 @@
+class C 
+{
+	class D {};
+
+	typedef C I;
+
+	I::D i;
+};
+
+C c;
+
+void function( int i, int j );
+{
+	asdlkf
+}
+
+
+
diff --git a/test/cxx/input08.cpp b/test/cxx/input08.cpp
new file mode 100644
index 00000000..2e9ec7a0
--- /dev/null
+++ b/test/cxx/input08.cpp
@@ -0,0 +1,13 @@
+class B { class Find {}; };
+
+typedef B T;
+
+class C : public T
+{
+	Find find;
+};
+
+
+
+
+
diff --git a/test/cxx/input09.cpp b/test/cxx/input09.cpp
new file mode 100644
index 00000000..373f4373
--- /dev/null
+++ b/test/cxx/input09.cpp
@@ -0,0 +1,7 @@
+template <class X> struct C
+{
+	X t;
+	void f();
+};
+
+template <class X> void C<X>::f();
diff --git a/test/cxx/input10.cpp b/test/cxx/input10.cpp
new file mode 100644
index 00000000..98b6a96a
--- /dev/null
+++ b/test/cxx/input10.cpp
@@ -0,0 +1,11 @@
+template <class X> struct C
+{
+	class Y {};
+};
+
+class C<int>
+{
+	int i;
+};
+
+//void f( class C<int> i, int j );
diff --git a/test/cxx/input11.cpp b/test/cxx/input11.cpp
new file mode 100644
index 00000000..d9714571
--- /dev/null
+++ b/test/cxx/input11.cpp
@@ -0,0 +1,2 @@
+
+int f( int (*) [](), void );
diff --git a/test/cxx/input12.cpp b/test/cxx/input12.cpp
new file mode 100644
index 00000000..c135c8da
--- /dev/null
+++ b/test/cxx/input12.cpp
@@ -0,0 +1,8 @@
+void f();
+class C
+{
+	class D {};
+	void g();
+};
+
+typename C c;
diff --git a/test/cxx/input13.cpp b/test/cxx/input13.cpp
new file mode 100644
index 00000000..67fd42fd
--- /dev/null
+++ b/test/cxx/input13.cpp
@@ -0,0 +1,14 @@
+
+class C
+{
+	class D {};
+	int f();
+};
+
+int f()
+{
+}
+int C::f()
+{
+	D d;
+}
diff --git a/test/cxx/preproc b/test/cxx/preproc
new file mode 100755
index 00000000..14e8fe6b
--- /dev/null
+++ b/test/cxx/preproc
@@ -0,0 +1,4 @@
+#!/bin/bash
+#
+
+g++ -E -undef -D'__attribute__(xyz)=' "$@" | sed 's/#.*$//'
diff --git a/test/diff/Makefile b/test/diff/Makefile
new file mode 100644
index 00000000..25a0b6d3
--- /dev/null
+++ b/test/diff/Makefile
@@ -0,0 +1,34 @@
+#
+#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+all: $(BIN)
+
+$(BIN): $(COLM)
+
+$(BIN): %.bin: %.lm
+	$(COLM) $<
+
+clean:
+	rm -f *.cpp *.bin
diff --git a/test/diff/diff.lm b/test/diff/diff.lm
new file mode 100644
index 00000000..37232025
--- /dev/null
+++ b/test/diff/diff.lm
@@ -0,0 +1,84 @@
+
+
+token newline / '\n' /
+token index / 'Index:' [ \t]* /
+token consume_line / [^\n]* /
+
+
+def index_stmt [index consume_line newline]
+
+token separator_line / '='+ '\n' /
+
+# Whitespace separated word list
+lex word_list
+{
+	token word /[^\t \n]+/
+	ignore /[\t ]+/
+
+	def word_list 
+		[word word_list]
+	|	[]
+}
+
+token old_file_start / '---' [\t ]+ /
+token new_file_start / '+++' [\t ]+ /
+
+def old_file 
+	[old_file_start word_list newline]
+
+def new_file 
+	[new_file_start word_list newline]
+
+def file_header 
+	[index_stmt separator_line old_file new_file]
+
+token hunk_header / '@@' any* :>> '@@' '\n' /
+token hunk_line / ( ' ' | '-' | '+' ) [^\n]* '\n' /
+
+def hunk_body 
+	[hunk_line*]
+
+def hunk 
+	[hunk_header hunk_body]
+
+# diff of a single file: header followed by a hunk list.
+def file_diff 
+	[file_header hunk*]
+
+def start 
+	[file_diff*]
+
+
+start S = parse start( stdin )
+
+for OF:old_file in S {
+	print( 'old file: ', OF )
+	# Get the first word and check if it is 
+	# the file we are interested in.
+	if match OF [
+			"--- fsmrun.cpp" 
+				Rest: word_list 
+			"\n"
+		]
+	{
+		OF = construct old_file
+			["--- newfilename.cpp" Rest "\n"]
+		print_xml( OF )
+	}
+}
+
+print( S )
+
+#		for Header: file_header in lhs {
+#			old_file OF = old_file in Header
+#			if match OF 
+#				[old_file_start "lmparse.kl" word_list newline]
+#			{
+#				Header = construct file_header
+#					~Index: rewritten
+#					~===================================================================
+#					~--- this is the file (asldkfj)
+#					~+++ this is the file (ewir)
+#			}
+#		}
+
diff --git a/test/diff/input1.diff b/test/diff/input1.diff
new file mode 100644
index 00000000..b0021f67
--- /dev/null
+++ b/test/diff/input1.diff
@@ -0,0 +1,86 @@
+Index: fsmrun.cpp
+===================================================================
+--- fsmrun.cpp	(revision 4555)
++++ fsmrun.cpp	(working copy)
+@@ -150,7 +150,7 @@
+ 	peof = 0;
+ 	if ( parser != 0 ) {
+ 		region = parser->getNextRegion();
+-		cs = getStateFromNextRegion();
++		cs = tables->entryByRegion[region];
+ 	}
+ 	else {
+ 		region = 0;
+@@ -189,7 +189,7 @@
+ 
+ 	tokstart = 0;
+ 	region = parser->getNextRegion();
+-	cs = getStateFromNextRegion();
++	cs = tables->entryByRegion[region];
+ }
+ 
+ void FsmRun::sendToken( int id )
+@@ -222,7 +222,7 @@
+ 		parser = newParser;
+ 
+ 		region = parser->getNextRegion();
+-		cs = getStateFromNextRegion();
++		cs = tables->entryByRegion[region];
+ 	}
+ 	else {
+ 		#ifdef LOG_ACTIONS
+@@ -355,7 +355,7 @@
+ 
+ 			/* Set the current state from the next region. */
+ 			region = parser->getNextRegion();
+-			cs = getStateFromNextRegion();
++			cs = tables->entryByRegion[region];
+ 		}
+ 	}
+ 
+@@ -452,7 +452,7 @@
+ 		/* First thing check for error. */
+ 		if ( cs == tables->errorState ) {
+ 			if ( parser != 0 ) {
+-				if ( getStateFromNextRegion( 1 ) != 0 ) {
++				if ( parser->getNextRegion( 1 ) != 0 ) {
+ 					#ifdef LOG_BACKTRACK
+ 					cerr << "scanner failed, trying next region" << endl;
+ 					#endif
+@@ -462,7 +462,7 @@
+ 
+ 					parser->nextRegionInd += 1;
+ 					region = parser->getNextRegion();
+-					cs = getStateFromNextRegion();
++					cs = tables->entryByRegion[region];
+ 					cerr << "new token region: " << 
+ 							parser->tables->gbl->regionInfo[region].name << endl;
+ 					continue;
+@@ -495,7 +495,7 @@
+ 					}
+ 					else {
+ 						region = parser->getNextRegion();
+-						cs = getStateFromNextRegion();
++						cs = tables->entryByRegion[region];
+ 						cerr << "new token region: " << 
+ 								parser->tables->gbl->regionInfo[region].name << endl;
+ 						continue;
+Index: junk.cpp
+===================================================================
+--- 
++++ junk.cpp	(working copy)
+Index: fsmrun.h
+===================================================================
+--- fsmrun.h	(revision 4557)
++++ fsmrun.h	(working copy)
+@@ -197,10 +197,6 @@
+ 	void runOnInputStream( PdaRun *parser, InputStream &in );
+ 	void execute();
+ 
+-	/* Offset can be used to look at the next nextRegionInd. */
+-	int getStateFromNextRegion( int offset = 0 )
+-		{ return tables->entryByRegion[parser->getNextRegion(offset)]; }
+-
+ 	FsmTables *tables;
+ 	PdaRun *parser;
+ 	InputStream *inputStream;
diff --git a/test/dns/Makefile b/test/dns/Makefile
new file mode 100644
index 00000000..27b04782
--- /dev/null
+++ b/test/dns/Makefile
@@ -0,0 +1,20 @@
+#
+#   Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+all: $(BIN)
+
+extract: extract.c
+	gcc -Wall -o extract extract.c -lpcap
+
+$(BIN): $(COLM)
+
+$(BIN): %.bin: %.lm
+	$(COLM) $<
+
+clean:
+	rm -f dns.cpp dns.bin extract
diff --git a/test/dns/dns.lm b/test/dns/dns.lm
new file mode 100644
index 00000000..29f0cdbe
--- /dev/null
+++ b/test/dns/dns.lm
@@ -0,0 +1,488 @@
+
+# Used for most of the grammar.
+token octet /any/
+
+# Filled in during the parsing of resource records. Determine what RR_UNKNOWN
+# translates to.
+global int rr_type_value
+global int rr_class_value
+
+# Tokens generated from RR_UNKNOWN. Used to pick the kind 
+# of resource record to attempt to parse.
+token RR_A //        # 1 a host address
+token RR_NS //       # 2 an authoritative name server
+token RR_MD //       # 3 a mail destination (Obsolete - use MX)
+token RR_MF //       # 4 a mail forwarder (Obsolete - use MX)
+token RR_CNAME //    # 5 the canonical name for an alias
+token RR_SOA //      # 6 marks the start of a zone of authority
+token RR_MB //       # 7 a mailbox domain name (EXPERIMENTAL)
+token RR_MG //       # 8 a mail group member (EXPERIMENTAL)
+token RR_MR //       # 9 a mail rename domain name (EXPERIMENTAL)
+token RR_NULL //     # 10 a null RR (EXPERIMENTAL)
+token RR_WKS //      # 11 a well known service description
+token RR_PTR //      # 12 a domain name pointer
+token RR_HINFO //    # 13 host information
+token RR_MINFO //    # 14 mailbox or mail list information
+token RR_MX //       # 15 mail exchange
+token RR_TXT //       # 16 text strings
+
+token RR_UNKNOWN 
+	/''/
+	{
+		int id = typeid RR_UNKNOWN
+		if rr_type_value == 1
+			id = typeid RR_A
+		elsif rr_type_value == 2
+			id = typeid RR_NS
+		elsif rr_type_value == 5
+			id = typeid RR_CNAME
+		elsif rr_type_value == 12
+			id = typeid RR_PTR
+		elsif rr_type_value == 15
+			id = typeid RR_MX
+		elsif rr_type_value == 16
+			id = typeid RR_TXT
+
+		send( make_token( id, '' ) )
+	}
+
+# Convert two octets in network order into an unsigned 16 bit value.
+int network_uord16( octet o1, octet o2 )
+{
+	return o1.data.uord8() * 256 + o2.data.uord8()
+}
+
+
+def message
+	[header questions answers authorities additionals]
+
+global int question_count
+global int answer_count
+global int authority_count
+global int additional_count
+
+#    Message Header
+#
+#                                    1  1  1  1  1  1
+#      0  1  2  3  4  5  6  7  8  9  0  1  2  3  4  5
+#    +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#    |                      ID                       |
+#    +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#    |QR|   Opcode  |AA|TC|RD|RA|   Z    |   RCODE   |
+#    +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#    |                    QDCOUNT                    |
+#    +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#    |                    ANCOUNT                    |
+#    +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#    |                    NSCOUNT                    |
+#    +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#    |                    ARCOUNT                    |
+#    +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+def header
+	[header_id header_fields count count count count]
+	{
+		question_count = r3.count
+		answer_count = r4.count
+		authority_count = r5.count
+		additional_count = r6.count
+	}
+
+def header_id
+	[octet octet]
+
+def header_fields
+	[octet octet]
+
+def count
+	int count
+
+	[octet octet]
+	{
+		lhs.count = network_uord16( r1, r2 )
+	}
+
+#
+# Counting Primitives
+#
+# Uses a global stack of lengths. Using a stack allows for counted lists to be
+# nested. As the list is consumed it brings the count down to zero. To use it,
+# push a new count value to the list and include it in a right-recursive list
+# like so:
+#
+# def LIST
+#     [count_inc ITEM LIST]
+#     [count_end]
+# end
+#
+
+list count_stack [int]
+global count_stack CL = construct count_stack []
+
+int start_list( int count )
+{
+	CL.push( count )
+}
+
+def count_inc
+	[]
+	{
+		if CL.top == 0 {
+			reject
+		} else {
+			CL.top = CL.top - 1
+		}
+	}
+
+def count_end
+	[]
+	{
+		if CL.top != 0 {
+			reject
+		} else {
+			CL.pop()
+		}
+	}
+
+#
+# Octet List
+#
+
+# General octet list. Length must be set to use this.
+def octet_list
+	[count_inc octet octet_list]
+|	[count_end]
+
+
+#
+# Names
+#
+
+def name
+	[name_part* name_end]
+
+# Name part lists are terminated by a zero length or a pointer.
+def name_end
+	# Zero length ending: a single octet whose value is 0.
+	[octet]
+	{
+		int val = r1.data.uord8()
+		if val != 0 {
+			reject
+		}
+	}
+
+	# Pointer ending: two octets, the first with both high bits set (>= 192).
+	#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+	#   | 1  1|                OFFSET                   |
+	#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+|	[octet octet]
+	{
+		int val = r1.data.uord8()
+		if val < 192 {	# 64..191 has only one high bit set and is not a pointer
+			reject
+		}
+	}
+
+#
+# Get some number of bytes.
+#
+
+# How many to get
+global int nbytes
+
+# We use this token to eliminate the lookahead that would be needed to cause a
+# reduce of part_len. This forces whatever comes before nbytes to be reduced before 
+# nbytes_data token is fetched from the scanner. We need this because nbytes_data
+# depends on the nbytes global and we need to ensure that it is set.
+token nb_empty /''/
+
+# Fetch nbytes bytes.
+token nbytes_data
+	/''/
+	{
+		send( make_token( typeid nbytes_data, pull(stdin, nbytes) ) )
+	}
+
+def nbytes
+	[nb_empty nbytes_data]
+
+def name_part
+	[part_len nbytes]
+
+
+def part_len
+	[octet]
+	{
+		# A name part list is terminated either by a zero length or a pointer,
+		# which must have the two high bits set.
+		int count = r1.data.uord8()
+		if count == 0 || count >= 64 {
+			reject
+		} else {
+			# Set the number of bytes to get for the name part.
+			nbytes = count
+		}
+	}
+
+#
+#   Resource Records
+#
+
+#                                   1  1  1  1  1  1
+#     0  1  2  3  4  5  6  7  8  9  0  1  2  3  4  5
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                                               |
+#   /                                               /
+#   /                      NAME                     /
+#   |                                               |
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                      TYPE                     |
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                     CLASS                     |
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                      TTL                      |
+#   |                                               |
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                   RDLENGTH                    |
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--|
+#   /                     RDATA                     /
+#   /                                               /
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+
+def resource_record
+	[name rr_type rr_class ttl rdlength rdata]
+
+def rr_type 
+	[octet octet]
+	{
+		rr_type_value = network_uord16( r1, r2 )
+	}
+
+def rr_class 
+	int value
+	[octet octet]
+	{
+		rr_class_value = network_uord16( r1, r2 )
+	}
+
+def ttl 
+	[octet octet octet octet]
+
+token rdata_bytes
+	/''/
+	{
+		send( make_token( typeid rdata_bytes, pull(stdin, rdata_length) ) )
+	}
+
+def rdlength 
+	[octet octet]
+	{
+		rdata_length = network_uord16( r1, r2 )
+	}
+
+global int rdata_length
+	
+def rdata
+	[RR_UNKNOWN rdata_bytes]
+|	[RR_A address]
+|	[RR_NS name]
+|	[RR_CNAME name]
+|	[RR_PTR name]
+|	[RR_MX octet octet name]
+|	[RR_TXT rdata_bytes]
+
+
+#
+# Address
+#
+def address [octet octet octet octet]
+
+#
+# List of Questions
+#
+
+def questions
+	[load_question_count question_list]
+
+def load_question_count
+	[]
+	{
+		start_list( question_count )
+	}
+
+def question_list
+	[count_inc question question_list]
+|	[count_end]
+
+#
+#   Question
+#
+
+#                                   1  1  1  1  1  1
+#     0  1  2  3  4  5  6  7  8  9  0  1  2  3  4  5
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                                               |
+#   /                     QNAME                     /
+#   /                                               /
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                     QTYPE                     |
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+#   |                     QCLASS                    |
+#   +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
+
+def question
+	[name qtype qclass]
+
+def qtype
+	[octet octet]
+
+def qclass
+	[octet octet]
+
+#
+# List of Answers
+#
+
+def answers
+	[load_answer_count answer_list]
+
+def load_answer_count
+	[]
+	{
+		start_list( answer_count )
+	}
+
+def answer_list
+	[count_inc answer answer_list]
+|	[count_end]
+
+#
+# Answer
+#
+
+def answer
+	[resource_record]
+
+#
+# List of Authorities
+#
+
+def authorities
+	[load_authority_count authority_list]
+
+def load_authority_count
+	[]
+	{
+		start_list( authority_count )
+	}
+
+def authority_list
+	[count_inc authority authority_list]
+|	[count_end]
+
+#
+# Authority
+#
+
+def authority
+	[resource_record]
+
+#
+# List of Additionals
+#
+
+def additionals
+	[load_additional_count additional_list]
+
+def load_additional_count
+	[]
+	{
+		start_list( additional_count )
+	}
+
+def additional_list
+	[count_inc additional additional_list]
+|	[count_end]
+
+#
+# Additional
+#
+
+def additional
+	[resource_record]
+
+
+def start
+	[message*]
+
+#
+# Grammar End.
+#
+
+int print_RR_UNKNOWN( start s )
+{
+	for I:rdata in s {
+		if match I [u:RR_UNKNOWN rdata_bytes] {
+			print( 'UNKNOWN TYPE\n' )
+		}
+	}
+}
+
+int print_RR_A( start s )
+{
+	for I:rdata in s {
+		if match I [RR_A o1:octet o2:octet o3:octet o4:octet] {
+			print( 'RR_A: ', o1.data.uord8(), '.', o2.data.uord8(), '.', 
+					o3.data.uord8(), '.', o4.data.uord8(), '\n' )
+		}
+	}
+}
+
+map name_map [int name]
+
+int print_name( name n, name_map m )
+{	# Print the parts of name n separated by '.', following a pointer ending through map m.
+	for P: name_part in n {
+		match P [part_len D:nbytes]
+		print( D, '.' )
+	}
+	# A two-octet ending encodes an offset: (first octet - 192) * 256 + second octet.
+	for E:name_end in n {
+		if match E [o1:octet o2:octet] {
+			int val = (o1.data.uord8() - 192) * 256 + o2.data.uord8()
+			print( '[', val, ']' )
+			name nameInMap = m.find( val )	# name stored in m under that offset
+			print_name( nameInMap, m )
+		}
+	}
+}
+
+int print_all_names( start s )
+{
+	for M:message in s {
+		name_map m = construct name_map []
+
+		octet O = octet in M
+
+		for N:name in M {
+			match N [name_part* E:name_end]
+
+			for NP: name_part* in N {
+				if match NP [L:octet nbytes name_part*] {
+					int messageOffset = L.pos - O.pos
+					name n = construct name [NP E]
+					m.insert( messageOffset, n )
+				}
+			}
+		}
+
+		for I:name in M {
+			print_name( I, m )
+			print( '\n' )
+		}
+	}
+}
+
+start S = parse start( stdin )
+print_all_names( S )
+print( '*** SUCCESS ***\n' )
diff --git a/test/dns/dumpdns b/test/dns/dumpdns
new file mode 100644
index 00000000..3409afee
--- /dev/null
+++ b/test/dns/dumpdns
@@ -0,0 +1,11 @@
+#!/bin/bash
+#
+
+# Use this script to capture dns packets to a dump file. Then use extract to
+# break up the packets and strip the headers, leaving just dns packets.
+#
+# usage: bash dumpdns <dumpfile>
+# Without a dump file name there is nothing to capture into, so just exit.
+[ -z "$1" ] && exit
+# Quote the name so a path with spaces or glob characters reaches tcpdump intact.
+tcpdump -s 0 -w "$1" udp port 53
diff --git a/test/dns/extract.c b/test/dns/extract.c
new file mode 100644
index 00000000..8af026a3
--- /dev/null
+++ b/test/dns/extract.c
@@ -0,0 +1,95 @@
+#include <stdio.h>
+#include <pcap.h>
+
+/*
+ * Break up a dump file and strip headers, leaving just
+ * the dns portion of packets.
+ */
+
+/*
+ * Number of leading bytes stripped from every packet. Presumably Ethernet (14)
+ * + IPv4 without options (20) + UDP (8); confirm against the capture setup.
+ */
+#define HEADER_SIZE 42
+
+char outname[1024];
+char errbuf[PCAP_ERRBUF_SIZE];
+
+/*
+ * usage: extract <dumpfile> <rootname>
+ *
+ * Reads the packets of the dump file argv[1] one by one and writes what follows
+ * the first HEADER_SIZE bytes of packet number N to the file "<rootname>-NNNN".
+ * Packets shorter than HEADER_SIZE are reported and skipped. Returns 0 on
+ * success and 1 on a usage error or when a file cannot be opened or written.
+ */
+int main( int argc, char **argv )
+{
+	int packet;
+	int rc = 0;
+	pcap_t *p;
+
+	if ( argc != 3 ) {
+		fprintf( stderr, "usage: extract <dumpfile> <rootname>\n" );
+		return 1;
+	}
+
+	p = pcap_open_offline( argv[1], errbuf );
+	if ( p == NULL ) {
+		fprintf( stderr, "error: %s\n", errbuf );
+		return 1;
+	}
+
+	for ( packet = 0; rc == 0; packet++ ) {
+		FILE *file;
+		size_t len;
+		int n;
+		struct pcap_pkthdr h;
+		const u_char *data;
+
+		data = pcap_next( p, &h );
+		if ( data == NULL )
+			break;
+
+		if ( h.caplen < h.len )
+			fprintf( stderr, "warning: packet number %02d is short\n", packet );
+
+		/* Without this check the unsigned subtraction below would wrap around. */
+		if ( h.caplen < HEADER_SIZE ) {
+			fprintf( stderr, "warning: packet number %02d is too short, skipping\n", packet );
+			continue;
+		}
+
+		data += HEADER_SIZE;
+		len = h.caplen - HEADER_SIZE;
+
+		/* snprintf cannot overrun outname; a truncated name is treated as an error. */
+		n = snprintf( outname, sizeof outname, "%s-%04d", argv[2], packet );
+		if ( n < 0 || (size_t)n >= sizeof outname ) {
+			fprintf( stderr, "error: output file name is too long\n" );
+			rc = 1;
+			break;
+		}
+
+		file = fopen( outname, "wb" );
+		if ( file == NULL ) {
+			perror( outname );
+			rc = 1;
+			break;
+		}
+
+		if ( fwrite( data, 1, len, file ) != len ) {
+			perror( outname );
+			rc = 1;
+		}
+		/* fclose flushes buffered data, so its failure is a write failure too. */
+		if ( fclose( file ) != 0 && rc == 0 ) {
+			perror( outname );
+			rc = 1;
+		}
+	}
+
+	pcap_close( p );
+
+	return rc;
+}
diff --git a/test/heredoc.in b/test/heredoc.in
new file mode 100644
index 00000000..c9638ca9
--- /dev/null
+++ b/test/heredoc.in
@@ -0,0 +1,3 @@
+hello
+random 9392af j9 stuff
+hello
diff --git a/test/heredoc.lm b/test/heredoc.lm
new file mode 100644
index 00000000..54dcc33d
--- /dev/null
+++ b/test/heredoc.lm
@@ -0,0 +1,45 @@
+rl ident_char /[a-zA-Z_]/
+
+lex start
+{
+	# Tokens
+	token other /(^(ident_char|0|'\n'))+/
+
+	token here_close //
+	token id 
+		/ident_char+/
+		{
+			if HereId && HereId == match_text {
+				send( make_token( 
+					typeid here_close,
+					pull(stdin, match_length - 1) ) )
+			} else {
+				send( make_token( typeid id, pull(stdin, match_length) ) )
+			}
+		}
+
+	token nl /'\n'/
+}
+
+def here_name 
+	[id]
+	{
+		HereId = r1.data
+	}
+
+global str HereId
+
+def here_data 
+	[here_data_item*]
+
+def here_data_item 
+	[id]
+|	[other]
+|	[nl]
+
+def heredoc 
+	[here_name here_data here_close id nl]
+
+
+heredoc S = parse heredoc( stdin )
+print_xml(S)
diff --git a/test/html/Makefile b/test/html/Makefile
new file mode 100644
index 00000000..25a0b6d3
--- /dev/null
+++ b/test/html/Makefile
@@ -0,0 +1,34 @@
+#
+#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+all: $(BIN)
+
+$(BIN): $(COLM)
+
+$(BIN): %.bin: %.lm
+	$(COLM) $<
+
+clean:
+	rm -f *.cpp *.bin
diff --git a/test/html/html-lextag.lm b/test/html/html-lextag.lm
new file mode 100644
index 00000000..0869538c
--- /dev/null
+++ b/test/html/html-lextag.lm
@@ -0,0 +1,324 @@
+#
+# Regular Definitions
+#
+rl def_name_char /[\-A-Za-z0-9._:?]/
+rl def_name /[A-Za-z_:] def_name_char*/
+rl def_system_literal /'"' [^"]* '"' | "'" [^']* "'"/
+
+#
+# Scanner for tag names.
+#
+lex TAG_NAME
+{
+	ignore /space+/
+	token tag_id /def_name/
+}
+
+#
+# Scanner for attributes names
+#
+lex ATTR_NAME
+{
+	ignore  /space+/
+	token attr_name /def_name_char+/
+	literal '='
+}
+
+# Scanner for attribute values.
+lex ATTR_VAL
+{
+	ignore  /space+/
+	literal '>', '/>'
+	token dquote_val /'"' ([^"] | '\\' any)* '"'/
+	token squote_val /"'" ([^'] | '\\' any)* "'"/
+	token unq_val /[^ \t\r\n<>"'] [^ \t\r\n<>]*/
+}
+
+#
+# Tokens
+#
+
+lex START
+{
+	ignore /space+/
+
+	literal '<', '</', '<!DOCTYPE'
+	token close_tag 
+		/'</' [\t ]* id: [a-zA-Z]+ '>'/
+
+	token doc_data /[^<]+/
+  	token comment /'<!--' any* :>> '-->'/
+}
+
+#
+# Tags
+#
+
+bool inTagStack( str id )
+{
+	tag_stack LocalTagStack = TagStack
+	for Tag:tag_id in LocalTagStack {
+		if id == Tag.data
+			return true
+	}
+	return false
+}
+
+# This scanner is just for the id in close tags. The id needs to be looked up
+# in the tag stack so we can determine if it is a stray. 
+lex close_id
+{
+	# Ignore whitespace.
+	ignore /space+/
+
+	token stray_close_id //
+	token missing_close_id //
+
+	token close_id /def_name/
+	{
+		# If the id is in the tag stack it is sent as a close_id, preceded by
+		# one missing_close_id for every tag stacked above it. If it is not in
+		# the stack it is sent as a stray_close_id.
+
+		if ( inTagStack( match_text ) ) {
+			print( 'CLOSE \'', match_text, '\' IN TAG STACK\n' )
+
+			# The tag is in the stack, send missing close tags until we get to it.
+			match TagStack [Top:tag_id Rest:tag_stack] 
+			TagStack = Rest
+			while ( Top.data != match_text ) {
+				print( 'SENDING missing close\n' )
+				send( make_token( typeid missing_close_id, '' ) )
+				match TagStack [Top2:tag_id Rest2:tag_stack] 
+				Top = Top2
+				TagStack = Rest2
+			}
+
+			print( 'SENDING close\n' )
+			send( make_token( typeid close_id, pull( stdin, match_length ) ) )
+		}
+		else {
+			print( 'CLOSE \'', match_text, '\' NOT IN TAG STACK\n' )
+			# The tag is not in the tag stack so send the id as a stray close.
+			send( make_token( typeid stray_close_id, pull( stdin, match_length ) ) )
+		}
+	}
+}
+
+#
+# Tag Stack
+#
+
+def tag_stack 
+	[tag_id tag_stack]
+|	[]
+
+global tag_stack TagStack = construct tag_stack []
+
+#
+# Document Type
+#
+# This scanner handles inside DOCTYPE tags (except keywords).
+lex DOCTYPE
+{
+	ignore /space+/
+	token dt_name /def_name/
+	token dt_literal /def_system_literal/
+	token dt_bl /"[" [^\]]* "]"/
+	token dt_close /'>'/
+}
+
+# Using a separate scanner for the keywords in DOCTYPE prevents them from
+# covering dt_name
+lex DOCTYPE_KW
+{
+	ignore /space+/
+	literal 'SYSTEM', 'PUBLIC'
+}
+
+def DOCTYPE ['<!DOCTYPE' dt_name external_id dt_bl? dt_close]
+
+def external_id
+	['SYSTEM' dt_literal?]
+|	['PUBLIC' dt_literal dt_literal?]
+
+#
+# Tags, with optional close.
+#
+
+def tag 
+	[open_tag item* close_tag]
+
+def unclosed_tag 
+	[open_tag item* missing_close_id]
+
+def open_tag 
+	['<' tag_id attr* '>']
+	{
+		TagStack = construct tag_stack 
+			[r2 TagStack]
+	}
+
+#
+# Empty tags
+#
+def empty_tag 
+	['<' tag_id attr* '/>']
+
+#
+# Stray close tags
+#
+def stray_close 
+	[close_tag]
+
+
+#
+# Attributes
+#
+
+def attr
+	[attr_name eql_attr_val?]
+
+def eql_attr_val ['=' attr_val]
+
+def attr_val
+	[squote_val]
+|	[dquote_val]
+|	[unq_val]
+|	[]
+
+#
+# Items
+#
+
+def item 
+	[DOCTYPE]
+|	[tag]
+|	[unclosed_tag]
+|	[empty_tag]
+|	[stray_close]
+|	[doc_data]
+|	[comment]
+
+
+token trailing /any*/
+
+def start 
+	[item* trailing]
+
+#
+# END GRAMMAR
+#
+
+int addDefaultAltTags( ref start Start )
+{
+	for T: open_tag in Start {
+		require T 
+			["<img" AttrList: attr* '>']
+		
+		bool haveAlt = false
+		for A: attr in T {
+			if match A ["alt=" attr_val]
+				haveAlt = true
+		}
+
+		if !haveAlt {
+			for AL: attr* in T {
+				if match AL [] {
+					AL = construct attr* 
+						[" alt=\"default alt\""]
+					break
+				}
+			}
+		}
+	}
+}
+
+int printLinks( start Start )
+{
+	for A:tag in Start {
+		require A
+			["<a" AttrList: attr* ">" I: item* "</a>"]
+
+		for Attr: attr in AttrList {
+			if match Attr ["href = " AttrVal: attr_val]
+				print( 'link: ', I, '\ntarget: ', AttrVal, '\n\n' )
+		}
+	}
+}
+
+
+bool should_close( tag_id TI )
+{
+	return true
+}
+
+bool should_flatten( tag_id TI )
+{
+	return true
+}
+
+# Finds unclosed tags and puts the content after the tag. Afterwards
+# all unclosed tags will be empty 'inside'.
+#int flatten( ref start Start )
+#{
+#    for TL: item* in Start {
+#        require TL
+#            [OT: open_tag Inside: item* Trailing: item*]
+#
+#		match OT 
+#			['<' TagId: tag_id attr* '>']
+#
+#		if should_flatten( TagId )
+#		{
+#			require Inside
+#				[item item*]
+#			
+#			# Put Trailing at the end of inside.
+#			for END: item* in Inside {
+#				if match END [] {
+#					END = Trailing
+#					break
+#				}
+#			}
+#
+#			str empty = ''
+#			missing_close_id Missing = construct missing_close_id [empty]
+#			opt_close_tag EmptyCloseTag = 
+#				construct opt_close_tag [Missing]
+#
+#			# Close the tag and put inside after it.
+#			TL = construct item*
+#				[OT EmptyCloseTag Inside]
+#		}
+#    }
+#}
+#
+#int close( ref start Start )
+#{
+#    for TL: item in Start {
+#        require TL
+#            [OpenTag: open_tag Inside: item*]
+#
+#        match OpenTag 
+#            ['<' TagId: tag_id attr* '>']
+#
+#        if should_close( TagId )
+#        {
+#			close_id CloseId = construct close_id 
+#				[TagId.data]
+#
+#            opt_close_tag CloseTag = 
+#                construct opt_close_tag ['</' CloseId '>']
+#
+#            # Close the tag and put inside after it.
+#            TL = construct item
+#                [OpenTag Inside CloseTag]
+#        }
+#    }
+#}
+
+start HTML = parse start( stdin )
+print_xml( HTML )
+for C: close_tag in HTML 
+	print( C.id, '\n' )
diff --git a/test/html/html.lm b/test/html/html.lm
new file mode 100644
index 00000000..98573f2e
--- /dev/null
+++ b/test/html/html.lm
@@ -0,0 +1,307 @@
+#
+# Regular Definitions
+#
+rl def_name_char /[\-A-Za-z0-9._:?]/
+rl def_name /[A-Za-z_:] def_name_char*/
+rl def_system_literal /'"' [^"]* '"' | "'" [^']* "'"/
+
+#
+# Scanner for tag names.
+#
+lex TAG_NAME
+{
+	ignore /space+/
+	token tag_id /def_name/
+}
+
+#
+# Scanner for attributes names
+#
+lex ATTR_NAME
+{
+	ignore  /space+/
+	token attr_name /def_name_char+/
+	literal '='
+}
+
+# Scanner for attribute values.
+lex ATTR_VAL
+{
+	ignore  /space+/
+	literal '>', '/>'
+	token dquote_val /'"' ([^"] | '\\' any)* '"'/
+	token squote_val /"'" ([^'] | '\\' any)* "'"/
+	token unq_val /[^ \t\r\n<>"'] [^ \t\r\n<>]*/
+}
+
+#
+# Tokens
+#
+
+lex START
+{
+	ignore /space+/
+	literal '<', '</', '<!DOCTYPE'
+	token doc_data /[^<]+/
+  	token comment /"<!--" any* :>> "-->"/
+}
+
+#
+# Tags
+#
+
+# This scanner is just for the id in close tags. The id needs to be looked up
+# in the tag stack so we can determine if it is a stray. 
+lex close_id
+{
+	# Ignore whitespace.
+	ignore /space+/
+
+	token stray_close_id //
+	token close_id /def_name/
+	{
+		# If it is in the tag stack then it is a close_id. If not then it's a
+		# stray_close_id.
+		int send_id = typeid stray_close_id
+
+		tag_stack LocalTagStack = TagStack
+		for Tag:tag_id in LocalTagStack {
+			tag_id T = Tag
+			if match_text == T.data {
+				send_id = typeid close_id
+				break
+			}
+		}
+
+		send( make_token( send_id, pull(stdin, match_length) ) )
+	}
+}
+
+#
+# Tag Stack
+#
+
+def tag_stack 
+	[tag_id tag_stack]
+|	[]
+
+global tag_stack TagStack = construct tag_stack []
+
+#
+# Document Type
+#
+# This scanner handles the inside of DOCTYPE tags (except keywords).
+lex DOCTYPE
+{
+	ignore /space+/
+	token dt_name /def_name/
+	token dt_literal /def_system_literal/
+	token dt_bl /"[" [^\]]* "]"/
+	token dt_close /'>'/
+}
+
+# Using a separate scanner for the keywords in DOCTYPE prevents them from
+# covering dt_name
+lex DOCTYPE_KW
+{
+	ignore /space+/
+	literal 'SYSTEM', 'PUBLIC'
+}
+
+def DOCTYPE ['<!DOCTYPE' dt_name external_id dt_bl? dt_close]
+
+def external_id
+	['SYSTEM' dt_literal?]
+|	['PUBLIC' dt_literal dt_literal?]
+
+#
+# Tags, with optional close.
+#
+
+def tag 
+	[open_tag item* opt_close_tag]
+
+def open_tag 
+	['<' tag_id attr* '>']
+	{
+		TagStack = construct tag_stack 
+			[r2 TagStack]
+	}
+
+def opt_close_tag
+	['</' close_id '>']
+	{
+		match TagStack [Top:tag_id Rest:tag_stack] 
+		if r2.data == Top.data
+			TagStack = Rest
+		else
+			reject
+	}
+
+|	[]
+	{
+		match TagStack [Top:tag_id Rest:tag_stack] 
+		TagStack = Rest
+	}
+
+#
+# Empty tags
+#
+def empty_tag 
+	['<' tag_id attr* '/>']
+
+#
+# Stray close tags
+#
+def stray_close 
+	['</' stray_close_id '>']
+
+
+#
+# Attributes
+#
+
+def attr
+	[attr_name eql_attr_val?]
+
+def eql_attr_val ['=' attr_val]
+
+def attr_val
+	[squote_val]
+|	[dquote_val]
+|	[unq_val]
+|	[]
+
+#
+# Items
+#
+
+def item 
+	[DOCTYPE]
+|	[tag]
+|	[empty_tag]
+|	[stray_close]
+|	[doc_data]
+|	[comment]
+
+
+token trailing /any*/
+
+def start 
+	[item* trailing]
+
+#
+# END GRAMMAR
+#
+
+int addDefaultAltTags( ref start Start )
+{
+	for T: open_tag in Start {
+		require T 
+			["<img" AttrList: attr* '>']
+		
+		bool haveAlt = false
+		for A: attr in T {
+			if match A ["alt=" attr_val]
+				haveAlt = true
+		}
+
+		if !haveAlt {
+			for AL: attr* in T {
+				if match AL [] {
+					AL = construct attr* 
+						[" alt=\"default alt\""]
+					break
+				}
+			}
+		}
+	}
+}
+
+int printLinks( start Start )
+{
+	for A:tag in Start {
+		require A
+			["<a" AttrList: attr* ">" I: item* "</a>"]
+
+		for Attr: attr in AttrList {
+			if match Attr ["href = " AttrVal: attr_val]
+				print( 'link: ', I, '\ntarget: ', AttrVal, '\n\n' )
+		}
+	}
+}
+
+
+bool should_close( tag_id TI )
+{
+	return true
+}
+
+bool should_flatten( tag_id TI )
+{
+	return true
+}
+
+# Finds unclosed tags and puts the content after the tag. Afterwards
+# all unclosed tags will be empty 'inside'.
+int flatten( ref start Start )
+{
+    for TL: item* in Start {
+        require TL
+            [OT: open_tag Inside: item* Trailing: item*]
+
+		match OT 
+			['<' TagId: tag_id attr* '>']
+
+		if should_flatten( TagId )
+		{
+			require Inside
+				[item item*]
+			
+			# Put Trailing at the end of inside.
+			for END: item* in Inside {
+				if match END [] {
+					END = Trailing
+					break
+				}
+			}
+
+			opt_close_tag EmptyCloseTag = 
+				construct opt_close_tag []
+
+			# Close the tag and put inside after it.
+			TL = construct item*
+				[OT EmptyCloseTag Inside]
+		}
+    }
+}
+
+int close( ref start Start )
+{
+    for TL: item in Start {
+        require TL
+            [OpenTag: open_tag Inside: item*]
+
+        match OpenTag 
+            ['<' TagId: tag_id attr* '>']
+
+        if should_close( TagId )
+        {
+			close_id CloseId = construct close_id 
+				[TagId.data]
+
+            opt_close_tag CloseTag = 
+                construct opt_close_tag ['</' CloseId '>']
+
+            # Close the tag by appending the close tag after the inside items.
+            TL = construct item
+                [OpenTag Inside CloseTag]
+        }
+    }
+}
+
+start HTML = parse start( stdin )
+flatten( HTML )
+#print_xml( HTML )
+printLinks( HTML )
+
diff --git a/test/html/input01.html b/test/html/input01.html
new file mode 100644
index 00000000..cf783d63
--- /dev/null
+++ b/test/html/input01.html
@@ -0,0 +1,8 @@
+<t1>
+
+  <t2>
+  <a href="foo">FOO</a>
+  <t3>
+  </t3>
+
+</t1>
diff --git a/test/http/Makefile b/test/http/Makefile
new file mode 100644
index 00000000..25a0b6d3
--- /dev/null
+++ b/test/http/Makefile
@@ -0,0 +1,34 @@
+#
+#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+all: $(BIN)
+
+$(BIN): $(COLM)
+
+$(BIN): %.bin: %.lm
+	$(COLM) $<
+
+clean:
+	rm -f *.cpp *.bin
diff --git a/test/http/http.lm b/test/http/http.lm
new file mode 100644
index 00000000..d914ab6f
--- /dev/null
+++ b/test/http/http.lm
@@ -0,0 +1,68 @@
+#
+# Character classes
+#
+rl CTL /0..31 | 127/
+rl CR /13/
+rl LF /10/
+rl SP /32/
+rl HT /9/
+rl CHAR /0..127/
+
+rl separators / '(' | ')' | '<' | '>' 
+		| '@' | ',' | ';' | ':' | '\\' 
+		| '"' | '/' | '[' | ']' | '?' 
+		| '=' | '{' | '}' | SP | HT /
+
+rl token_char /CHAR - CTL - separators/
+
+#
+# Literal tokens
+#
+
+literal 'HTTP/', ' ', ':'
+token CRLF /CR LF/
+
+#
+# Request Line
+#
+
+token method /token_char+/
+
+token request_uri /(^SP)+/
+
+token http_number /digit+ '.' digit+/
+
+def http_version 
+	[ 'HTTP/' http_number ]
+
+def request_line 
+	[method ' ' request_uri 
+	 ' ' http_version CRLF]
+
+#
+# Header
+#
+
+token field_name /token_char+/
+
+token field_value 
+	/(^(CR|LF) | CR LF (SP|HT))* CR LF/
+
+def header 
+	[field_name ':' field_value]
+
+#
+# Request
+#
+
+def request
+	[request_line header* CRLF]
+
+request R = parse_stop request( stdin )
+
+print( 'HTTP/1.0 200 OK\r\n' )
+print( 'Date: Fri, 31 Dec 1999 23:59:59 GMT\r\n' )
+print( 'Content-Type: text/plain\r\n' )
+print( '\r\n' )
+print_xml( R )
+
diff --git a/test/http/input1 b/test/http/input1
new file mode 100644
index 00000000..c1416f84
--- /dev/null
+++ b/test/http/input1
@@ -0,0 +1,2 @@
+GET /hi/there/ HTTP/1.1
+
diff --git a/test/http/input2 b/test/http/input2
new file mode 100644
index 00000000..076222d5
--- /dev/null
+++ b/test/http/input2
@@ -0,0 +1,13 @@
+GET /hithere/ HTTP/1.1
+Host: localhost:3535
+User-Agent: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1.12) Gecko/20080207 Ubuntu/7.10 (gutsy) Firefox/2.0.0.12
+Accept: text/xml,application/xml,application/xhtml+xml,text/html;q=0.9,text/plain;q=0.8,image/png,*/*;q=0.5
+Accept-Language: en-us,en;q=0.5
+Accept-Encoding: gzip,deflate
+Accept-Charset: ISO-8859-1,utf-8;q=0.7,*;q=0.7
+Keep-Alive: 300
+Connection: keep-alive
+Cache-Control: max-age=0
+
+adslfkj
+alkfj
diff --git a/test/http/input3 b/test/http/input3
new file mode 100644
index 00000000..16b817f1
--- /dev/null
+++ b/test/http/input3
@@ -0,0 +1,8 @@
+GET foo HTTP/1.1
+hello: foo
+hi: there
+	my
+ friend
+ 
+ from outter space
+
diff --git a/test/http/xinetd.conf b/test/http/xinetd.conf
new file mode 100644
index 00000000..5c95545c
--- /dev/null
+++ b/test/http/xinetd.conf
@@ -0,0 +1,10 @@
+service colm_http
+{
+	type            = unlisted
+	socket_type	= stream
+	protocol	= tcp
+	port            = 3535
+	wait		= no
+	user		= thurston
+	server		= /home/thurston/devel/colm/test/http/http.bin
+}                                                                               
diff --git a/test/island.in b/test/island.in
new file mode 100644
index 00000000..d34467bb
--- /dev/null
+++ b/test/island.in
@@ -0,0 +1,19 @@
+class
+{ 
+	1;
+	"string";
+	foo;
+	func() 
+	{ 
+		func()
+		{ 
+			1+{2}
+		}
+	} 
+}
+
+func()
+{
+	"data"
+	{a}
+} 
diff --git a/test/island.lm b/test/island.lm
new file mode 100644
index 00000000..c407aa28
--- /dev/null
+++ b/test/island.lm
@@ -0,0 +1,57 @@
+
+lex function_body
+{
+	token func_chr /[^{}]+/
+	token func_open /'{'/
+	token func_close /'}'/
+}
+
+def func_item 
+	[func_chr]
+|	[func_open func_body func_close]
+
+def func_body 
+	[func_item*]
+
+def func 
+	[ident '(' ')' '{' func_body func_close ]
+
+lex start
+{
+	token ident /[a-zA-Z_]+/
+	token number /[0-9]+/
+
+	rl s_string / "'" ([^'\\\n] | '\\' any )* "'" /
+	rl d_string / '"' ([^"\\\n] | '\\' any )* '"' /
+	token string /s_string | d_string/
+
+	literal '+', '*', ';', '(', ')', '{', '}'
+
+	ignore wp / [ \t\n]+ /
+}
+
+def class_item
+	[func]
+|	[class]
+|	[ident ';']
+|	[number ';']
+|	[string ';']
+
+def class_body 
+	[class_item*]
+
+def class 
+	[ident '{' class_body '}' ]
+
+def top_item 
+	[func]
+|	[class]
+
+def start 
+	[top_item*]
+	{
+		print_xml(lhs)
+	}
+
+#pattern start
+#	~class { func() { func() { 1+{2}} } } func() {{a}} 
diff --git a/test/liftattrs.in b/test/liftattrs.in
new file mode 100644
index 00000000..5a50f377
--- /dev/null
+++ b/test/liftattrs.in
@@ -0,0 +1,3 @@
+<t1 a=b foo=bar1 c=d>
+	<t2 foo=bar2 e=f></t2>
+</t1>
diff --git a/test/liftattrs.lm b/test/liftattrs.lm
new file mode 100644
index 00000000..305a805b
--- /dev/null
+++ b/test/liftattrs.lm
@@ -0,0 +1,74 @@
+
+#
+# Regular Definitions
+#
+rl rl_ws /[ \t\n\r\v]+/
+rl rl_id /[a-zA-Z_][a-zA-Z0-9_]*/
+
+#
+# Tokens
+#
+
+lex start
+{
+	literal '=', '<', '>', '/'
+
+	# Ignore whitespace.
+	ignore /rl_ws/
+
+	# Open and close id
+	token id /rl_id/
+}
+
+#
+# Productions
+#
+
+def attr [id '=' id]
+
+def attr_list 
+	[attr_list attr]
+|	[]
+
+def open_tag 
+	['<' id attr_list '>']
+
+def close_tag
+	['<' '/' id '>']
+
+def tag 
+	[open_tag item_list close_tag]
+
+def item_list 
+	[item_list tag]
+|	[]
+
+item_list IL = parse item_list(stdin)
+
+# Get the item list
+match IL [RootItemList: item_list]
+
+# List for collecting the attrs we pull out.
+attr_list CollectedAttrs = construct attr_list []
+
+# Iterate through all attributes
+for AttrListIter:attr_list in RootItemList {
+	# If the name of the attr is foo, remove it.
+	if match AttrListIter
+		[SubAttrList:attr_list "foo=" Val:id]
+	{
+		# Remove the attribute
+		AttrListIter = construct attr_list 
+			[SubAttrList]
+
+		# Add it to the collection
+		CollectedAttrs = construct attr_list 
+			[CollectedAttrs " foo=" Val]
+	}
+}
+
+# Reconstruct the item list, wrapped in a tag carrying the collected attrs.
+IL = construct item_list 
+	["<wrapper" CollectedAttrs ">" RootItemList "</wrapper>"]
+
+print( IL, '\n' )
diff --git a/test/mailbox.in b/test/mailbox.in
new file mode 100644
index 00000000..412f8bed
--- /dev/null
+++ b/test/mailbox.in
@@ -0,0 +1,29 @@
+From thurston  Tue Jan  2 21:16:50 2007
+Return-Path: <unknown>
+X-Spam-Level: *
+Received: from [109.111.71.111] (helo=twfmtr)
+	by zifreax with smtp (Exim 4.43)
+	id 1H1vfs-0005LN-HW; Tue, 2 Jan 2007 21:16:16 -0500
+Message-ID: <459B113F.8050903@immoarthabitatge.com>
+X-Keywords:                   
+X-UID: 1
+
+Content-Type: text/html; charset=ISO-8859-1
+</body>
+</html>
+
+From thurston  Wed Jan  3 02:35:48 2007
+Return-Path: <unknown>
+X-Spam-Checker-Version: SpamAssassin 3.1.1 (2006-03-10) on mambo.cs.queensu.ca
+X-Spam-Level: **
+X-Spam-Status: No, score=2.9 required=5.0 tests=BAYES_20,EXTRA_MPART_TYPE,
+	HTML_40_50,HTML_IMAGE_ONLY_16,HTML_MESSAGE,RCVD_IN_BL_SPAMCOP_NET 
+	autolearn=no version=3.1.1
+X-Bogosity: Unsure, tests=bogofilter, spamicity=0.971708, version=1.0.2
+Status: RO
+X-UID: 2
+
+------=_NextPart_000_0010_01C72F11.F137BD60
+	charset="windows-1252"
+Content-Transfer-Encoding: quoted-printable
+
diff --git a/test/mailbox.lm b/test/mailbox.lm
new file mode 100644
index 00000000..3387fcff
--- /dev/null
+++ b/test/mailbox.lm
@@ -0,0 +1,44 @@
+
+# lines, and fromlines 
+lex lines
+{
+	rl day /[A-Z][a-z][a-z]/
+	rl month /[A-Z][a-z][a-z]/
+	rl year /[0-9][0-9][0-9][0-9]/
+	rl time /[0-9][0-9] ':' [0-9][0-9]  ( ':' [0-9][0-9] )? /
+	rl letterZone /[A-Z][A-Z][A-Z]/
+	rl numZone /[+\-][0-9][0-9][0-9][0-9]/
+	rl zone / letterZone | numZone/
+	rl dayNum /[0-9 ][0-9]/
+
+	# These are the different formats of the date minus an obscure
+	# type that has a funny string 'remote from xxx' on the end. Taken
+	# from c-client in the imap-2000 distribution.
+	rl date / day ' ' month ' ' dayNum ' ' time ' '
+		( year | year ' ' zone | zone ' ' year ) /
+
+	# From lines separate messages. We will exclude from_line from a message
+	# body line.  This will cause us to stay in message line up until an
+	# entirely correct from line is matched.
+	token from_line / 'From ' (any-'\n')* ' ' date '\n' /
+	token simple_line / [^\n]* '\n' /
+}
+
+rl hchar /print - [ :]/
+token header_name /hchar+/
+
+token colon /':' ' '*/
+token header_content / ([^\n] | '\n' [ \t])* '\n'/
+token blank_line / '\n' /
+
+def header 
+	[header_name colon header_content]
+
+def message 
+	[from_line header* blank_line simple_line*]
+
+def start 
+	[message*]
+	{
+		print_xml( lhs )
+	}
diff --git a/test/matchex.in b/test/matchex.in
new file mode 100644
index 00000000..f458f2ad
--- /dev/null
+++ b/test/matchex.in
@@ -0,0 +1,3 @@
+<person name=adrian hometown=kingston>
+	<t1 foo=bar2 e=f></t2>
+</person>
\ No newline at end of file
diff --git a/test/matchex.lm b/test/matchex.lm
new file mode 100644
index 00000000..67b69238
--- /dev/null
+++ b/test/matchex.lm
@@ -0,0 +1,34 @@
+lex start
+{
+	token id /[a-zA-Z_][a-zA-Z0-9_]*/
+	literal '=', '<', '>', '/'
+	ignore /[ \t\n\r\v]+/
+}
+
+def attr 
+	[id '=' id]
+
+def open_tag 
+	['<' id attr* '>']
+
+def close_tag
+	['<' '/' id '>']
+
+def tag 
+	[open_tag item* close_tag]
+
+def item
+	[tag]
+|	[id]
+
+tag Tag = parse tag( stdin )
+
+# Style: List of literal text and types.
+match Tag ["<person name=" Val1:id attr*">" item* "</person>"]
+
+# Style: Literal text with embedded lists of types.
+match Tag "<person name=[Val2:id attr*]>[item*]</person>"
+
+print( Val1, '\n' )
+print( Val2, '\n' )
+
diff --git a/test/maxlen.lm b/test/maxlen.lm
new file mode 100644
index 00000000..19869634
--- /dev/null
+++ b/test/maxlen.lm
@@ -0,0 +1,44 @@
+
+#
+# Regular Definitions
+#
+rl rl_ws /[ \t\n\r\v]+/
+rl rl_id /[a-zA-Z_][a-zA-Z0-9_]*/
+
+#
+# Tokens
+#
+
+lex start
+{
+	ignore /rl_ws/
+	token id /rl_id/
+}
+
+global int num
+global int allow = 3
+
+def item 
+	[id]
+	{
+		num = num + 1
+		int toomuch = allow+1
+		if num == toomuch {
+			reject
+		}
+	}
+
+def open
+	[]
+	{
+		num = 0
+	}
+
+def close []
+
+def restricted_list 
+	[open item*]
+
+def start 
+	[restricted_list id*]
+
diff --git a/test/nestedcomm.in b/test/nestedcomm.in
new file mode 100644
index 00000000..11789576
--- /dev/null
+++ b/test/nestedcomm.in
@@ -0,0 +1 @@
+hello there ( (this is a nested comment /*sdf;asd_++_stuff) ) and this is not
diff --git a/test/nestedcomm.lm b/test/nestedcomm.lm
new file mode 100644
index 00000000..cc28726e
--- /dev/null
+++ b/test/nestedcomm.lm
@@ -0,0 +1,41 @@
+#
+# Tokens
+#
+
+# Any single character can be a literal
+lex start
+{
+	# Ignore whitespace.
+	ignore /[ \t\n\r\v]+/
+
+	# Identifiers
+	token id /[a-zA-Z_][a-zA-Z0-9_]*/
+
+	token open_paren /'('/ 
+	{
+		send_ignore( parse_stop nested_comment( stdin ) )
+	}
+}
+
+#
+# Token translation
+#
+
+lex nc_scan
+{
+	literal '(', ')'
+	token nc_data /[^()]+/
+}
+
+def nc_item 
+	[nc_data]
+|	[nested_comment]
+
+def nested_comment 
+	['(' nc_item* ')']
+
+def nested [id*]
+
+nested P = parse nested( stdin )
+print_xml( P )
+print( P, '\n' )
diff --git a/test/python/Makefile b/test/python/Makefile
new file mode 100644
index 00000000..eeab1e53
--- /dev/null
+++ b/test/python/Makefile
@@ -0,0 +1,18 @@
+#
+#   Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+all: $(BIN)
+
+$(BIN): $(COLM)
+
+$(BIN): %.bin: %.lm
+	$(COLM) $<
+
+clean:
+	rm -f *.cpp *.bin
diff --git a/test/python/input1.py b/test/python/input1.py
new file mode 100644
index 00000000..22ffd2e1
--- /dev/null
+++ b/test/python/input1.py
@@ -0,0 +1,18 @@
+
+# dude, this is a comment
+ # some more
+hello
+def dude():
+    yes
+    awesome;
+
+    # Here we have a comment
+    def realy_awesome(): # hi there
+      in_more
+
+      same_level 
+      def one_liner(): first; second # both inside one_liner
+
+    back_down
+
+last_statement
diff --git a/test/python/input2.py b/test/python/input2.py
new file mode 100644
index 00000000..063825e1
--- /dev/null
+++ b/test/python/input2.py
@@ -0,0 +1,20 @@
+
+# dude, this is a comment
+ # some more
+hello
+if 1:
+    yes
+    awesome;
+
+    # Here we have a comment
+    if ('hello'): # hi there
+      in_more
+
+      same_level 
+      if ['dude', 'dudess'].horsie(): first; second # both inside one_liner
+      1
+
+    back_down
+
+last_statement
+
diff --git a/test/python/input3.py b/test/python/input3.py
new file mode 100644
index 00000000..90ecf3f9
--- /dev/null
+++ b/test/python/input3.py
@@ -0,0 +1 @@
+hello = 1.1(20);
diff --git a/test/python/input4.py b/test/python/input4.py
new file mode 100644
index 00000000..1a281c46
--- /dev/null
+++ b/test/python/input4.py
@@ -0,0 +1,10 @@
+
+# subscription
+a[1] = b[2];
+
+# simple slicing
+a[1:1] = b[2:2];
+
+# simple slicing
+a[1:1, 2:2] = b[3:3, 4:4];
+
diff --git a/test/python/python.lm b/test/python/python.lm
new file mode 100644
index 00000000..7d579955
--- /dev/null
+++ b/test/python/python.lm
@@ -0,0 +1,726 @@
+# Regular definitions
+rl ident_char /[a-zA-Z_]/
+
+# List used as a stack of indentations.
+list indent_stack [int]
+global indent_stack IndentStack = construct indent_stack []
+IndentStack.push( 0 )
+
+# Has a newline been sent for this '\n' .. whitespace match. 
+global int newline_sent = 0
+
+# Tokens. 
+lex start
+{
+	# Python keywords.
+	literal 'and', 'del', 'from', 'not', 'while', 'as', 'elif', 'global', 'or',
+		'with', 'assert', 'else', 'if', 'pass', 'yield', 'break', 'except',
+		'import', 'print', 'class', 'exec', 'in', 'raise', 'continue',
+		'finally', 'is', 'return', 'def', 'for', 'lambda', 'try'
+
+	# Identifiers
+	rl lowercase /'a'..'z'/
+	rl uppercase /'A'..'Z'/
+	rl letter /lowercase | uppercase/
+	token identifier /(letter|'_') (letter | digit | '_')*/
+
+	# Literals
+	rl escapeseq /'\\' any /
+	rl longstringchar /[^\\]/
+	rl shortstringchar_s /[^\\\n']/
+	rl shortstringchar_d /[^\\\n"]/
+	rl longstringitem /longstringchar | escapeseq/
+	rl shortstringitem_s /shortstringchar_s | escapeseq/
+	rl shortstringitem_d /shortstringchar_d | escapeseq/
+	rl longstring /"'''" longstringitem* :>> "'''" | '"""' longstringitem* :>> '"""'/
+	rl shortstring /"'" shortstringitem_s* "'" | '"' shortstringitem_d* '"'/
+	rl stringprefix /"r" | "u" | "ur" | "R" | "U" | "UR" | "Ur" | "uR"/
+	token stringliteral /stringprefix? (shortstring | longstring)/
+
+	# Integers
+	rl hexdigit /digit | 'a'..'f' | 'A'..'F'/
+	rl octdigit /'0'..'7'/
+	rl nonzerodigit /'1'..'9'/
+	rl hexinteger /'0' ('x' | 'X') hexdigit+/
+	rl octinteger /'0' octdigit+/
+	rl decimalinteger /nonzerodigit digit* | '0'/
+	token integer /decimalinteger | octinteger | hexinteger/
+	token longinteger /integer ('l' | 'L')/
+
+	# Floats.
+	rl exponent /('e' | 'E') ('+' | '-')? digit+/
+	rl fraction /'.' digit+/
+	rl intpart /digit+/
+	rl pointfloat /intpart? fraction | intpart '.'/
+	rl exponentfloat /(intpart | pointfloat) exponent/
+	token floatnumber /pointfloat | exponentfloat/
+
+	# Imaginaries.
+	token imagnumber /(floatnumber | intpart) ("j" | "J")/
+
+	# Operators.
+	literal '+', '-', '*', '**', '/', '//', '%', '<<', '>>', '&', '|', '^',
+		'~', '<', '>', '<=', '>=', '==', '!=', '<>'
+	
+	# Delimiters
+	literal '(', ')', '[', ']', '{', '}', '@', ',', ':', '.', '`', '=', ';',
+		'+=', '-=', '*=', '/=', '//=', '%=', '&=', '|=', '^=', '>>=', '<<=',
+		'**='
+	
+	literal '...'
+
+	# In general whitespace is ignored.
+	ignore WS /' '+/
+
+	# Find and ignore entire blank lines.
+	token BLANK_LINE 
+		/ '\n' [ \t]* ('#' [^\n]*)? '\n' /
+		{
+			# Need to shorten to take off the newline.
+			# Turn it into ignore.
+			send_ignore( make_token( typeid WS, pull(stdin, match_length - 1) ) )
+		}
+
+	# Find and ignore comments.
+	token COMMENT 
+		/ '#' [^\n]* '\n' /
+		{
+			# Need to shorten to take off the newline. Turn it into ignore.
+			send_ignore( make_token( typeid WS, pull(stdin, match_length - 1) ) )
+		}
+
+	# These tokens are generated
+	token INDENT //
+	token DEDENT //
+	token NEWLINE //
+	ignore IND_WS //
+
+	token INDENTATION 
+		/'\n' [ \t]*/
+		{
+			# First the newline.
+			send( make_token( typeid NEWLINE, '' ) )
+
+			# We have already sent the newline, compute the indentation level.
+			int data_length = match_length - 1
+
+			if data_length > IndentStack.top {
+				# The indentation level is more than the level on the top
+				# of the stack. This is an indent event. Send as an INDENT.
+				send( make_token( typeid INDENT, '' ) )
+
+				# Push to the stack as per python manual.
+				IndentStack.push( data_length )
+			} else {
+				while data_length < IndentStack.top {
+					# The indentation level is less than the level on the top of
+					# the stack. Pop the level and send one dedent. This flow of
+					# control will execute until we find the right indentation level
+					# to match up with.
+					IndentStack.pop()
+
+					# Send as a DEDENT
+					send( make_token( typeid DEDENT, '' ) )
+				}
+			}
+
+			# FIXME: if data_length is now > top of stack then error. This
+			# means the dedent does not match any enclosing indentation level.
+
+			# We have squared up INDENTs and DEDENTs. Ignore the entire match.
+			send_ignore( make_token( typeid WS, pull(stdin, match_length) ) )
+		}
+}
+
+# Blank lines or comment lines at the beginning of the file.
+token LEADER / ( [ \t]* ('#' [^\n]*)? '\n' )* /
+
+int print_target_subscriptions_and_slicings( start Start )
+{
+	for TI: target_ext in Start {
+		if match TI [subscription] {
+			print( 'TARGET SUBSCRIPTION: ', TI, '\n' )
+		}
+
+		if match TI [simple_slicing] {
+			print( 'TARGET SIMPLE SLICING: ', TI, '\n' )
+		}
+
+		if match TI [extended_slicing] {
+			print( 'TARGET EXTENDED SLICING: ', TI, '\n' )
+		}
+	}
+	
+}
+
+int print_primary_subscriptions_and_slicings( start Start )
+{
+	for PI:primary_ext in Start {
+		if match PI [subscription] {
+			print( 'PRIMARY SUBSCRIPTION: ', PI, '\n' )
+		}
+
+		if match PI [simple_slicing] {
+			print( 'PRIMARY SIMPLE SLICING: ', PI, '\n' )
+		}
+
+		if match PI [extended_slicing] {
+			print( 'PRIMARY EXTENDED SLICING: ', PI, '\n' )
+		}
+	}
+}
+
+def start 
+	[file_input]
+
+def file_input 
+	[file_input_forms*]
+
+def file_input_forms 
+	[statement]
+|	[NEWLINE]
+
+def statement 
+	[stmt_list NEWLINE]
+|	[compound_stmt]
+
+def stmt_list 
+	[simple_stmt another_stmt* opt_semi]
+
+def another_stmt 
+	[';' simple_stmt]
+
+def opt_semi 
+	[';']
+|	[]
+
+def suite 
+	[stmt_list NEWLINE]
+|	[NEWLINE INDENT statement_seq DEDENT]
+
+def statement_seq 
+	[statement_seq statement]
+|	[statement]
+
+def compound_stmt 
+	[if_stmt]
+|	[while_stmt]
+|	[for_stmt]
+|	[try_stmt]
+|	[with_stmt]
+|	[funcdef]
+|	[classdef]
+
+def if_stmt 
+	['if' expression ':' suite elif_part* opt_else_part]
+
+def elif_part 
+	['elif' expression ':' suite]
+
+def opt_else_part 
+	['else' ':' suite]
+|	[]
+
+def while_stmt 
+	['while' expression ':' suite opt_else_part]
+
+def for_stmt 
+	['for' target_list 'in' expression_list ':' suite opt_else_part]
+
+def try_stmt 
+	['try' ':' suite except_list opt_else_part opt_finally_part]
+|	['try' ':' suite 'finally' ':' suite]
+
+def except_list 
+	[except_list except_part]
+|	[except_part]
+
+def except_part 
+	['except' ':' suite]
+|	['except' expression ':' suite]
+|	['except' expression ',' target ':' suite]
+
+def opt_finally_part 
+	['finally' ':' suite]
+|	[]
+  
+def with_stmt 
+	['with' expression ':' suite]
+|	['with' expression 'as' target ':' suite]
+
+def funcdef 
+	[decorators 'def' funcname '(' opt_parameter_list ')' ':' suite]
+
+def funcname 
+	[identifier]
+
+def decorators 
+	[decorators decorator]
+|	[]
+  
+def decorator 
+	['@' dotted_name opt_decorator_pal NEWLINE]
+
+def opt_decorator_pal 
+	[]
+|	['(' ')'] 
+|	['(' argument_list ')'] 
+|	['(' argument_list ',' ')'] 
+  
+def dotted_name 
+	[dotted_name '.' identifier]
+|	[identifier]
+
+def opt_parameter_list 
+	[parameter_list]
+|	[]
+
+def parameter_list 
+	[defparameter_list defparameter opt_comma]
+|	[defparameter_list '*' identifier]
+|	[defparameter_list '*' identifier '**' identifier]
+|	[defparameter_list '**' identifier]
+
+def defparameter_list 
+	[defparameter_list defparameter ',']
+|	[]
+  
+def defparameter 
+	[parameter]
+|	[parameter '=' expression]
+  
+def sublist 
+	[parameter_list opt_comma]
+
+def parameter_list 
+	[parameter_list ',' parameter]
+|	[parameter]
+  
+def parameter 
+	[identifier]
+|	['(' sublist ')']
+  
+def classdef 
+	['class' classname opt_inheritance ':' suite]
+
+def classname 
+	[identifier]
+
+def opt_inheritance 
+	['(' ')']
+|	['(' expression_list ')']
+|	[]
+
+def simple_stmt 
+	[expression_stmt]
+|	[assert_stmt]
+|	[assignment_stmt]
+|	[augmented_assignment_stmt]
+|	[pass_stmt]
+|	[del_stmt]
+|	[print_stmt]
+|	[return_stmt]
+|	[yield_stmt]
+|	[raise_stmt]
+|	[break_stmt]
+|	[continue_stmt]
+|	[import_stmt]
+|	[global_stmt]
+|	[exec_stmt]
+
+def expression_stmt 
+	[expression_list]
+
+def assert_stmt 
+	['assert' expression_list_core]
+
+def assignment_stmt 
+	[target_equals_list expression_list]
+
+def target_equals_list 
+	[target_equals_list target_equals]
+|	[target_equals]
+
+def target_equals 
+	[target_list '=']
+
+def target_list 
+	[target_list_core opt_comma]
+
+def target_list_core 
+	[target_list_core ',' target]
+|	[target]
+
+def target 
+	[target_atom target_ext_rep]
+
+def target_atom
+	[identifier]
+|	['(' target_list ')']
+|	['[' target_list ']']
+
+def target_ext_rep [target_ext target_ext_rep]
+def target_ext_rep []
+
+def target_ext
+	[attributeref]
+|	[subscription]
+|	[slicing]
+
+def augmented_assignment_stmt 
+	[target augop expression_list]
+  
+# Augmented assignment operators. Every alternative is an 'op=' delimiter token.
+def augop 
+	['+='] | ['-='] | ['*='] | ['/='] | ['//='] | ['\%='] | ['**=']
+|	['>>='] | ['<<='] | ['\&='] | ['^='] | ['|=']
+
+def pass_stmt 
+	['pass']
+
+def del_stmt 
+	['del' target_list]
+
+def print_stmt 
+	['print' opt_expression_list]
+|	['print' '>>' expression_list]
+
+def return_stmt 
+	['return' opt_expression_list] 
+
+def yield_stmt 
+	['yield' expression_list]
+
+def raise_stmt 
+	['raise']
+|	['raise' expression]
+|	['raise' expression ',' expression]
+|	['raise' expression ',' expression ',' expression]
+
+def break_stmt 
+	['break']
+
+def continue_stmt 
+	['continue']
+
+def import_stmt 
+	['import' module opt_as_name more_imports]
+|	['from' module 'import' identifier opt_as_name more_imports]
+|	['from' module 'import' '(' identifier opt_as_name more_imports opt_comma ')']
+|	['from' module 'import' '*']
+
+def more_imports 
+	[more_imports ',' identifier opt_as_name]
+|	[]
+
+def module 
+	[module '.' identifier]
+|	[identifier]
+
+def opt_as_name 
+	['as' identifier]
+|	[]
+
+def global_stmt 
+	['global' identifer_list]
+
+def identifer_list 
+	[identifer_list ',' identifier]
+|	[identifier]
+
+def exec_stmt 
+	['exec' expression]
+|	['exec' expression 'in' expression]
+|	['exec' expression 'in' expression ',' expression]
+
+def opt_expression_list 
+	[expression_list]
+|	[]
+
+def expression_list 
+	[expression_list_core opt_comma]
+
+def expression_list_core 
+	[expression_list_core ',' expression]
+|	[expression]
+
+def opt_comma 
+	[',']
+|	[]
+
+def expression 
+	[or_test 'if' or_test 'else' test]
+|	[or_test]
+|	[lambda_form]
+
+def or_test 
+	[or_test 'or' and_test]
+|	[and_test]
+  
+def and_test 
+	[and_test 'and' not_test]
+|	[not_test]
+  
+def not_test 
+	[comparison]
+|	['not' not_test]
+
+def lambda_form 
+	['lambda' opt_parameter_list ':' expression]
+
+def test 
+	[or_test]
+|	[lambda_form]
+
+def comparison 
+	[or_expr comparison_part*]
+
+def comparison_part 
+	[comp_operator or_expr]
+
+def comp_operator 
+	['<'] | ['>'] | ['=='] | ['>='] | ['<='] | ['<>'] | ['!='] | ['is'] |
+	['is' 'not'] | ['in'] | ['not' 'in']
+
+def or_expr 
+	[or_expr '|' xor_expr]
+|	[xor_expr]
+
+def xor_expr 
+	[xor_expr '^' and_expr]
+|	[and_expr]
+
+def and_expr 
+	[and_expr '&' shift_expr]
+|	[shift_expr]
+
+def shift_expr 
+	[shift_expr '<<' a_expr]
+|	[shift_expr '>>' a_expr]
+|	[a_expr]
+
+def a_expr 
+	[a_expr '+' m_expr]
+|	[a_expr '-' m_expr]
+|	[m_expr]
+
+def m_expr 
+	[m_expr '*' u_expr]
+|	[m_expr '//' u_expr]
+|	[m_expr '/' u_expr]
+|	[m_expr '\%' u_expr]
+|	[u_expr]
+
+def u_expr 
+	[power]
+|	['-' u_expr]
+|	['+' u_expr]
+|	['\~' u_expr]
+
+def power 
+	[primary '**' u_expr]
+|	[primary] 
+
+def primary 
+	[atom primary_ext_rep]
+
+def atom 
+	[identifier]
+|	[pyliteral]
+|	[enclosure]
+
+def primary_ext_rep
+	[primary_ext primary_ext_rep]
+|	[]
+
+def primary_ext
+	[attributeref]
+|	[subscription]
+|	[slicing]
+|	[call]
+
+def pyliteral 
+	[stringliteral]
+|	[integer]
+|	[longinteger]
+|	[floatnumber]
+|	[imagnumber]
+
+def enclosure 
+	[parenth_form]
+|	[list_display]
+|	[generator_expression]
+|	[dict_display]
+|	[string_conversion]
+
+def parenth_form 
+	['(' opt_expression_list ')']
+
+def list_display 
+	['[' opt_listmaker ']']
+
+def opt_listmaker 
+	[listmaker]
+|	[]
+
+def listmaker 
+	[expression list_for]
+|	[expression listmaker_ext* opt_comma]
+
+def listmaker_ext
+	[',' expression]
+
+def opt_list_iter 
+	[list_iter]
+|	[]
+
+def list_iter 
+	[list_for] 
+|	[list_if]
+
+def list_if 
+	['if' test opt_list_iter]
+
+def list_for 
+	['for' expression_list 'in' testlist opt_list_iter]
+
+def testlist 
+	[test testlist_ext* opt_comma]
+
+def testlist_ext 
+	[',' test ]
+
+def generator_expression 
+	['(' test genexpr_for ')']
+
+def genexpr_for 
+	['for' expression_list 'in' test opt_genexpr_iter]
+
+def opt_genexpr_iter 
+	[genexpr_iter] 
+|	[] 
+
+def genexpr_iter 
+	[genexpr_for] 
+|	[genexpr_if]
+  
+def genexpr_if 
+	['if' test opt_genexpr_iter]
+
+def dict_display 
+	['\{' opt_key_datum_list '\}']
+
+def opt_key_datum_list 
+	[key_datum_list]
+|	[]
+
+def key_datum_list 
+	[key_datum key_datum_list_ext* opt_comma]
+
+def key_datum_list_ext 
+	[',' key_datum]
+
+def key_datum 
+	[expression ':' expression]
+
+def string_conversion 
+	['`' expression_list '`']
+
+def attributeref 
+	['.' identifier]
+
+def subscription 
+	['[' expression_list ']']
+
+# The natural ordered choice does not suffice here. Must force it.
+
+def slicing 
+	[simple_slicing]
+|	[extended_slicing]
+
+def simple_slicing 
+	['[' short_slice ']']
+
+def extended_slicing 
+	['[' slice_list ']']
+
+def slice_list 
+	[slice_item slice_list_ext* opt_comma]
+
+def slice_list_ext 
+	[',' slice_item]
+  
+def slice_item 
+	[expression]
+|	[proper_slice]
+|	[ellipsis]
+  
+def proper_slice 
+	[short_slice]
+|	[long_slice]
+  
+def short_slice 
+	[':']
+|	[':' upper_bound]
+|	[lower_bound ':']
+|	[lower_bound ':' upper_bound]
+  
+def long_slice 
+	[short_slice ':' stride]
+|	[short_slice ':']
+  
+def lower_bound 
+	[expression]
+  
+def upper_bound 
+	[expression]
+  
+def stride 
+	[expression]
+
+def ellipsis 
+	['...']
+
+def call 
+	['(' opt_argument_list ')']
+
+def opt_argument_list 
+	[argument_list opt_comma]
+|	[]
+  
+def argument_list 
+	[positional_arguments opt_comma_keyword_arguments
+		opt_comma_star_expr opt_comma_dstar_expr]
+|	[keyword_arguments opt_comma_star_expr opt_comma_dstar_expr]
+|	['*' expression opt_comma_dstar_expr]
+|	['**' expression]
+
+def opt_comma_star_expr 
+	[',' '*' expression] 
+|	[] 
+
+def opt_comma_dstar_expr 
+	[',' '**' expression] 
+|	[] 
+  
+def positional_arguments 
+	[positional_arguments ',' expression]
+|	[expression]
+  
+def opt_comma_keyword_arguments 
+	[',' keyword_arguments]
+|	[]
+
+def keyword_arguments 
+	[keyword_arguments ',' keyword_item]
+|	[keyword_item]
+
+def keyword_item 
+	[identifier '=' expression]
+
+
+start S = parse start( stdin )
+#print_xml( S )
+print_target_subscriptions_and_slicings( S )
+print_primary_subscriptions_and_slicings( S )
+print( '*** SUCCESS ***\n' )
diff --git a/test/ragelambig.in b/test/ragelambig.in
new file mode 100644
index 00000000..0b4439e5
--- /dev/null
+++ b/test/ragelambig.in
@@ -0,0 +1 @@
+1 - 1
diff --git a/test/ragelambig1.lm b/test/ragelambig1.lm
new file mode 100644
index 00000000..1c292fd1
--- /dev/null
+++ b/test/ragelambig1.lm
@@ -0,0 +1,65 @@
+lex start
+{
+	ignore /[\t\n ]+/
+	literal '^', '|', '-', ',', ':', '!', '?', '.'
+	literal '(', ')', '{', '}', '*', '&', '+'
+
+	literal '--', ':>', ':>>', '<:', '->', '**'
+
+	token word /[a-zA-Z_][a-zA-Z0-9_]*/
+	token uint /[0-9]+/
+}
+
+
+def start 
+	[expression]
+	{
+		print_xml( lhs )
+	}
+
+def expression 
+	[expression '|' term]
+|	[expression '&' term]
+|	[expression '-' term]
+|	[expression '--' term]
+|	[term]
+
+def term 
+	[term factor_with_rep]
+	{
+		if match lhs [term '-' uint] {
+			reject
+		}
+	}
+|	[term '.' factor_with_rep]
+|	[term ':>' factor_with_rep]
+|	[term ':>>' factor_with_rep]
+|	[term '<:' factor_with_rep]
+|	[factor_with_rep]
+
+def factor_with_rep 
+	[factor_with_rep '*']
+|	[factor_with_rep '**']
+|	[factor_with_rep '?']
+|	[factor_with_rep '+']
+|	[factor_with_rep '{' factor_rep_num '}']
+|	[factor_with_rep '{' ',' factor_rep_num '}']
+|	[factor_with_rep '{' factor_rep_num ',' '}']
+|	[factor_with_rep '{' factor_rep_num ',' factor_rep_num '}']
+|	[factor_with_neg]
+
+def factor_rep_num [uint]
+
+def factor_with_neg 
+	['!' factor_with_neg]
+|	['^' factor_with_neg]
+|	[factor]
+
+def factor 
+	[alphabet_num]
+|	[word]
+|	['(' expression ')']
+
+def alphabet_num 
+	[uint]
+|	['-' uint]
diff --git a/test/ragelambig2.lm b/test/ragelambig2.lm
new file mode 100644
index 00000000..70e97c66
--- /dev/null
+++ b/test/ragelambig2.lm
@@ -0,0 +1,65 @@
+lex start
+{
+	ignore /[\t\n ]+/
+	literal '^', '|', '-', ',', ':', '!', '?', '.'
+	literal '(', ')', '{', '}', '*', '&', '+'
+
+	literal '--', ':>', ':>>', '<:', '->', '**'
+
+	token word /[a-zA-Z_][a-zA-Z0-9_]*/
+	token uint /[0-9]+/
+}
+
+
+def start 
+	[expression]
+	{
+		print_xml( lhs )
+	}
+
+def expression 
+	[expression '|' term]
+|	[expression '&' term]
+|	[expression '-' term]
+|	[expression '--' term]
+|	[term]
+
+def term 
+	[factor_with_rep more_term]
+
+# The ambiguity can be resolved by making more_term a shortest match.
+def more_term 
+	[]
+|	[factor_with_rep more_term]
+|	['.' factor_with_rep more_term]
+|	[':>' factor_with_rep more_term]
+|	[':>>' factor_with_rep more_term]
+|	['<:' factor_with_rep more_term]
+
+def factor_with_rep 
+	[factor_with_rep '*']
+|	[factor_with_rep '**']
+|	[factor_with_rep '?']
+|	[factor_with_rep '+']
+|	[factor_with_rep '{' factor_rep_num '}']
+|	[factor_with_rep '{' ',' factor_rep_num '}']
+|	[factor_with_rep '{' factor_rep_num ',' '}']
+|	[factor_with_rep '{' factor_rep_num ',' factor_rep_num '}']
+|	[factor_with_neg]
+
+def factor_rep_num 
+	[uint]
+
+def factor_with_neg 
+	['!' factor_with_neg]
+|	['^' factor_with_neg]
+|	[factor]
+
+def factor 
+	[alphabet_num]
+|	[word]
+|	['(' expression ')']
+
+def alphabet_num 
+	[uint]
+|	['-' uint]
diff --git a/test/ragelambig3.lm b/test/ragelambig3.lm
new file mode 100644
index 00000000..649038e5
--- /dev/null
+++ b/test/ragelambig3.lm
@@ -0,0 +1,64 @@
+lex start
+{
+	ignore /[\t\n ]+/
+	literal '^', '|', '-', ',', ':', '!', '?', '.'
+	literal '(', ')', '{', '}', '*', '&', '+'
+
+	literal '--', ':>', ':>>', '<:', '->', '**'
+
+	token word /[a-zA-Z_][a-zA-Z0-9_]*/
+	token uint /[0-9]+/
+}
+
+
+def start 
+	[expression]
+	{
+		print_xml( lhs )
+	}
+
+def expression 
+	[expression '|' term_short]
+|	[expression '&' term_short]
+|	[expression '-' term_short]
+|	[expression '--' term_short]
+|	[term_short]
+
+def term_short 
+	reducefirst
+	[term]
+
+def term 
+	[term factor_with_rep]
+|	[term '.' factor_with_rep]
+|	[term ':>' factor_with_rep]
+|	[term ':>>' factor_with_rep]
+|	[term '<:' factor_with_rep]
+|	[factor_with_rep]
+
+def factor_with_rep 
+	[factor_with_rep '*']
+|	[factor_with_rep '**']
+|	[factor_with_rep '?']
+|	[factor_with_rep '+']
+|	[factor_with_rep '{' factor_rep_num '}']
+|	[factor_with_rep '{' ',' factor_rep_num '}']
+|	[factor_with_rep '{' factor_rep_num ',' '}']
+|	[factor_with_rep '{' factor_rep_num ',' factor_rep_num '}']
+|	[factor_with_neg]
+
+def factor_rep_num [uint]
+
+def factor_with_neg 
+	['!' factor_with_neg]
+|	['^' factor_with_neg]
+|	[factor]
+
+def factor 
+	[alphabet_num]
+|	[word]
+|	['(' expression ')']
+
+def alphabet_num 
+	[uint]
+|	['-' uint]
diff --git a/test/ragelambig4.lm b/test/ragelambig4.lm
new file mode 100644
index 00000000..d489bca3
--- /dev/null
+++ b/test/ragelambig4.lm
@@ -0,0 +1,69 @@
+lex start
+{
+	ignore /[\t\n ]+/
+	literal '^', '|', '-', ',', ':', '!', '?', '.'
+	literal '(', ')', '{', '}', '*', '&', '+'
+
+	literal '--', ':>', ':>>', '<:', '->', '**'
+
+	token word /[a-zA-Z_][a-zA-Z0-9_]*/
+	token uint /[0-9]+/
+}
+
+
+def start 
+	[expression]
+	{
+		print_xml( lhs )
+	}
+
+def expression [term expression_op*]
+
+def expression_op
+	['|' term]
+|	['&' term]
+|	['-' term]
+|	['--' term]
+
+def term [factor_rep term_op_list_short]
+
+# This list is written by hand (empty alternative first) to get a shortest match.
+def term_op_list_short
+	[]
+|	[term_op term_op_list_short]
+
+def term_op
+	[factor_rep]
+|	['.' factor_rep]
+|	[':>' factor_rep]
+|	[':>>' factor_rep]
+|	['<:' factor_rep]
+
+def factor_rep 
+	[factor_neg factor_rep_op*]
+
+def factor_rep_op
+	['*']
+|	['**']
+|	['?']
+|	['+']
+|	['{' factor_rep_num '}']
+|	['{' ',' factor_rep_num '}']
+|	['{' factor_rep_num ',' '}']
+|	['{' factor_rep_num ',' factor_rep_num '}']
+
+def factor_rep_num [uint]
+
+def factor_neg 
+	['!' factor_neg]
+|	['^' factor_neg]
+|	[factor]
+
+def factor 
+	[alphabet_num]
+|	[word]
+|	['(' expression ')']
+
+def alphabet_num 
+	[uint]
+|	['-' uint]
diff --git a/test/rediv.in b/test/rediv.in
new file mode 100644
index 00000000..f1ef2a38
--- /dev/null
+++ b/test/rediv.in
@@ -0,0 +1 @@
+2 / /[^gu-zy].*o[\d-xa]*/;
diff --git a/test/rediv.lm b/test/rediv.lm
new file mode 100644
index 00000000..c3750351
--- /dev/null
+++ b/test/rediv.lm
@@ -0,0 +1,92 @@
+# Or-literal scanner
+lex orlit
+{
+	token orlit_dash /'-' /
+	token orlit_close /']'/
+
+	rl orlit_specials /[\-\]]/
+	token orlit_chr /^orlit_specials | '\\' any/
+}
+
+def orlit_item 
+	[orlit_chr]
+|	[orlit_chr orlit_dash orlit_chr]
+
+def orlit 
+	[orlit_item*]
+
+# Regex scanner
+lex regex
+{
+	token orlit_open /'['/
+	token orlit_neg_open /'[^'/
+	token regex_dot /'.'/
+	token regex_star /'*'/
+	token regex_close /'/'/
+
+	rl regex_specials /[\[\.\*\/\\]/
+	token regex_chr /(^regex_specials)* | '\\' any/
+}
+
+def regex_rep 
+	[regex_star]
+|	[]
+
+def regex_base 
+	[regex_chr]
+|	[regex_dot]
+|	[orlit_open orlit orlit_close]
+|	[orlit_neg_open orlit orlit_close]
+
+def regex_item 
+	[regex_base regex_rep]
+
+def regex_body
+	[regex_item*]
+
+rl s_string /"'" ([^'\\\n] | '\\' any )* "'"/
+rl d_string /'"' ([^"\\\n] | '\\' any )* '"'/
+
+# Root scanner
+lex start
+{
+	token ident /[a-zA-Z_]+/
+	token number /[0-9]+/
+	token string /s_string | d_string/
+
+	literal '+', '-', '*', ';', '/'
+	token slash /'/'/
+	token semi /';'/
+
+	ignore wp /[ \t\n]+/
+}
+
+def factor 
+	[ident]
+|	[number]
+|	[string]
+|	['/' regex_body regex_close]
+
+def term 
+	[term '*' factor]
+|	[term '/' factor]
+|	[factor]
+
+def expr 
+	[expr '+' term]
+|	[expr '-' term]
+|	[term]
+
+def statement 
+	[expr ';']
+
+def start 
+	[statement*]
+	{
+		for I:orlit_item in lhs {
+			if match I [orlit_chr] {
+				print( I, '\n' )
+			}
+		}
+		print_xml( lhs )
+	}
diff --git a/test/ruby/Makefile b/test/ruby/Makefile
new file mode 100644
index 00000000..22647b42
--- /dev/null
+++ b/test/ruby/Makefile
@@ -0,0 +1,34 @@
+#
+#   Copyright 2008 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+all: $(BIN)
+
+$(BIN): $(COLM)
+
+$(BIN): %.bin: %.lm
+	$(COLM) $<
+
+clean:
+	rm -f *.cpp *.bin
diff --git a/test/ruby/ruby.lm b/test/ruby/ruby.lm
new file mode 100644
index 00000000..b9505515
--- /dev/null
+++ b/test/ruby/ruby.lm
@@ -0,0 +1,627 @@
+#
+# Grammar
+#
+
+# The items in this scanner may have a newline in front of them.
+lex start
+{
+	# Reserved Words.
+	literal '__LINE__', '__FILE__', '__ENCODING__', 'BEGIN', 'END', 'alias',
+		'and', 'begin', 'break', 'case', 'class', 'def', 'defined?', 'do',
+		'else', 'elsif', 'end', 'ensure', 'false', 'for', 'in', 'module',
+		'next', 'nil', 'not', 'or', 'redo', 'rescue', 'retry', 'return',
+		'self', 'super', 'then', 'true', 'undef', 'when', 'yield', 'if',
+		'unless', 'while', 'until'
+
+	token tNTH_REF /'$' [0-9]+/
+	token tBACK_REF /'$' ( '&' | '`' | '\'' | '+' ) /
+
+	literal ')', ',', ']'
+	literal '{', '}', ':'
+	literal '.', '::'
+	literal '->'
+	
+	# Unary operators.
+	literal '!', '~'
+	token tUPLUS /'+'/
+	token tUMINUS /'-'/
+
+	token tLBRACK /'['/
+	token tLPAREN /'('/
+	token tSTAR /'*'/
+	token tBAR /'|'/
+	token tAMPER /'&'/
+
+	token tIDENTIFIER /[a-z][a-zA-Z_]*/
+	token tFID /[a-z][a-zA-Z_]* ('!'|'?')/
+	token tCONSTANT /[A-Z][a-zA-Z_]*/
+	token tGVAR /'$' [a-zA-Z_]+/
+	token tIVAR /'@' [a-zA-Z_]+/
+	token tCVAR /'@@' [a-zA-Z_]+/
+
+	token tINTEGER /[0-9]+/
+	token tFLOAT /[0-9]+ '.' [0-9]+/
+
+	token tDSTRING_BEG /'"'/
+	token tSSTRING_BEG /'\''/
+	token tXSTRING_BEG /'`'/
+
+	ignore /[ \t\n]+/
+	ignore comment /'#' [^\n]* '\n'/
+}
+
+# These items cannot appear at the beginning of a line (except maybe the first).
+lex expr_cont_ops
+{
+	ignore /[\t ]+/
+
+	literal '+', '-', '*', '**', '/', '%', '^'
+	literal '|', '&', '||', '&&'
+	literal '[', '('
+	literal '='
+	literal '<<', '>>'
+	literal '?'
+	literal '<=>'
+	literal '=>'
+	literal '[]', '[]='
+	literal '=~', '!~'
+	literal '<', '>', '>=', '<='
+	literal '!=', '==', '==='
+	literal '..', '...'
+}
+lex terms
+{
+	ignore /[\t ]+/
+	ignore /'#' [^\n]*/
+	literal ';'
+	literal '\n'
+}
+
+
+lex dstring_contents
+{
+	token dstring_contents /[^"]+/
+	token tDSTRING_END /'"'/
+}
+
+lex sstring_contents
+{
+	token sstring_contents /[^']+/
+	token tSSTRING_END /'\''/
+}
+
+lex xstring_contents
+{
+	token xstring_contents /[^`]+/
+	token tXSTRING_END /'`'/
+}
+
+def ruby
+	[compstmt]
+
+def compstmt
+	[stmts opt_terms]
+
+def bodystmt
+	[compstmt opt_rescue opt_else opt_ensure]
+
+def opt_rescue
+#	['rescue' exc_list exc_var then compstmt opt_rescue] |
+	[]
+
+def then
+	[term]
+|	['then']
+|	[term 'then']
+
+def do
+	[term]
+|	['do']
+
+def if_tail
+	[opt_else]
+|	['elsif' expr_value then compstmt if_tail]
+
+def opt_else
+	['else' compstmt]
+|	[]
+
+def opt_ensure
+	['ensure' compstmt]
+|	[]
+
+def stmts
+	[stmts terms stmt]
+|	[stmt]
+|	[]
+
+def opt_terms
+	[terms]
+|	[]
+
+def terms
+	[term]
+|	[terms ';']
+
+def term
+	[';']
+|	['\n']
+
+def stmt
+	['alias' fitem fitem]
+|	['undef' undef_list]
+|	[stmt 'if' expr_value]
+|	[stmt 'unless' expr_value]
+|	[stmt 'while' expr_value]
+|	[stmt 'until' expr_value]
+|	[stmt 'rescue' stmt]
+|	['BEGIN' '{' compstmt '}']
+|	['END' '{' compstmt '}']
+|	[lhs '=' mrhs]
+|	[mlhs '=' arg_value]
+|	[mlhs '=' mrhs]
+|	[expr]
+
+def mlhs
+	[mlhs_basic]
+|	[tLPAREN mlhs ')']
+
+def mlhs_basic
+	[mlhs_head]
+
+def mlhs_head
+	[mlhs_item ',' mlhs_head]
+|	[mlhs_item]
+
+def mlhs_item
+	[variable]
+|	['*' mlhs_item]
+|	['*']
+|	[primary_value '[' opt_call_args ']']
+|	[primary_value '.' tIDENTIFIER]
+|	[primary_value '.' tCONSTANT]
+|	[primary_value '::' tIDENTIFIER]
+|	[primary_value '::' tCONSTANT]
+|	['::' tCONSTANT]
+|	[backref]
+|	[tLPAREN mlhs ')']
+
+def lhs
+	[variable]
+|	[primary_value '[' opt_call_args ']']
+|	[primary_value '.' tIDENTIFIER]
+|	[primary_value '.' tCONSTANT]
+|	[primary_value '::' tIDENTIFIER]
+|	[primary_value '::' tCONSTANT]
+|	['::' tCONSTANT]
+|	[backref]
+
+def mrhs
+	[args ',' arg_value]
+|	[args ',' '*' arg_value]
+|	['*' arg_value]
+
+def expr
+	[expr 'and' expr]
+|	[expr 'or' expr]
+|	['not' expr]
+|	[arg]
+
+def expr_value
+	[expr]
+
+def opt_brace_block
+	[brace_block]
+|	[]
+
+def block_param_def
+	[tBAR opt_bv_decl tBAR]
+|	[tBAR block_param opt_bv_decl tBAR]
+
+def block_param
+	[block_arg_list]
+|	[]
+
+def block_arg_list
+	[block_arg_list ',' block_arg_item]
+|	[block_arg_item]
+
+def block_arg_item
+	[f_norm_arg]
+|	[f_rest_arg]
+|	[f_block_arg]
+|	['(' f_args ')']
+
+def opt_bv_decl
+	[';' bv_decls]
+|	[]
+
+def bv_decls
+	[bvar]
+|	[bv_decls ',' bvar]
+
+def bvar
+	[tIDENTIFIER]
+
+def opt_block_param
+	[block_param_def]
+|	[]
+
+def operation
+	[tIDENTIFIER]
+|	[tCONSTANT]
+|	[tFID]
+
+def operation2
+	[tIDENTIFIER]
+|	[tCONSTANT]
+|	[tFID]
+|	[op]
+
+def operation3
+	[tIDENTIFIER]
+|	[tFID]
+|	[op]
+
+def op
+	['|'] | ['^'] | ['&'] | ['<=>'] | ['=='] | ['==='] | ['=~'] | ['!~'] |
+	['>'] | ['>='] | ['<'] | ['<='] | ['!='] | ['<<'] | ['>>'] | ['+'] |
+	['-'] | ['*'] | ['/'] | ['%'] | ['**'] | ['!'] | ['~'] | ['[]'] | ['[]='] |
+	[tXSTRING_BEG]
+
+def opt_call_args
+	[call_args]
+|	[]
+
+def call_args
+	[args opt_block_arg]
+|	[assocs opt_block_arg]
+|	[args ',' assocs opt_block_arg]
+|	[block_arg]
+
+def args
+	[arg_value]
+|	['*' arg_value]
+|	[args ',' arg_value]
+|	[args ',' '*' arg_value]
+
+def arg_value
+	[arg]
+
+def opt_block_arg	
+	[',' block_arg]
+|	[]
+
+def block_arg
+	[tAMPER arg_value]
+
+def arg 
+	['defined?' arg]
+|	[arg_assign]
+
+def arg_assign
+	[lhs '=' arg_assign]
+|	[lhs '=' arg_assign 'rescue' arg]
+|	[arg_sel]
+
+def arg_sel
+	[arg_dot '?' arg_sel ':' arg_sel]
+|	[arg_dot]
+
+def arg_dot
+	[arg_logical '..' arg_dot]
+|	[arg_logical '...' arg_dot]
+|	[arg_logical]
+
+def arg_logical
+	[arg_eq '&&' arg_logical]
+|	[arg_eq '||' arg_logical]
+|	[arg_eq]
+
+def arg_eq
+	[arg_cmp '<=>' arg_eq]
+|	[arg_cmp '==' arg_eq]
+|	[arg_cmp '===' arg_eq]
+|	[arg_cmp '!=' arg_eq]
+|	[arg_cmp '=~' arg_eq]
+|	[arg_cmp '!~' arg_eq]
+|	[arg_cmp]
+
+def arg_cmp
+	[arg_bitor '>=' arg_cmp]
+|	[arg_bitor '<=' arg_cmp]
+|	[arg_bitor '>' arg_cmp]
+|	[arg_bitor '<' arg_cmp]
+|	[arg_bitor]
+
+def arg_bitor
+	[arg_bitand '|' arg_bitor]
+|	[arg_bitand '^' arg_bitor]
+|	[arg_bitand]
+
+def arg_bitand
+	[arg_shift '&' arg_bitand]
+|	[arg_shift]
+
+def arg_shift
+	[arg_add '<<' arg_shift]
+|	[arg_add '>>' arg_shift]
+|	[arg_add]
+
+def arg_add
+	[arg_mult '+' arg_add]
+|	[arg_mult '-' arg_add]
+|	[arg_mult]
+
+def arg_mult
+	[arg_pow '*' arg_mult]
+|	[arg_pow '/' arg_mult]
+|	[arg_pow '%' arg_mult]
+|	[arg_pow]
+
+def arg_pow
+	[arg_unary '**' arg_pow]
+|	[arg_unary]
+
+def arg_unary
+	['!' primary]
+|	['~' primary]
+|	[tUPLUS primary]
+|	[tUMINUS primary]
+|	[primary]
+
+def primary_value 
+	[primary]
+
+def primary
+	[pliteral]
+|	[strings]
+|	[xstring]
+#|	[regexp]
+#|	[words]
+#|	[qwords]
+|	[var_ref]
+|	[backref]
+|	[tFID]
+|	['begin' bodystmt 'end']
+|	[tLPAREN compstmt ')']
+|	[primary_value '::' tCONSTANT]
+|	['::' tCONSTANT]
+|	[tLBRACK aref_args ']']
+|	['{' assoc_list '}']
+|	['defined?' '(' expr ')']
+|	[operation brace_block]
+|	[method_call]
+|	[method_call brace_block]
+|	['->' lambda]
+|	['if' expr_value then compstmt if_tail 'end']
+|	['unless' expr_value then compstmt opt_else 'end']
+|	['while' expr_value do compstmt 'end']
+|	['until' expr_value do compstmt 'end']
+#|	['case' expr_value opt_terms case_body 'end']
+#|	['case' opt_terms case_body 'end']
+|	['for' for_var 'in' expr_value do compstmt 'end']
+|	['class' cpath superclass bodystmt 'end']
+|	['class' '<<' expr term bodystmt 'end']
+|	['module' cpath bodystmt 'end']
+|	['def' fname f_arglist bodystmt 'end']
+|	['def' singleton dot_or_colon fname f_arglist bodystmt 'end']
+|	['break']
+|	['next']
+|	['redo']
+|	['retry']
+
+def for_var
+	[lhs]
+|	[mlhs]
+
+def lambda
+	[f_larglist lambda_body]
+
+def f_larglist
+	['(' f_args opt_bv_decl ')']
+|	[f_args opt_bv_decl]
+
+def lambda_body
+	['{' compstmt '}']
+|	['do' compstmt 'end']
+
+def assoc_list
+	[assocs trailer]
+|	[]
+
+def assocs
+	[assocs ',' assoc]
+|	[assoc]
+
+def assoc
+	[arg_value '=>' arg_value]
+|	[':' arg_value]
+
+def singleton
+	[var_ref]
+|	['(' expr ')']
+
+def dot_or_colon
+	['.']
+|	['::']
+
+def aref_args
+	[args trailer]
+|	[args ',' assocs trailer]
+|	[assocs trailer]
+|	[]
+
+def trailer		
+	[',']
+|	[]
+
+def brace_block
+	['{' opt_block_param compstmt '}']
+|	['do' opt_block_param compstmt 'end']
+
+def f_arglist
+	['(' f_args ')']
+|	[f_args term]
+
+def f_args
+	[f_arg_list]
+|	[]
+
+def f_arg_list
+	[f_arg_list ',' f_arg_item]
+|	[f_arg_item]
+
+def f_arg_item
+	[f_norm_arg]
+|	[f_opt]
+|	[f_rest_arg]
+|	[f_block_arg]
+|	['(' f_args ')']
+
+def f_opt
+	[tIDENTIFIER '=' arg_value]
+
+def f_rest_arg
+	['*' tIDENTIFIER]
+|	['*']
+
+def f_block_arg
+	[tAMPER tIDENTIFIER]
+
+def f_norm_arg
+	[tIDENTIFIER]
+
+def backref
+	[tNTH_REF] | [tBACK_REF]
+
+def superclass	
+	[term]
+|	['<' expr_value term]
+
+def cpath
+	['::' cname]
+|	[cname]
+|	[primary_value '::' cname]
+
+def fname
+	[tIDENTIFIER]
+|	[tCONSTANT]
+|	[tFID]
+|	[op]
+|	[reswords]
+
+def reswords
+	['__LINE__'] |	['__FILE__'] |	['__ENCODING__'] |	['BEGIN'] |	['END'] |
+	['alias'] |	['and'] |	['begin'] |	['break'] |	['case'] |	['class'] |
+	['def'] |	['defined?'] |	['do'] |	['else'] |	['elsif'] |	['end'] |
+	['ensure'] |	['false'] |	['for'] |	['in'] |	['module'] |
+	['next'] |	['nil'] |	['not'] |	['or'] |	['redo'] |	['rescue'] |
+	['retry'] |	['return'] |	['self'] |	['super'] |	['then'] |	['true'] |
+	['undef'] |	['when'] |	['yield'] |	['if'] |	['unless'] |	['while'] |
+	['until']
+
+def cname
+	[tIDENTIFIER]
+|	[tCONSTANT]
+
+def pliteral
+	[numeric]
+|	[symbol]
+#|	[dsym]
+
+def strings
+	[string]
+
+def string
+#	[tCHAR]
+	[string1]
+|	[string string1]
+
+def string1
+	[tSSTRING_BEG sstring_contents? tSSTRING_END]
+|	[tDSTRING_BEG dstring_contents? tDSTRING_END]
+
+def xstring
+	[tXSTRING_BEG xstring_contents? tXSTRING_END]
+
+def numeric
+	[tINTEGER]
+|	[tFLOAT]
+
+def symbol
+	[':' sym]
+
+def sym
+	[fname]
+|	[tIVAR]
+|	[tGVAR]
+|	[tCVAR]
+
+def fitem
+	[fsym]
+#|	[dsym]
+
+def undef_list
+	[fitem]
+|	[undef_list ',' fitem]
+
+def fsym
+	[fname]
+|	[symbol]
+
+#def dsym
+#	[':' xstring_contents tDSTRING_END]
+
+def var_ref
+	[variable]
+
+def variable
+	[tIDENTIFIER] | [tIVAR] | [tGVAR] | [tCONSTANT] | [tCVAR] | ['nil'] |
+	['self'] | ['true'] | ['false'] | ['__FILE__'] | ['__LINE__'] |
+	['__ENCODING__']
+
+
+# Required whitespace, but newline is not allowed.
+token ws_no_nl
+	/[ \t]+[^ \t\n]/
+	{
+		send( make_token( typeid ws_no_nl, pull(stdin, match_length-1) ) )
+	}
+
+def method_call
+	[operation paren_args]
+|	[operation ws_no_nl call_args]
+|	[primary_value '.' operation2 opt_paren_args]
+|	[primary_value '.' operation2 ws_no_nl call_args]
+|	[primary_value '::' operation2 opt_paren_args]
+|	[primary_value '::' operation2 ws_no_nl call_args]
+|	[primary_value '.' paren_args]
+|	[primary_value '::' paren_args]
+|	['super' paren_args]
+|	['super' ws_no_nl call_args]
+|	['super']
+|	['yield' paren_args]
+|	['yield' ws_no_nl call_args]
+|	['yield']
+|	['return' call_args]
+|	['return']
+|	[primary_value '[' opt_call_args ']']
+
+def opt_paren_args
+	[paren_args]
+|	[]
+
+def paren_args
+	['(' opt_call_args ')']
+
+#
+# Grammar finished
+#
+
+ruby R = parse ruby(stdin)
+
+print_xml( R )
+
+#for T: primary in R
+#	print_xml( T, '\n\n' )
diff --git a/test/rubyhere.in b/test/rubyhere.in
new file mode 100644
index 00000000..a23dfead
--- /dev/null
+++ b/test/rubyhere.in
@@ -0,0 +1,8 @@
+print( <<DATA1, more, <<DATA2, 99 )
+"&^#(@ almost
+!arbitrary text!
+DATA1
+hello
+world
+DATA2
+. error here
diff --git a/test/rubyhere.lm b/test/rubyhere.lm
new file mode 100644
index 00000000..33fff4b7
--- /dev/null
+++ b/test/rubyhere.lm
@@ -0,0 +1,89 @@
+rl ident_pattern /[a-zA-Z_][a-zA-Z_0-9]*/
+rl number_pattern /[0-9]+/
+
+lex start
+{
+	ignore /[ \t\n]+/
+	token id /ident_pattern/
+	token number /number_pattern/
+	literal '<<', '*', ',', '(', ')'
+}
+
+global str HereId
+
+token rest_of_line /[^\n]*'\n'/
+
+lex here_start
+{
+	ignore /[ \t\n]+/
+	token here_id
+		here_data HereData
+		/ident_pattern/
+		{
+			# Pull the matched identifier text off the input and remember it in HereId.
+			HereId = pull( stdin, match_length )
+
+			# Parse the remainder of the current line, through its newline.
+			rest_of_line ROL = parse_stop rest_of_line( stdin )
+
+			# Parse the heredoc data, which begins after that newline.
+			here_data HereData = parse_stop here_data( stdin )
+
+			# Put the rest-of-line text back on the input stream.
+			push( stdin, ROL )
+
+			# Send the here_id token. Attach the heredoc data as an attribute.
+			send( make_token( typeid here_id, HereId, HereData ) )
+		}
+}
+
+lex here_data
+{
+	token here_close_id 
+		/ ident_pattern '\n' /
+		{
+			if match_text == HereId + '\n' {
+				send( make_token( 
+					typeid here_close_id,
+					pull(stdin, match_length) ) )
+			}
+			else 
+				send( make_token( typeid here_line, pull(stdin, match_length) ) )
+		}
+
+	token here_line
+		/ [^\n]* '\n' /
+}
+
+def here_data
+	[here_line* here_close_id]
+
+def heredoc
+	['<<' here_id]
+
+def primary
+	[id]
+|	[number]
+|	[heredoc]
+
+def arglist
+	[primary arglist_more*]
+
+def arglist_more
+	[',' primary]
+
+def call
+	[id '(' arglist? ')']
+
+def statement
+	[primary]
+|	[call]
+
+token foobar /any*/
+
+def start 
+	[statement*]
+|	[foobar]
+
+start S = parse start( stdin )
+print_xml(S)
diff --git a/test/string.in b/test/string.in
new file mode 100644
index 00000000..8aef536f
--- /dev/null
+++ b/test/string.in
@@ -0,0 +1,2 @@
+a + "%{{"; 1 * 2;
+
diff --git a/test/string.lm b/test/string.lm
new file mode 100644
index 00000000..7da88215
--- /dev/null
+++ b/test/string.lm
@@ -0,0 +1,54 @@
+lex string
+{
+	token str_escape /'\\' any/
+	token str_chr /[^\\"]+/
+}
+
+def str_item 
+	[str_escape]
+|	[str_chr]
+
+def string 
+	['"' str_item* '"']
+
+lex start
+{
+	token ident /[a-zA-Z_]+/
+	token number /[0-9]+/
+
+	literal '+', '*', ';', '"', '\'', '(', ')'
+	literal '+=', '-=', '*='
+
+	ignore wp /[ \t\n]+/
+}
+
+def expr 
+	[expr '+' term]
+|	[term]
+
+def term 
+	[term '*' primary]
+|	[primary]
+
+def primary 
+	[number]
+|	[ident]
+|	[string]
+|	['(' expr ')']
+
+def expr_list 
+	[expr_list expr ';']
+|	[]
+
+def start 
+	[expr_list]
+	{
+		if match lhs 
+			~a + "%{{"; 1 * 2;
+		{
+			print( 'yes\n' )
+		}
+	}
+
+start S = parse start(stdin)
+print_xml( S )
diff --git a/test/superid.in b/test/superid.in
new file mode 100644
index 00000000..4002630f
--- /dev/null
+++ b/test/superid.in
@@ -0,0 +1 @@
+!a b b a;
diff --git a/test/superid.lm b/test/superid.lm
new file mode 100644
index 00000000..3a3eef59
--- /dev/null
+++ b/test/superid.lm
@@ -0,0 +1,59 @@
+
+lex start
+{
+	literal '!', 'a', ';\n'
+
+	token id /'a'|'b'/
+	{
+		#tok.id = trans_id_to
+	}
+	
+	token super_id //
+	token foo //
+
+	ignore ws / [ \n\t]+ /
+}
+
+global int trans_id_to
+
+def e1 
+	[]
+	{
+		print( 'old_id = ', trans_id_to, '\n' )
+		#trans_id_to = type_id foo
+		print( 'new_id = ', trans_id_to, '\n' )
+	}
+
+def item1 
+	str msg
+
+	[ e1 '!' 'a' super_id super_id 'a']
+	{
+		lhs.msg = 'this is item1\n'
+	}
+
+def e2 
+	[]
+	{
+		print( 'old_id = ', trans_id_to, '\n' )
+		#trans_id_to = type_id super_id
+		print( 'new_id = ', trans_id_to, '\n' )
+	}
+
+def item2 
+	str msg
+
+	[ e2 '!' 'a' super_id super_id 'a']
+	{
+		lhs.msg = 'this is item2\n'
+	}
+
+
+def start 
+	[item1 ';\n']
+|	[item2 ';\n']
+	{
+		match lhs [Item2:item2 ';\n']
+		print( Item2.msg )
+	}
+
diff --git a/test/tags.in b/test/tags.in
new file mode 100644
index 00000000..939f9b48
--- /dev/null
+++ b/test/tags.in
@@ -0,0 +1 @@
+a b b a;
diff --git a/test/tags.lm b/test/tags.lm
new file mode 100644
index 00000000..9e13ddd8
--- /dev/null
+++ b/test/tags.lm
@@ -0,0 +1,82 @@
+# Open and close tags by rewriting to generic close tags. This won't work if
+# you are interested in unclosed tags, because a token can start out as not a
+# close_id and then become a close_id during the course of parsing.
+
+#
+# Regular Definitions
+#
+rl rl_ws /[ \t\n\r\v]+/
+rl rl_id /[a-zA-Z_][a-zA-Z0-9_]*/
+
+#
+# Tokens
+#
+
+# Any single character can be a literal
+lex start
+{
+	literal '!\n', ';\n'
+
+	# Ignore whitespace.
+	ignore /rl_ws/
+
+	# Open and close id
+	token id /rl_id/
+}
+
+#
+# Global Data
+#
+
+def tag_stack 
+	[id tag_stack]
+|	[]
+
+global tag_stack TS = construct tag_stack ["sentinal"]
+
+#
+# Productions
+#
+
+def open_tag 
+	[id]
+	{
+		match lhs [Id:id]
+		match TS [Top:id Rest:tag_stack]
+		if Id.data == Top.data {
+			reject
+		} else {
+			TS = construct tag_stack [Id TS]
+		}
+	}
+
+def close_tag 
+	[id]
+	{
+		match lhs [Id:id]
+		match TS [Top:id Rest:tag_stack]
+
+		if Id.data == Top.data {
+			TS = construct tag_stack [Rest]
+		} else {
+			reject
+		}
+	}
+
+def tag 
+	[open_tag tag* close_tag]
+
+def start
+	[tag* ';\n']
+	{
+		print_xml( TS )
+		print_xml( lhs )
+		print( 'got structure\n' )
+	}
+
+|	[id* ';\n']
+	{
+		print_xml( TS )
+		print_xml( lhs )
+		print( 'failed\n' )
+	}
diff --git a/test/til.in b/test/til.in
new file mode 100644
index 00000000..19b7bb19
--- /dev/null
+++ b/test/til.in
@@ -0,0 +1,14 @@
+
+var a;
+a := 1;
+
+head:
+
+a := a + 1;
+c := d;
+
+if a = 10 then
+	goto head;
+end
+
+hi := there;
diff --git a/test/til.lm b/test/til.lm
new file mode 100644
index 00000000..346fc50f
--- /dev/null
+++ b/test/til.lm
@@ -0,0 +1,124 @@
+lex start
+{
+	literal 'var', 'if', 'then', 'else', 'while', 'do', 'for', 'read', 'write',
+			'end', 'to', 'goto'
+	literal ':=', '!=', ';', '+', '-', '*', '/', '=', '(', ')', ':'
+
+	ignore /'//' [^\n]* '\n'/
+	ignore /[\n\t ]+/
+	token id /[a-zA-Z_]+/
+	token integernumber /[0-9]+/
+	token stringlit /'"' [^"]* '"'/
+}
+
+def program
+	[statement*]
+
+def statement
+	[declaration]
+|	[assignment_statement]
+|	[if_statement]
+|	[while_statement]
+|	[do_statement]
+|	[for_statement]
+|	[read_statement]
+|	[write_statement]
+|	[labelled_statement]
+|	[goto_statement]
+
+def declaration
+	['var' id ';']
+
+def assignment_statement
+	[id ':=' expression ';']
+
+def if_statement
+	['if' expression 'then' statement* opt_else_statement 'end']
+
+def opt_else_statement
+	['else' statement*]
+|	[]
+
+def while_statement
+	['while' expression 'do' statement* 'end']
+
+def do_statement
+	['do' statement* 'while' expression ';']
+
+def for_statement
+	['for' id ':=' expression 'to' expression 'do' statement* 'end']
+
+def read_statement
+	['read' id ';']
+
+def write_statement
+	['write' expression ';']
+
+def expression
+	[term]
+|	[expression eqop term]
+
+def eqop ['='] | ['!=']
+
+def term
+	[factor]
+|	[term addop factor]
+
+def addop ['+'] | ['-']
+
+def factor
+	[primary]
+|	[factor mulop primary]
+
+def mulop ['*'] | ['/']
+
+def primary
+	[id]
+|	[lit]
+|	['(' expression ')']
+
+def lit
+	[integernumber]
+|	[stringlit]
+
+def labelled_statement
+	[id ':' statement] 
+
+def goto_statement
+	['goto' id ';']
+
+program P = parse program(stdin)
+
+for S:statement* in P
+{
+	if match S [L0: id ':' 
+			First: statement 
+			Rest: statement*]
+	{
+		for Check: statement* in Rest
+		{
+			if match Check 
+				['if' E: expression 'then' 
+					'goto' Targ: id ';'
+				'end'
+				T: statement*] &&
+				Targ == L0
+			{
+				# Emptying Check truncates Rest just before the matched 'if'.
+				Check = construct statement* []
+
+				# Replace the labeled statement through to the goto with a
+				# do ... while, then append the statements that followed (T).
+				S = construct statement*
+					['do'
+						First
+						Rest
+					'while' E ';'
+					T]
+				break
+			}
+		}
+	}
+}
+
+print(P, '\n')
diff --git a/test/travs1.in b/test/travs1.in
new file mode 100644
index 00000000..e6cf5020
--- /dev/null
+++ b/test/travs1.in
@@ -0,0 +1 @@
+1 | 2 3
diff --git a/test/travs1.lm b/test/travs1.lm
new file mode 100644
index 00000000..e5820d8f
--- /dev/null
+++ b/test/travs1.lm
@@ -0,0 +1,144 @@
+lex start
+{
+	ignore /[\t\n ]+/
+	literal '^', '|', '-', ',', ':', '!', '?', '.'
+	literal '(', ')', '{', '}', '*', '&', '+'
+
+	literal '--', ':>', ':>>', '<:', '->', '**'
+
+	token word /[a-zA-Z_][a-zA-Z0-9_]*/
+	token uint /[0-9]+/
+}
+
+
+def start [expression]
+
+def expression [term expression_op*]
+
+def expression_op
+	['|' term]
+|	['&' term]
+|	['-' term]
+|	['--' term]
+
+def term [factor_rep term_rest]
+
+# This list is written by hand (empty alternative first) to get a shortest match.
+def term_rest
+	[]
+|	[term_op term_rest]
+
+def term_op
+	[factor_rep]
+|	['.' factor_rep]
+|	[':>' factor_rep]
+|	[':>>' factor_rep]
+|	['<:' factor_rep]
+
+def factor_rep 
+	[factor_neg factor_rep_op*]
+
+def factor_rep_op
+	['*']
+|	['**']
+|	['?']
+|	['+']
+|	['{' factor_rep_num '}']
+|	['{' ',' factor_rep_num '}']
+|	['{' factor_rep_num ',' '}']
+|	['{' factor_rep_num ',' factor_rep_num '}']
+
+def factor_rep_num [uint]
+
+def factor_neg 
+	['!' factor_neg]
+|	['^' factor_neg]
+|	[factor]
+
+def factor 
+	[alphabet_num]
+|	[word]
+|	['(' expression ')']
+
+def alphabet_num 
+	[uint]
+
+start S = parse start(stdin)
+
+#
+# Top-Down, Left-Right
+#
+
+int do_topdown_leftright( ref any T )
+{
+	for C:any in child(T) {
+		yield C
+		do_topdown_leftright( C )
+	}
+}
+
+iter topdown_leftright( ref any T )
+{
+	do_topdown_leftright( T )
+}
+
+#
+# Bottom-Up, Left-Right
+#
+
+int do_bottomup_leftright( ref any T )
+{
+	for C:any in child(T) {
+		do_bottomup_leftright( C )
+		yield C
+	}
+}
+
+iter bottomup_leftright( ref any T )
+{
+	do_bottomup_leftright( T )
+}
+
+
+#
+# Top-Down, Right-Left
+#
+
+int do_topdown_rightleft( ref any T )
+{
+	for C:any in rev_child(T) {
+		yield C
+		do_topdown_rightleft( C )
+	}
+}
+
+iter topdown_rightleft( ref any T )
+{
+	do_topdown_rightleft( T )
+}
+
+#
+# Bottom-Up, Right-Left
+#
+
+int do_bottomup_rightleft( ref any T )
+{
+	for C:any in rev_child(T) {
+		do_bottomup_rightleft( C )
+		yield C
+	}
+}
+
+iter bottomup_rightleft( ref any T )
+{
+	do_bottomup_rightleft( T )
+}
+
+#
+# Testing
+#
+
+for C: expression in bottomup_leftright( S ) 
+{
+	print_xml( C )
+}
diff --git a/test/travs2.in b/test/travs2.in
new file mode 100644
index 00000000..81d197f3
--- /dev/null
+++ b/test/travs2.in
@@ -0,0 +1 @@
+1 2 | 3 4 
diff --git a/test/travs2.lm b/test/travs2.lm
new file mode 100644
index 00000000..06facf3b
--- /dev/null
+++ b/test/travs2.lm
@@ -0,0 +1,93 @@
+lex start
+{
+	ignore /[\t\n ]+/
+	literal '^', '|', '-', ',', ':', '!', '?', '.'
+	literal '(', ')', '{', '}', '*', '&', '+'
+
+	literal '--', ':>', ':>>', '<:', '->', '**'
+
+	token word /[a-zA-Z_][a-zA-Z0-9_]*/
+	token uint /[0-9]+/
+}
+
+
+def start 
+	[expression]
+
+def expression [term expression_op*]
+
+def expression_op
+	['|' term]
+|	['&' term]
+|	['-' term]
+|	['--' term]
+
+def term [factor_rep term_rest]
+
+# This list is written by hand (empty alternative first) to get a shortest match.
+def term_rest
+	[]
+|	[term_op term_rest]
+
+def term_op
+	[factor_rep]
+|	['.' factor_rep]
+|	[':>' factor_rep]
+|	[':>>' factor_rep]
+|	['<:' factor_rep]
+
+def factor_rep 
+	[factor_neg factor_rep_op*]
+
+def factor_rep_op
+	['*']
+|	['**']
+|	['?']
+|	['+']
+|	['{' factor_rep_num '}']
+|	['{' ',' factor_rep_num '}']
+|	['{' factor_rep_num ',' '}']
+|	['{' factor_rep_num ',' factor_rep_num '}']
+
+def factor_rep_num [uint]
+
+def factor_neg 
+	['!' factor_neg]
+|	['^' factor_neg]
+|	[factor]
+
+def factor 
+	[alphabet_num]
+|	[word]
+|	['(' expression ')']
+
+def alphabet_num 
+	[uint]
+
+start S = parse start(stdin)
+
+#
+# Fixed point iteration
+#
+
+bool this_iter_modified()
+	{ return true }
+
+iter fixed_point( ref any T )
+{
+	bool modified = true
+	while modified {
+		modified = false
+		for S:any in T {
+			yield S
+
+			if this_iter_modified() {
+				modified = true
+				break
+			}
+		}
+	}
+}
+
+print( S, '\n' )
+
diff --git a/test/xml/Makefile b/test/xml/Makefile
new file mode 100644
index 00000000..25a0b6d3
--- /dev/null
+++ b/test/xml/Makefile
@@ -0,0 +1,34 @@
+#
+#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#
+
+#   This file is part of Ragel.
+#
+#   Ragel is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Ragel is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Ragel; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+
+.PHONY: all clean  # neither names a real file, so a stray file called all or clean must not mask them
+all: $(BIN)
+
+$(BIN): $(COLM)  # every .bin is out of date when the colm binary changes
+$(BIN): %.bin: %.lm  # each X.bin depends on its X.lm, which the recipe passes to colm
+	$(COLM) $<
+
+clean:
+	rm -f *.cpp *.bin
diff --git a/test/xml/xml.in b/test/xml/xml.in
new file mode 100644
index 00000000..3c024f80
--- /dev/null
+++ b/test/xml/xml.in
@@ -0,0 +1,3962 @@
+<ragel version="5.24" filename="../colm/lmscan.rl" lang="C">
+<ragel_def name="rlscan">
+  <alphtype>char</alphtype>
+  <machine>
+    <action_list length="166">
+      <action id="0" name="inc_nl" line="217" col="16"><text> 
+		lastnl = p; 
+		column = 0;
+		line++;
+	</text></action>
+      <action id="1" name="initts" line="1" col="1"><init_tokstart></init_tokstart></action>
+      <action id="2" name="tokstart" line="1" col="1"><set_tokstart></set_tokstart></action>
+      <action id="3" name="tokend" line="1" col="1"><set_tokend>1</set_tokend></action>
+      <action id="4" name="last1" line="238" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\0' ); </text></sub_action></action>
+      <action id="5" name="last2" line="239" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\a' ); </text></sub_action></action>
+      <action id="6" name="last3" line="240" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\b' ); </text></sub_action></action>
+      <action id="7" name="last4" line="241" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\t' ); </text></sub_action></action>
+      <action id="8" name="last5" line="242" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\n' ); </text></sub_action></action>
+      <action id="9" name="last6" line="243" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\v' ); </text></sub_action></action>
+      <action id="10" name="last7" line="244" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\f' ); </text></sub_action></action>
+      <action id="11" name="last8" line="245" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, '\r' ); </text></sub_action></action>
+      <action id="12" name="last9" line="246" col="13"><set_tokend>1</set_tokend><sub_action><text> updateCol(); </text></sub_action></action>
+      <action id="13" name="last10" line="247" col="15"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, tokstart+1, tokend ); </text></sub_action></action>
+      <action id="14" name="last11" line="250" col="10"><set_tokend>1</set_tokend><sub_action><text> token( RE_Dash, 0, 0 ); </text></sub_action></action>
+      <action id="15" name="last12" line="253" col="10"><set_tokend>1</set_tokend><sub_action><text> token( RE_SqClose ); </text><ret></ret><text> </text></sub_action></action>
+      <action id="16" name="last13" line="255" col="10"><set_tokend>1</set_tokend><sub_action><text>
+			scan_error() &lt;&lt; "unterminated OR literal" &lt;&lt; endl;
+		</text></sub_action></action>
+      <action id="17" name="last14" line="260" col="12"><set_tokend>1</set_tokend><sub_action><text> token( RE_Char, tokstart, tokend ); </text></sub_action></action>
+      <action id="18" name="store15" line="265" col="13"><set_act>15</set_act></action>
+      <action id="19" name="store16" line="266" col="12"><set_act>16</set_act></action>
+      <action id="20" name="store17" line="267" col="12"><set_act>17</set_act></action>
+      <action id="21" name="store18" line="268" col="13"><set_act>18</set_act></action>
+      <action id="22" name="store19" line="269" col="11"><set_act>19</set_act></action>
+      <action id="23" name="store20" line="270" col="13"><set_act>20</set_act></action>
+      <action id="24" name="store21" line="273" col="12"><set_act>21</set_act></action>
+      <action id="25" name="last24" line="281" col="7"><set_tokend>1</set_tokend><sub_action><text> token( TK_Literal, tokstart, tokend ); </text></sub_action></action>
+      <action id="26" name="last26" line="284" col="11"><set_tokend>1</set_tokend><sub_action><text> token( RE_SqOpenNeg ); </text><call>166</call><text> </text></sub_action></action>
+      <action id="27" name="last27" line="286" col="10"><set_tokend>1</set_tokend><sub_action><text> token( '/'); </text><ret></ret><text> </text></sub_action></action>
+      <action id="28" name="last28" line="289" col="20"><set_tokend>1</set_tokend><sub_action><text> updateCol(); </text></sub_action></action>
+      <action id="29" name="last29" line="291" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_ColonEquals ); </text></sub_action></action>
+      <action id="30" name="last30" line="294" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_StartToState ); </text></sub_action></action>
+      <action id="31" name="last31" line="295" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_AllToState ); </text></sub_action></action>
+      <action id="32" name="last32" line="296" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_FinalToState ); </text></sub_action></action>
+      <action id="33" name="last33" line="297" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotStartToState ); </text></sub_action></action>
+      <action id="34" name="last34" line="298" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotFinalToState ); </text></sub_action></action>
+      <action id="35" name="last35" line="299" col="12"><set_tokend>1</set_tokend><sub_action><text> token( TK_MiddleToState ); </text></sub_action></action>
+      <action id="36" name="last36" line="302" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_StartFromState ); </text></sub_action></action>
+      <action id="37" name="last37" line="303" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_AllFromState ); </text></sub_action></action>
+      <action id="38" name="last38" line="304" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_FinalFromState ); </text></sub_action></action>
+      <action id="39" name="last39" line="305" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotStartFromState ); </text></sub_action></action>
+      <action id="40" name="last40" line="306" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotFinalFromState ); </text></sub_action></action>
+      <action id="41" name="last41" line="307" col="12"><set_tokend>1</set_tokend><sub_action><text> token( TK_MiddleFromState ); </text></sub_action></action>
+      <action id="42" name="last42" line="310" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_StartEOF ); </text></sub_action></action>
+      <action id="43" name="last43" line="311" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_AllEOF ); </text></sub_action></action>
+      <action id="44" name="last44" line="312" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_FinalEOF ); </text></sub_action></action>
+      <action id="45" name="last45" line="313" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotStartEOF ); </text></sub_action></action>
+      <action id="46" name="last46" line="314" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotFinalEOF ); </text></sub_action></action>
+      <action id="47" name="last47" line="315" col="12"><set_tokend>1</set_tokend><sub_action><text> token( TK_MiddleEOF ); </text></sub_action></action>
+      <action id="48" name="last48" line="318" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_StartGblError ); </text></sub_action></action>
+      <action id="49" name="last49" line="319" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_AllGblError ); </text></sub_action></action>
+      <action id="50" name="last50" line="320" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_FinalGblError ); </text></sub_action></action>
+      <action id="51" name="last51" line="321" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotStartGblError ); </text></sub_action></action>
+      <action id="52" name="last52" line="322" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotFinalGblError ); </text></sub_action></action>
+      <action id="53" name="last53" line="323" col="12"><set_tokend>1</set_tokend><sub_action><text> token( TK_MiddleGblError ); </text></sub_action></action>
+      <action id="54" name="last54" line="326" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_StartLocalError ); </text></sub_action></action>
+      <action id="55" name="last55" line="327" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_AllLocalError ); </text></sub_action></action>
+      <action id="56" name="last56" line="328" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_FinalLocalError ); </text></sub_action></action>
+      <action id="57" name="last57" line="329" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotStartLocalError ); </text></sub_action></action>
+      <action id="58" name="last58" line="330" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotFinalLocalError ); </text></sub_action></action>
+      <action id="59" name="last59" line="331" col="12"><set_tokend>1</set_tokend><sub_action><text> token( TK_MiddleLocalError ); </text></sub_action></action>
+      <action id="60" name="last61" line="337" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_StartCond ); </text></sub_action></action>
+      <action id="61" name="last62" line="338" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_AllCond ); </text></sub_action></action>
+      <action id="62" name="last63" line="339" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_LeavingCond ); </text></sub_action></action>
+      <action id="63" name="last64" line="341" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_DotDot ); </text></sub_action></action>
+      <action id="64" name="last65" line="342" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_StarStar ); </text></sub_action></action>
+      <action id="65" name="last66" line="343" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_DashDash ); </text></sub_action></action>
+      <action id="66" name="last67" line="344" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_Arrow ); </text></sub_action></action>
+      <action id="67" name="last69" line="347" col="12"><set_tokend>1</set_tokend><sub_action><text> token( TK_ColonGtGt ); </text></sub_action></action>
+      <action id="68" name="last70" line="348" col="12"><set_tokend>1</set_tokend><sub_action><text> token( TK_LtColon ); </text></sub_action></action>
+      <action id="69" name="last72" line="354" col="9"><set_tokend>1</set_tokend><sub_action><text> updateCol(); </text></sub_action></action>
+      <action id="70" name="last73" line="357" col="6"><set_tokend>1</set_tokend></action>
+      <action id="71" name="last74" line="359" col="10"><set_tokend>1</set_tokend><sub_action><text> token( *tokstart ); </text></sub_action></action>
+      <action id="72" name="next21" line="273" col="12"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_Word, tokstart, tokend ); </text></sub_action></action>
+      <action id="73" name="next22" line="276" col="13"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_UInt, tokstart, tokend ); </text></sub_action></action>
+      <action id="74" name="next23" line="277" col="17"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_Hex, tokstart, tokend ); </text></sub_action></action>
+      <action id="75" name="next24" line="281" col="7"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_Literal, tokstart, tokend ); </text></sub_action></action>
+      <action id="76" name="next25" line="283" col="10"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( RE_SqOpen ); </text><call>166</call><text> </text></sub_action></action>
+      <action id="77" name="next60" line="334" col="11"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_Middle ); </text></sub_action></action>
+      <action id="78" name="next68" line="346" col="12"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_ColonGt ); </text></sub_action></action>
+      <action id="79" name="next71" line="351" col="15"><set_tokend>0</set_tokend><hold></hold><sub_action><text> updateCol(); </text></sub_action></action>
+      <action id="80" name="next74" line="359" col="10"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( *tokstart ); </text></sub_action></action>
+      <action id="81" name="lag22" line="276" col="13"><exec><get_tokend></get_tokend></exec><sub_action><text> token( TK_UInt, tokstart, tokend ); </text></sub_action></action>
+      <action id="82" name="switch" line="1" col="1"><lm_switch>
+        <sub_action id="15"><exec><get_tokend></get_tokend></exec><text> token( KW_When ); </text></sub_action>
+        <sub_action id="16"><exec><get_tokend></get_tokend></exec><text> token( KW_Eof ); </text></sub_action>
+        <sub_action id="17"><exec><get_tokend></get_tokend></exec><text> token( KW_Err ); </text></sub_action>
+        <sub_action id="18"><exec><get_tokend></get_tokend></exec><text> token( KW_Lerr ); </text></sub_action>
+        <sub_action id="19"><exec><get_tokend></get_tokend></exec><text> token( KW_To ); </text></sub_action>
+        <sub_action id="20"><exec><get_tokend></get_tokend></exec><text> token( KW_From ); </text></sub_action>
+        <sub_action id="21"><exec><get_tokend></get_tokend></exec><text> token( TK_Word, tokstart, tokend ); </text></sub_action>
+    </lm_switch></action>
+      <action id="83" name="last75" line="363" col="12"><set_tokend>1</set_tokend><sub_action><text> litBuf.append( '\a' ); </text></sub_action></action>
+      <action id="84" name="last76" line="364" col="12"><set_tokend>1</set_tokend><sub_action><text> litBuf.append( '\b' ); </text></sub_action></action>
+      <action id="85" name="last77" line="365" col="12"><set_tokend>1</set_tokend><sub_action><text> litBuf.append( '\t' ); </text></sub_action></action>
+      <action id="86" name="last78" line="366" col="12"><set_tokend>1</set_tokend><sub_action><text> litBuf.append( '\n' ); </text></sub_action></action>
+      <action id="87" name="last79" line="367" col="12"><set_tokend>1</set_tokend><sub_action><text> litBuf.append( '\v' ); </text></sub_action></action>
+      <action id="88" name="last80" line="368" col="12"><set_tokend>1</set_tokend><sub_action><text> litBuf.append( '\f' ); </text></sub_action></action>
+      <action id="89" name="last81" line="369" col="12"><set_tokend>1</set_tokend><sub_action><text> litBuf.append( '\r' ); </text></sub_action></action>
+      <action id="90" name="last82" line="371" col="12"><set_tokend>1</set_tokend><sub_action><text>
+			litBuf.append( tokstart[1] );
+		</text></sub_action></action>
+      <action id="91" name="last83" line="374" col="10"><set_tokend>1</set_tokend><sub_action><text>
+			if ( litBuf.length &gt; 0 ) {
+				token( TK_LitPat, litBuf.data, litBuf.data+litBuf.length );
+				litBuf.clear();
+			}
+			token( '"' );
+			</text><ret></ret><text>
+		</text></sub_action></action>
+      <action id="92" name="last84" line="382" col="9"><set_tokend>1</set_tokend><sub_action><text>
+			if ( litBuf.length &gt; 0 ) {
+				litBuf.append( '\n' );
+				token( TK_LitPat, litBuf.data, litBuf.data+litBuf.length );
+				litBuf.clear();
+			}
+			token( '"' );
+			</text><ret></ret><text>
+		</text></sub_action></action>
+      <action id="93" name="last85" line="391" col="10"><set_tokend>1</set_tokend><sub_action><text> 
+			if ( litBuf.length &gt; 0 ) {
+				token( TK_LitPat, litBuf.data, litBuf.data+litBuf.length );
+				litBuf.clear();
+			}
+			token( '[' );
+			</text><call>10</call><text>
+		</text></sub_action></action>
+      <action id="94" name="last86" line="399" col="10"><set_tokend>1</set_tokend><sub_action><text> 
+			litBuf.append( *tokstart );
+		</text></sub_action></action>
+      <action id="95" name="store87" line="406" col="12"><set_act>87</set_act></action>
+      <action id="96" name="store88" line="407" col="15"><set_act>88</set_act></action>
+      <action id="97" name="store89" line="408" col="17"><set_act>89</set_act></action>
+      <action id="98" name="store90" line="409" col="15"><set_act>90</set_act></action>
+      <action id="99" name="store91" line="410" col="13"><set_act>91</set_act></action>
+      <action id="100" name="store92" line="411" col="14"><set_act>92</set_act></action>
+      <action id="101" name="store93" line="412" col="18"><set_act>93</set_act></action>
+      <action id="102" name="store94" line="413" col="14"><set_act>94</set_act></action>
+      <action id="103" name="store95" line="414" col="16"><set_act>95</set_act></action>
+      <action id="104" name="store96" line="415" col="16"><set_act>96</set_act></action>
+      <action id="105" name="store97" line="416" col="13"><set_act>97</set_act></action>
+      <action id="106" name="store98" line="417" col="15"><set_act>98</set_act></action>
+      <action id="107" name="store99" line="418" col="16"><set_act>99</set_act></action>
+      <action id="108" name="store101" line="420" col="14"><set_act>101</set_act></action>
+      <action id="109" name="store102" line="421" col="12"><set_act>102</set_act></action>
+      <action id="110" name="store103" line="422" col="12"><set_act>103</set_act></action>
+      <action id="111" name="store104" line="424" col="11"><set_act>104</set_act></action>
+      <action id="112" name="store105" line="425" col="12"><set_act>105</set_act></action>
+      <action id="113" name="store106" line="426" col="15"><set_act>106</set_act></action>
+      <action id="114" name="store107" line="427" col="12"><set_act>107</set_act></action>
+      <action id="115" name="store108" line="428" col="16"><set_act>108</set_act></action>
+      <action id="116" name="store109" line="429" col="18"><set_act>109</set_act></action>
+      <action id="117" name="store110" line="430" col="12"><set_act>110</set_act></action>
+      <action id="118" name="store112" line="432" col="16"><set_act>112</set_act></action>
+      <action id="119" name="store113" line="433" col="17"><set_act>113</set_act></action>
+      <action id="120" name="store114" line="434" col="11"><set_act>114</set_act></action>
+      <action id="121" name="store115" line="435" col="13"><set_act>115</set_act></action>
+      <action id="122" name="store116" line="436" col="15"><set_act>116</set_act></action>
+      <action id="123" name="store117" line="437" col="14"><set_act>117</set_act></action>
+      <action id="124" name="store118" line="438" col="13"><set_act>118</set_act></action>
+      <action id="125" name="store119" line="439" col="18"><set_act>119</set_act></action>
+      <action id="126" name="store120" line="440" col="13"><set_act>120</set_act></action>
+      <action id="127" name="store121" line="441" col="14"><set_act>121</set_act></action>
+      <action id="128" name="store122" line="442" col="12"><set_act>122</set_act></action>
+      <action id="129" name="store123" line="443" col="13"><set_act>123</set_act></action>
+      <action id="130" name="store124" line="444" col="13"><set_act>124</set_act></action>
+      <action id="131" name="store125" line="445" col="13"><set_act>125</set_act></action>
+      <action id="132" name="store126" line="446" col="18"><set_act>126</set_act></action>
+      <action id="133" name="store127" line="447" col="13"><set_act>127</set_act></action>
+      <action id="134" name="store128" line="448" col="11"><set_act>128</set_act></action>
+      <action id="135" name="store129" line="449" col="18"><set_act>129</set_act></action>
+      <action id="136" name="store130" line="450" col="16"><set_act>130</set_act></action>
+      <action id="137" name="store131" line="453" col="12"><set_act>131</set_act></action>
+      <action id="138" name="last133" line="457" col="10"><set_tokend>1</set_tokend><sub_action><text> 
+			token( '/' ); 
+			</text><call>168</call><text>
+		</text></sub_action></action>
+      <action id="139" name="last134" line="462" col="20"><set_tokend>1</set_tokend><sub_action><text> 
+			token( '"' );
+			token( TK_LitPat, tokstart+1, tokend );
+			token( '"' );
+		</text></sub_action></action>
+      <action id="140" name="last135" line="468" col="16"><set_tokend>1</set_tokend><sub_action><text>
+			token( TK_Literal, tokstart, tokend );
+		</text></sub_action></action>
+      <action id="141" name="last136" line="472" col="10"><set_tokend>1</set_tokend><sub_action><text> 
+			token( '"' );
+			litBuf.clear(); 
+			</text><call>203</call><text>
+		</text></sub_action></action>
+      <action id="142" name="last137" line="477" col="10"><set_tokend>1</set_tokend><sub_action><text> 
+			token( '[' ); 
+			</text><call>10</call><text>
+		</text></sub_action></action>
+      <action id="143" name="last138" line="482" col="10"><set_tokend>1</set_tokend><sub_action><text>
+			token( ']' );
+			if ( top &gt; 0 )
+				</text><ret></ret><text>
+		</text></sub_action></action>
+      <action id="144" name="last139" line="489" col="20"><set_tokend>1</set_tokend><sub_action><text> updateCol(); </text></sub_action></action>
+      <action id="145" name="last140" line="491" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_ColonEquals ); </text></sub_action></action>
+      <action id="146" name="last141" line="492" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_DoubleArrow ); </text></sub_action></action>
+      <action id="147" name="last142" line="493" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_DoubleEquals ); </text></sub_action></action>
+      <action id="148" name="last143" line="494" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_NotEquals ); </text></sub_action></action>
+      <action id="149" name="last144" line="495" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_DoubleColon ); </text></sub_action></action>
+      <action id="150" name="last145" line="496" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_LessEquals ); </text></sub_action></action>
+      <action id="151" name="last146" line="497" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_GreaterEquals ); </text></sub_action></action>
+      <action id="152" name="last147" line="498" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_LeftArrow ); </text></sub_action></action>
+      <action id="153" name="last148" line="499" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_AmpAmp ); </text></sub_action></action>
+      <action id="154" name="last149" line="500" col="11"><set_tokend>1</set_tokend><sub_action><text> token( TK_BarBar ); </text></sub_action></action>
+      <action id="155" name="last150" line="502" col="43"><set_tokend>1</set_tokend><sub_action><text> token( *tokstart ); </text></sub_action></action>
+      <action id="156" name="last152" line="509" col="9"><set_tokend>1</set_tokend><sub_action><text> updateCol(); </text></sub_action></action>
+      <action id="157" name="last153" line="512" col="6"><set_tokend>1</set_tokend></action>
+      <action id="158" name="last154" line="514" col="10"><set_tokend>1</set_tokend><sub_action><text> token( *tokstart ); </text></sub_action></action>
+      <action id="159" name="next100" line="419" col="12"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( KW_Pri ); </text></sub_action></action>
+      <action id="160" name="next111" line="431" col="14"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( KW_Print ); </text></sub_action></action>
+      <action id="161" name="next131" line="453" col="12"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_Word, tokstart, tokend ); </text></sub_action></action>
+      <action id="162" name="next132" line="455" col="13"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( TK_Number, tokstart, tokend ); </text></sub_action></action>
+      <action id="163" name="next151" line="506" col="15"><set_tokend>0</set_tokend><hold></hold><sub_action><text> updateCol(); </text></sub_action></action>
+      <action id="164" name="next154" line="514" col="10"><set_tokend>0</set_tokend><hold></hold><sub_action><text> token( *tokstart ); </text></sub_action></action>
+      <action id="165" name="switch" line="1" col="1"><lm_switch>
+        <sub_action id="87"><exec><get_tokend></get_tokend></exec><text> token( KW_Lex ); </text></sub_action>
+        <sub_action id="88"><exec><get_tokend></get_tokend></exec><text> token( KW_Action ); </text></sub_action>
+        <sub_action id="89"><exec><get_tokend></get_tokend></exec><text> token( KW_AlphType ); </text></sub_action>
+        <sub_action id="90"><exec><get_tokend></get_tokend></exec><text> token( KW_Commit ); </text></sub_action>
+        <sub_action id="91"><exec><get_tokend></get_tokend></exec><text> token( KW_Undo ); </text></sub_action>
+        <sub_action id="92"><exec><get_tokend></get_tokend></exec><text> token( KW_Final ); </text></sub_action>
+        <sub_action id="93"><exec><get_tokend></get_tokend></exec><text> token( KW_Translate ); </text></sub_action>
+        <sub_action id="94"><exec><get_tokend></get_tokend></exec><text> token( KW_Token ); </text></sub_action>
+        <sub_action id="95"><exec><get_tokend></get_tokend></exec><text> token( KW_Literal ); </text></sub_action>
+        <sub_action id="96"><exec><get_tokend></get_tokend></exec><text> token( KW_NonTerm ); </text></sub_action>
+        <sub_action id="97"><exec><get_tokend></get_tokend></exec><text> token( KW_Uses ); </text></sub_action>
+        <sub_action id="98"><exec><get_tokend></get_tokend></exec><text> token( KW_Parser ); </text></sub_action>
+        <sub_action id="99"><exec><get_tokend></get_tokend></exec><text> token( KW_Include ); </text></sub_action>
+        <sub_action id="101"><exec><get_tokend></get_tokend></exec><text> token( KW_Write ); </text></sub_action>
+        <sub_action id="102"><exec><get_tokend></get_tokend></exec><text> token( KW_Nfa ); </text></sub_action>
+        <sub_action id="103"><exec><get_tokend></get_tokend></exec><text> token( KW_Pda ); </text></sub_action>
+        <sub_action id="104"><exec><get_tokend></get_tokend></exec><text> token( KW_Rl ); </text></sub_action>
+        <sub_action id="105"><exec><get_tokend></get_tokend></exec><text> token( KW_Cfl ); </text></sub_action>
+        <sub_action id="106"><exec><get_tokend></get_tokend></exec><text> token( KW_Ignore ); </text></sub_action>
+        <sub_action id="107"><exec><get_tokend></get_tokend></exec><text> token( KW_End ); </text></sub_action>
+        <sub_action id="108"><exec><get_tokend></get_tokend></exec><text> token( KW_Pattern ); </text></sub_action>
+        <sub_action id="109"><exec><get_tokend></get_tokend></exec><text> token( KW_Construct ); </text></sub_action>
+        <sub_action id="110"><exec><get_tokend></get_tokend></exec><text> token( KW_Red ); </text></sub_action>
+        <sub_action id="112"><exec><get_tokend></get_tokend></exec><text> token( KW_TypeId ); </text></sub_action>
+        <sub_action id="113"><exec><get_tokend></get_tokend></exec><text> token( KW_TypeDef ); </text></sub_action>
+        <sub_action id="114"><exec><get_tokend></get_tokend></exec><text> token( KW_If ); </text></sub_action>
+        <sub_action id="115"><exec><get_tokend></get_tokend></exec><text> token( KW_Init ); </text></sub_action>
+        <sub_action id="116"><exec><get_tokend></get_tokend></exec><text> token( KW_Reject ); </text></sub_action>
+        <sub_action id="117"><exec><get_tokend></get_tokend></exec><text> token( KW_While ); </text></sub_action>
+        <sub_action id="118"><exec><get_tokend></get_tokend></exec><text> token( KW_Else ); </text></sub_action>
+        <sub_action id="119"><exec><get_tokend></get_tokend></exec><text> token( KW_SubParser ); </text></sub_action>
+        <sub_action id="120"><exec><get_tokend></get_tokend></exec><text> token( KW_Next ); </text></sub_action>
+        <sub_action id="121"><exec><get_tokend></get_tokend></exec><text> token( KW_Match ); </text></sub_action>
+        <sub_action id="122"><exec><get_tokend></get_tokend></exec><text> token( KW_For ); </text></sub_action>
+        <sub_action id="123"><exec><get_tokend></get_tokend></exec><text> token( KW_Iter ); </text></sub_action>
+        <sub_action id="124"><exec><get_tokend></get_tokend></exec><text> token( KW_Find ); </text></sub_action>
+        <sub_action id="125"><exec><get_tokend></get_tokend></exec><text> token( KW_Root ); </text></sub_action>
+        <sub_action id="126"><exec><get_tokend></get_tokend></exec><text> token( KW_PrintXML ); </text></sub_action>
+        <sub_action id="127"><exec><get_tokend></get_tokend></exec><text> token( KW_Then ); </text></sub_action>
+        <sub_action id="128"><exec><get_tokend></get_tokend></exec><text> token( KW_Do ); </text></sub_action>
+        <sub_action id="129"><exec><get_tokend></get_tokend></exec><text> token( KW_Namespace ); </text></sub_action>
+        <sub_action id="130"><exec><get_tokend></get_tokend></exec><text> token( KW_Scanner ); </text></sub_action>
+        <sub_action id="131"><exec><get_tokend></get_tokend></exec><text> token( TK_Word, tokstart, tokend ); </text></sub_action>
+    </lm_switch></action>
+    </action_list>
+    <action_table_list length="166">
+      <action_table id="0" length="2">0 144</action_table>
+      <action_table id="1" length="1">0</action_table>
+      <action_table id="2" length="1">140</action_table>
+      <action_table id="3" length="2">0 139</action_table>
+      <action_table id="4" length="2">0 28</action_table>
+      <action_table id="5" length="1">81</action_table>
+      <action_table id="6" length="1">1</action_table>
+      <action_table id="7" length="1">2</action_table>
+      <action_table id="8" length="1">158</action_table>
+      <action_table id="9" length="1">157</action_table>
+      <action_table id="10" length="2">0 156</action_table>
+      <action_table id="11" length="1">141</action_table>
+      <action_table id="12" length="1">3</action_table>
+      <action_table id="13" length="1">155</action_table>
+      <action_table id="14" length="1">138</action_table>
+      <action_table id="15" length="2">3 137</action_table>
+      <action_table id="16" length="1">142</action_table>
+      <action_table id="17" length="1">143</action_table>
+      <action_table id="18" length="1">163</action_table>
+      <action_table id="19" length="1">164</action_table>
+      <action_table id="20" length="1">148</action_table>
+      <action_table id="21" length="1">153</action_table>
+      <action_table id="22" length="1">162</action_table>
+      <action_table id="23" length="1">149</action_table>
+      <action_table id="24" length="1">145</action_table>
+      <action_table id="25" length="1">152</action_table>
+      <action_table id="26" length="1">150</action_table>
+      <action_table id="27" length="1">147</action_table>
+      <action_table id="28" length="1">146</action_table>
+      <action_table id="29" length="1">151</action_table>
+      <action_table id="30" length="1">165</action_table>
+      <action_table id="31" length="1">161</action_table>
+      <action_table id="32" length="2">3 96</action_table>
+      <action_table id="33" length="2">3 97</action_table>
+      <action_table id="34" length="2">3 112</action_table>
+      <action_table id="35" length="2">3 98</action_table>
+      <action_table id="36" length="2">3 116</action_table>
+      <action_table id="37" length="2">3 134</action_table>
+      <action_table id="38" length="2">3 124</action_table>
+      <action_table id="39" length="2">3 114</action_table>
+      <action_table id="40" length="2">3 130</action_table>
+      <action_table id="41" length="2">3 100</action_table>
+      <action_table id="42" length="2">3 128</action_table>
+      <action_table id="43" length="2">3 120</action_table>
+      <action_table id="44" length="2">3 113</action_table>
+      <action_table id="45" length="2">3 107</action_table>
+      <action_table id="46" length="2">3 121</action_table>
+      <action_table id="47" length="2">3 129</action_table>
+      <action_table id="48" length="2">3 95</action_table>
+      <action_table id="49" length="2">3 103</action_table>
+      <action_table id="50" length="2">3 127</action_table>
+      <action_table id="51" length="2">3 135</action_table>
+      <action_table id="52" length="2">3 126</action_table>
+      <action_table id="53" length="2">3 109</action_table>
+      <action_table id="54" length="2">3 104</action_table>
+      <action_table id="55" length="2">3 106</action_table>
+      <action_table id="56" length="2">3 115</action_table>
+      <action_table id="57" length="2">3 110</action_table>
+      <action_table id="58" length="1">159</action_table>
+      <action_table id="59" length="1">160</action_table>
+      <action_table id="60" length="2">3 132</action_table>
+      <action_table id="61" length="2">3 111</action_table>
+      <action_table id="62" length="2">3 117</action_table>
+      <action_table id="63" length="2">3 122</action_table>
+      <action_table id="64" length="2">3 131</action_table>
+      <action_table id="65" length="2">3 136</action_table>
+      <action_table id="66" length="2">3 125</action_table>
+      <action_table id="67" length="2">3 133</action_table>
+      <action_table id="68" length="2">3 102</action_table>
+      <action_table id="69" length="2">3 101</action_table>
+      <action_table id="70" length="2">3 119</action_table>
+      <action_table id="71" length="2">3 118</action_table>
+      <action_table id="72" length="2">3 99</action_table>
+      <action_table id="73" length="2">3 105</action_table>
+      <action_table id="74" length="2">3 123</action_table>
+      <action_table id="75" length="2">3 108</action_table>
+      <action_table id="76" length="1">154</action_table>
+      <action_table id="77" length="1">17</action_table>
+      <action_table id="78" length="1">16</action_table>
+      <action_table id="79" length="1">14</action_table>
+      <action_table id="80" length="1">15</action_table>
+      <action_table id="81" length="1">13</action_table>
+      <action_table id="82" length="1">12</action_table>
+      <action_table id="83" length="1">4</action_table>
+      <action_table id="84" length="1">5</action_table>
+      <action_table id="85" length="1">6</action_table>
+      <action_table id="86" length="1">10</action_table>
+      <action_table id="87" length="1">8</action_table>
+      <action_table id="88" length="1">11</action_table>
+      <action_table id="89" length="1">7</action_table>
+      <action_table id="90" length="1">9</action_table>
+      <action_table id="91" length="1">71</action_table>
+      <action_table id="92" length="1">70</action_table>
+      <action_table id="93" length="2">0 69</action_table>
+      <action_table id="94" length="1">27</action_table>
+      <action_table id="95" length="2">3 24</action_table>
+      <action_table id="96" length="1">79</action_table>
+      <action_table id="97" length="1">75</action_table>
+      <action_table id="98" length="1">25</action_table>
+      <action_table id="99" length="1">80</action_table>
+      <action_table id="100" length="1">49</action_table>
+      <action_table id="101" length="1">37</action_table>
+      <action_table id="102" length="1">43</action_table>
+      <action_table id="103" length="1">61</action_table>
+      <action_table id="104" length="1">55</action_table>
+      <action_table id="105" length="1">31</action_table>
+      <action_table id="106" length="1">50</action_table>
+      <action_table id="107" length="1">38</action_table>
+      <action_table id="108" length="1">44</action_table>
+      <action_table id="109" length="1">62</action_table>
+      <action_table id="110" length="1">56</action_table>
+      <action_table id="111" length="1">32</action_table>
+      <action_table id="112" length="1">64</action_table>
+      <action_table id="113" length="1">65</action_table>
+      <action_table id="114" length="1">66</action_table>
+      <action_table id="115" length="1">63</action_table>
+      <action_table id="116" length="1">73</action_table>
+      <action_table id="117" length="1">74</action_table>
+      <action_table id="118" length="1">29</action_table>
+      <action_table id="119" length="1">78</action_table>
+      <action_table id="120" length="1">67</action_table>
+      <action_table id="121" length="1">51</action_table>
+      <action_table id="122" length="1">39</action_table>
+      <action_table id="123" length="1">45</action_table>
+      <action_table id="124" length="1">68</action_table>
+      <action_table id="125" length="1">57</action_table>
+      <action_table id="126" length="1">33</action_table>
+      <action_table id="127" length="1">77</action_table>
+      <action_table id="128" length="1">53</action_table>
+      <action_table id="129" length="1">41</action_table>
+      <action_table id="130" length="1">47</action_table>
+      <action_table id="131" length="1">59</action_table>
+      <action_table id="132" length="1">35</action_table>
+      <action_table id="133" length="1">48</action_table>
+      <action_table id="134" length="1">36</action_table>
+      <action_table id="135" length="1">42</action_table>
+      <action_table id="136" length="1">60</action_table>
+      <action_table id="137" length="1">54</action_table>
+      <action_table id="138" length="1">30</action_table>
+      <action_table id="139" length="1">52</action_table>
+      <action_table id="140" length="1">40</action_table>
+      <action_table id="141" length="1">46</action_table>
+      <action_table id="142" length="1">58</action_table>
+      <action_table id="143" length="1">34</action_table>
+      <action_table id="144" length="1">82</action_table>
+      <action_table id="145" length="1">76</action_table>
+      <action_table id="146" length="1">26</action_table>
+      <action_table id="147" length="1">72</action_table>
+      <action_table id="148" length="2">3 19</action_table>
+      <action_table id="149" length="2">3 20</action_table>
+      <action_table id="150" length="2">3 23</action_table>
+      <action_table id="151" length="2">3 21</action_table>
+      <action_table id="152" length="2">3 22</action_table>
+      <action_table id="153" length="2">3 18</action_table>
+      <action_table id="154" length="1">94</action_table>
+      <action_table id="155" length="2">0 92</action_table>
+      <action_table id="156" length="1">91</action_table>
+      <action_table id="157" length="1">93</action_table>
+      <action_table id="158" length="1">90</action_table>
+      <action_table id="159" length="1">83</action_table>
+      <action_table id="160" length="1">84</action_table>
+      <action_table id="161" length="1">88</action_table>
+      <action_table id="162" length="1">86</action_table>
+      <action_table id="163" length="1">89</action_table>
+      <action_table id="164" length="1">85</action_table>
+      <action_table id="165" length="1">87</action_table>
+    </action_table_list>
+    <start_state>10</start_state>
+    <entry_points>
+      <entry name="or_literal">166</entry>
+      <entry name="regular_type">168</entry>
+      <entry name="literal_pattern">203</entry>
+      <entry name="main">10</entry>
+    </entry_points>
+    <state_list length="205">
+      <state id="0">
+      <trans_list length="3">
+        <t>-128 9 0 x</t>
+        <t>10 10 10 0</t>
+        <t>11 127 0 x</t>
+      </trans_list>
+      </state>
+
+      <state id="1">
+      <trans_list length="7">
+        <t>-128 9 1 x</t>
+        <t>10 10 1 1</t>
+        <t>11 38 1 x</t>
+        <t>39 39 10 2</t>
+        <t>40 91 1 x</t>
+        <t>92 92 2 x</t>
+        <t>93 127 1 x</t>
+      </trans_list>
+      </state>
+
+      <state id="2">
+      <trans_list length="3">
+        <t>-128 9 1 x</t>
+        <t>10 10 1 1</t>
+        <t>11 127 1 x</t>
+      </trans_list>
+      </state>
+
+      <state id="3">
+      <trans_list length="3">
+        <t>-128 9 3 x</t>
+        <t>10 10 10 3</t>
+        <t>11 127 3 x</t>
+      </trans_list>
+      </state>
+
+      <state id="4">
+      <trans_list length="7">
+        <t>-128 9 4 x</t>
+        <t>10 10 4 1</t>
+        <t>11 33 4 x</t>
+        <t>34 34 171 x</t>
+        <t>35 91 4 x</t>
+        <t>92 92 5 x</t>
+        <t>93 127 4 x</t>
+      </trans_list>
+      </state>
+
+      <state id="5">
+      <trans_list length="3">
+        <t>-128 9 4 x</t>
+        <t>10 10 4 1</t>
+        <t>11 127 4 x</t>
+      </trans_list>
+      </state>
+
+      <state id="6">
+      <trans_list length="3">
+        <t>-128 9 6 x</t>
+        <t>10 10 168 4</t>
+        <t>11 127 6 x</t>
+      </trans_list>
+      </state>
+
+      <state id="7">
+      <trans_list length="7">
+        <t>-128 9 7 x</t>
+        <t>10 10 7 1</t>
+        <t>11 38 7 x</t>
+        <t>39 39 171 x</t>
+        <t>40 91 7 x</t>
+        <t>92 92 8 x</t>
+        <t>93 127 7 x</t>
+      </trans_list>
+      </state>
+
+      <state id="8">
+      <trans_list length="3">
+        <t>-128 9 7 x</t>
+        <t>10 10 7 1</t>
+        <t>11 127 7 x</t>
+      </trans_list>
+      </state>
+
+      <state id="9">
+      <trans_list length="7">
+        <t>-128 47 168 5</t>
+        <t>48 57 181 x</t>
+        <t>58 64 168 5</t>
+        <t>65 70 181 x</t>
+        <t>71 96 168 5</t>
+        <t>97 102 181 x</t>
+        <t>103 127 168 5</t>
+      </trans_list>
+      </state>
+
+      <state id="10" final="t">
+      <state_actions>6 7 x</state_actions>
+      <trans_list length="61">
+        <t>-128 -1 10 8</t>
+        <t>0 0 10 9</t>
+        <t>1 8 10 8</t>
+        <t>9 9 11 x</t>
+        <t>10 10 10 10</t>
+        <t>11 12 10 8</t>
+        <t>13 13 11 x</t>
+        <t>14 31 10 8</t>
+        <t>32 32 11 x</t>
+        <t>33 33 12 x</t>
+        <t>34 34 10 11</t>
+        <t>35 35 13 12</t>
+        <t>36 37 10 8</t>
+        <t>38 38 14 x</t>
+        <t>39 39 15 12</t>
+        <t>40 43 10 13</t>
+        <t>44 44 10 8</t>
+        <t>45 45 10 13</t>
+        <t>46 46 10 8</t>
+        <t>47 47 10 14</t>
+        <t>48 57 16 x</t>
+        <t>58 58 17 x</t>
+        <t>59 59 10 8</t>
+        <t>60 60 18 x</t>
+        <t>61 61 19 x</t>
+        <t>62 62 20 x</t>
+        <t>63 64 10 8</t>
+        <t>65 90 21 15</t>
+        <t>91 91 10 16</t>
+        <t>92 92 10 8</t>
+        <t>93 93 10 17</t>
+        <t>94 94 10 8</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 8</t>
+        <t>97 97 22 x</t>
+        <t>98 98 21 15</t>
+        <t>99 99 33 x</t>
+        <t>100 100 45 x</t>
+        <t>101 101 46 x</t>
+        <t>102 102 50 x</t>
+        <t>103 104 21 15</t>
+        <t>105 105 55 x</t>
+        <t>106 107 21 15</t>
+        <t>108 108 68 x</t>
+        <t>109 109 75 x</t>
+        <t>110 110 79 x</t>
+        <t>111 111 21 15</t>
+        <t>112 112 95 x</t>
+        <t>113 113 21 15</t>
+        <t>114 114 112 x</t>
+        <t>115 115 119 x</t>
+        <t>116 116 132 x</t>
+        <t>117 117 152 x</t>
+        <t>118 118 21 15</t>
+        <t>119 119 157 x</t>
+        <t>120 122 21 15</t>
+        <t>123 123 10 8</t>
+        <t>124 124 164 x</t>
+        <t>125 125 10 8</t>
+        <t>126 126 165 12</t>
+        <t>127 127 10 8</t>
+      </trans_list>
+      </state>
+
+      <state id="11" final="t">
+      <trans_list length="7">
+        <t>-128 8 10 18</t>
+        <t>9 9 11 x</t>
+        <t>10 12 10 18</t>
+        <t>13 13 11 x</t>
+        <t>14 31 10 18</t>
+        <t>32 32 11 x</t>
+        <t>33 127 10 18</t>
+      </trans_list>
+      </state>
+
+      <state id="12" final="t">
+      <trans_list length="3">
+        <t>-128 60 10 19</t>
+        <t>61 61 10 20</t>
+        <t>62 127 10 19</t>
+      </trans_list>
+      </state>
+
+      <state id="13" final="t">
+      <trans_list length="3">
+        <t>-128 9 0 x</t>
+        <t>10 10 10 0</t>
+        <t>11 127 0 x</t>
+      </trans_list>
+      </state>
+
+      <state id="14" final="t">
+      <trans_list length="3">
+        <t>-128 37 10 19</t>
+        <t>38 38 10 21</t>
+        <t>39 127 10 19</t>
+      </trans_list>
+      </state>
+
+      <state id="15" final="t">
+      <trans_list length="7">
+        <t>-128 9 1 x</t>
+        <t>10 10 1 1</t>
+        <t>11 38 1 x</t>
+        <t>39 39 10 2</t>
+        <t>40 91 1 x</t>
+        <t>92 92 2 x</t>
+        <t>93 127 1 x</t>
+      </trans_list>
+      </state>
+
+      <state id="16" final="t">
+      <trans_list length="3">
+        <t>-128 47 10 22</t>
+        <t>48 57 16 x</t>
+        <t>58 127 10 22</t>
+      </trans_list>
+      </state>
+
+      <state id="17" final="t">
+      <trans_list length="5">
+        <t>-128 57 10 19</t>
+        <t>58 58 10 23</t>
+        <t>59 60 10 19</t>
+        <t>61 61 10 24</t>
+        <t>62 127 10 19</t>
+      </trans_list>
+      </state>
+
+      <state id="18" final="t">
+      <trans_list length="5">
+        <t>-128 44 10 19</t>
+        <t>45 45 10 25</t>
+        <t>46 60 10 19</t>
+        <t>61 61 10 26</t>
+        <t>62 127 10 19</t>
+      </trans_list>
+      </state>
+
+      <state id="19" final="t">
+      <trans_list length="4">
+        <t>-128 60 10 19</t>
+        <t>61 61 10 27</t>
+        <t>62 62 10 28</t>
+        <t>63 127 10 19</t>
+      </trans_list>
+      </state>
+
+      <state id="20" final="t">
+      <trans_list length="3">
+        <t>-128 60 10 19</t>
+        <t>61 61 10 29</t>
+        <t>62 127 10 19</t>
+      </trans_list>
+      </state>
+
+      <state id="21" final="t">
+      <trans_list length="9">
+        <t>-128 47 10 30</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 30</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 30</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 30</t>
+        <t>97 122 21 15</t>
+        <t>123 127 10 30</t>
+      </trans_list>
+      </state>
+
+      <state id="22" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 98 21 15</t>
+        <t>99 99 23 x</t>
+        <t>100 107 21 15</t>
+        <t>108 108 27 x</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="23" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 24 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="24" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 104 21 15</t>
+        <t>105 105 25 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="25" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 110 21 15</t>
+        <t>111 111 26 x</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="26" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 21 32</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="27" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 111 21 15</t>
+        <t>112 112 28 x</t>
+        <t>113 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="28" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 103 21 15</t>
+        <t>104 104 29 x</t>
+        <t>105 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="29" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 30 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="30" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 120 21 15</t>
+        <t>121 121 31 x</t>
+        <t>122 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="31" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 111 21 15</t>
+        <t>112 112 32 x</t>
+        <t>113 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="32" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 33</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="33" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 101 21 15</t>
+        <t>102 102 34 x</t>
+        <t>103 110 21 15</t>
+        <t>111 111 35 x</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="34" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 21 34</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="35" final="t">
+      <trans_list length="12">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 108 21 15</t>
+        <t>109 109 36 x</t>
+        <t>110 110 39 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="36" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 108 21 15</t>
+        <t>109 109 37 x</t>
+        <t>110 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="37" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 104 21 15</t>
+        <t>105 105 38 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="38" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 21 35</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="39" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 114 21 15</t>
+        <t>115 115 40 x</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="40" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 41 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="41" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 42 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="42" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 116 21 15</t>
+        <t>117 117 43 x</t>
+        <t>118 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="43" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 98 21 15</t>
+        <t>99 99 44 x</t>
+        <t>100 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="44" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 21 36</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="45" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 110 21 15</t>
+        <t>111 111 21 37</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="46" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 47 x</t>
+        <t>109 109 21 15</t>
+        <t>110 110 49 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="47" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 114 21 15</t>
+        <t>115 115 48 x</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="48" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 38</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="49" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 99 21 15</t>
+        <t>100 100 21 39</t>
+        <t>101 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="50" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 104 21 15</t>
+        <t>105 105 51 x</t>
+        <t>106 110 21 15</t>
+        <t>111 111 54 x</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="51" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 52 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="52" final="t">
+      <trans_list length="12">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 53 x</t>
+        <t>98 99 21 15</t>
+        <t>100 100 21 40</t>
+        <t>101 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="53" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 21 41</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="54" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 21 42</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="55" final="t">
+      <trans_list length="16">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 101 21 15</t>
+        <t>102 102 21 43</t>
+        <t>103 103 56 x</t>
+        <t>104 109 21 15</t>
+        <t>110 110 60 x</t>
+        <t>111 115 21 15</t>
+        <t>116 116 66 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="56" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 57 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="57" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 110 21 15</t>
+        <t>111 111 58 x</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="58" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 59 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="59" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 44</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="60" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 98 21 15</t>
+        <t>99 99 61 x</t>
+        <t>100 104 21 15</t>
+        <t>105 105 65 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="61" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 62 x</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="62" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 116 21 15</t>
+        <t>117 117 63 x</t>
+        <t>118 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="63" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 99 21 15</t>
+        <t>100 100 64 x</t>
+        <t>101 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="64" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 45</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="65" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 21 46</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="66" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 67 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="67" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 21 47</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="68" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 69 x</t>
+        <t>102 104 21 15</t>
+        <t>105 105 70 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="69" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 119 21 15</t>
+        <t>120 120 21 48</t>
+        <t>121 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="70" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 71 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="71" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 72 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="72" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 73 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="73" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 74 x</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="74" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 21 49</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="75" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 76 x</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="76" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 77 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="77" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 98 21 15</t>
+        <t>99 99 78 x</t>
+        <t>100 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="78" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 103 21 15</t>
+        <t>104 104 21 50</t>
+        <t>105 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="79" final="t">
+      <trans_list length="15">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 80 x</t>
+        <t>98 100 21 15</t>
+        <t>101 101 87 x</t>
+        <t>102 102 89 x</t>
+        <t>103 110 21 15</t>
+        <t>111 111 90 x</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="80" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 108 21 15</t>
+        <t>109 109 81 x</t>
+        <t>110 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="81" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 82 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="82" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 114 21 15</t>
+        <t>115 115 83 x</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="83" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 111 21 15</t>
+        <t>112 112 84 x</t>
+        <t>113 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="84" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 85 x</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="85" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 98 21 15</t>
+        <t>99 99 86 x</t>
+        <t>100 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="86" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 51</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="87" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 119 21 15</t>
+        <t>120 120 88 x</t>
+        <t>121 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="88" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 21 52</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="89" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 21 53</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="90" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 91 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="91" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 92 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="92" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 93 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="93" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 94 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="94" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 108 21 15</t>
+        <t>109 109 21 54</t>
+        <t>110 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="95" final="t">
+      <trans_list length="14">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 96 x</t>
+        <t>98 99 21 15</t>
+        <t>100 100 104 x</t>
+        <t>101 113 21 15</t>
+        <t>114 114 105 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="96" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 97 x</t>
+        <t>115 115 21 15</t>
+        <t>116 116 100 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="97" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 114 21 15</t>
+        <t>115 115 98 x</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="98" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 99 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="99" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 21 55</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="100" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 101 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="101" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 102 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="102" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 103 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="103" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 21 56</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="104" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 21 57</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="105" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 104 21 15</t>
+        <t>105 105 106 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="106" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 58</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 58</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 58</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 58</t>
+        <t>97 109 21 15</t>
+        <t>110 110 107 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 58</t>
+      </trans_list>
+      </state>
+
+      <state id="107" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 108 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="108" final="t">
+      <trans_list length="9">
+        <t>-128 47 10 59</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 59</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 59</t>
+        <t>95 95 109 x</t>
+        <t>96 96 10 59</t>
+        <t>97 122 21 15</t>
+        <t>123 127 10 59</t>
+      </trans_list>
+      </state>
+
+      <state id="109" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 119 21 15</t>
+        <t>120 120 110 x</t>
+        <t>121 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="110" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 108 21 15</t>
+        <t>109 109 111 x</t>
+        <t>110 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="111" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 21 60</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="112" final="t">
+      <trans_list length="15">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 113 x</t>
+        <t>102 107 21 15</t>
+        <t>108 108 21 61</t>
+        <t>109 110 21 15</t>
+        <t>111 111 117 x</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="113" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 99 21 15</t>
+        <t>100 100 21 62</t>
+        <t>101 105 21 15</t>
+        <t>106 106 114 x</t>
+        <t>107 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="114" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 115 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="115" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 98 21 15</t>
+        <t>99 99 116 x</t>
+        <t>100 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="116" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 21 63</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="117" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 110 21 15</t>
+        <t>111 111 118 x</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="118" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 21 64</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="119" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 98 21 15</t>
+        <t>99 99 120 x</t>
+        <t>100 116 21 15</t>
+        <t>117 117 125 x</t>
+        <t>118 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="120" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 121 x</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="121" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 122 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="122" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 123 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="123" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 124 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="124" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 21 65</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="125" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 21 15</t>
+        <t>98 98 126 x</t>
+        <t>99 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="126" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 111 21 15</t>
+        <t>112 112 127 x</t>
+        <t>113 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="127" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 128 x</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="128" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 129 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="129" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 114 21 15</t>
+        <t>115 115 130 x</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="130" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 131 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="131" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 113 21 15</t>
+        <t>114 114 21 66</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="132" final="t">
+      <trans_list length="17">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 103 21 15</t>
+        <t>104 104 133 x</t>
+        <t>105 110 21 15</t>
+        <t>111 111 135 x</t>
+        <t>112 113 21 15</t>
+        <t>114 114 138 x</t>
+        <t>115 120 21 15</t>
+        <t>121 121 145 x</t>
+        <t>122 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="133" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 134 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="134" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 21 67</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="135" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 106 21 15</t>
+        <t>107 107 136 x</t>
+        <t>108 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="136" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 137 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="137" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 21 68</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="138" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 139 x</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="139" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 140 x</t>
+        <t>111 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="140" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 114 21 15</t>
+        <t>115 115 141 x</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="141" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 142 x</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="142" final="t">
+      <trans_list length="10">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 97 143 x</t>
+        <t>98 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="143" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 144 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="144" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 69</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="145" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 111 21 15</t>
+        <t>112 112 146 x</t>
+        <t>113 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="146" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 147 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="147" final="t">
+      <trans_list length="9">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 148 x</t>
+        <t>96 96 10 31</t>
+        <t>97 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="148" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 99 21 15</t>
+        <t>100 100 149 x</t>
+        <t>101 104 21 15</t>
+        <t>105 105 151 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="149" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 150 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="150" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 101 21 15</t>
+        <t>102 102 21 70</t>
+        <t>103 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="151" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 99 21 15</t>
+        <t>100 100 21 71</t>
+        <t>101 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="152" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 109 21 15</t>
+        <t>110 110 153 x</t>
+        <t>111 114 21 15</t>
+        <t>115 115 155 x</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="153" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 99 21 15</t>
+        <t>100 100 154 x</t>
+        <t>101 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="154" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 110 21 15</t>
+        <t>111 111 21 72</t>
+        <t>112 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="155" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 156 x</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="156" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 114 21 15</t>
+        <t>115 115 21 73</t>
+        <t>116 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="157" final="t">
+      <trans_list length="13">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 103 21 15</t>
+        <t>104 104 158 x</t>
+        <t>105 113 21 15</t>
+        <t>114 114 161 x</t>
+        <t>115 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="158" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 104 21 15</t>
+        <t>105 105 159 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="159" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 107 21 15</t>
+        <t>108 108 160 x</t>
+        <t>109 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="160" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 74</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="161" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 104 21 15</t>
+        <t>105 105 162 x</t>
+        <t>106 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="162" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 115 21 15</t>
+        <t>116 116 163 x</t>
+        <t>117 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="163" final="t">
+      <trans_list length="11">
+        <t>-128 47 10 31</t>
+        <t>48 57 21 15</t>
+        <t>58 64 10 31</t>
+        <t>65 90 21 15</t>
+        <t>91 94 10 31</t>
+        <t>95 95 21 15</t>
+        <t>96 96 10 31</t>
+        <t>97 100 21 15</t>
+        <t>101 101 21 75</t>
+        <t>102 122 21 15</t>
+        <t>123 127 10 31</t>
+      </trans_list>
+      </state>
+
+      <state id="164" final="t">
+      <trans_list length="3">
+        <t>-128 123 10 19</t>
+        <t>124 124 10 76</t>
+        <t>125 127 10 19</t>
+      </trans_list>
+      </state>
+
+      <state id="165" final="t">
+      <trans_list length="3">
+        <t>-128 9 3 x</t>
+        <t>10 10 10 3</t>
+        <t>11 127 3 x</t>
+      </trans_list>
+      </state>
+
+      <state id="166" final="t">
+      <state_actions>6 7 x</state_actions>
+      <trans_list length="8">
+        <t>-128 -1 166 77</t>
+        <t>0 0 166 78</t>
+        <t>1 44 166 77</t>
+        <t>45 45 166 79</t>
+        <t>46 91 166 77</t>
+        <t>92 92 167 x</t>
+        <t>93 93 166 80</t>
+        <t>94 127 166 77</t>
+      </trans_list>
+      </state>
+
+      <state id="167" final="t">
+      <trans_list length="18">
+        <t>-128 9 166 81</t>
+        <t>10 10 166 82</t>
+        <t>11 47 166 81</t>
+        <t>48 48 166 83</t>
+        <t>49 96 166 81</t>
+        <t>97 97 166 84</t>
+        <t>98 98 166 85</t>
+        <t>99 101 166 81</t>
+        <t>102 102 166 86</t>
+        <t>103 109 166 81</t>
+        <t>110 110 166 87</t>
+        <t>111 113 166 81</t>
+        <t>114 114 166 88</t>
+        <t>115 115 166 81</t>
+        <t>116 116 166 89</t>
+        <t>117 117 166 81</t>
+        <t>118 118 166 90</t>
+        <t>119 127 166 81</t>
+      </trans_list>
+      </state>
+
+      <state id="168" final="t">
+      <state_actions>6 7 x</state_actions>
+      <trans_list length="47">
+        <t>-128 -1 168 91</t>
+        <t>0 0 168 92</t>
+        <t>1 8 168 91</t>
+        <t>9 9 169 x</t>
+        <t>10 10 168 93</t>
+        <t>11 12 168 91</t>
+        <t>13 13 169 x</t>
+        <t>14 31 168 91</t>
+        <t>32 32 169 x</t>
+        <t>33 33 168 91</t>
+        <t>34 34 170 12</t>
+        <t>35 35 172 12</t>
+        <t>36 36 173 x</t>
+        <t>37 37 174 x</t>
+        <t>38 38 168 91</t>
+        <t>39 39 175 12</t>
+        <t>40 41 168 91</t>
+        <t>42 42 176 x</t>
+        <t>43 44 168 91</t>
+        <t>45 45 177 x</t>
+        <t>46 46 178 x</t>
+        <t>47 47 168 94</t>
+        <t>48 48 179 12</t>
+        <t>49 57 180 x</t>
+        <t>58 58 182 x</t>
+        <t>59 59 168 91</t>
+        <t>60 60 184 x</t>
+        <t>61 61 168 91</t>
+        <t>62 62 186 x</t>
+        <t>63 63 168 91</t>
+        <t>64 64 187 x</t>
+        <t>65 90 188 95</t>
+        <t>91 91 189 x</t>
+        <t>92 94 168 91</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 91</t>
+        <t>97 100 188 95</t>
+        <t>101 101 190 x</t>
+        <t>102 102 193 x</t>
+        <t>103 107 188 95</t>
+        <t>108 108 196 x</t>
+        <t>109 115 188 95</t>
+        <t>116 116 199 x</t>
+        <t>117 118 188 95</t>
+        <t>119 119 200 x</t>
+        <t>120 122 188 95</t>
+        <t>123 127 168 91</t>
+      </trans_list>
+      </state>
+
+      <state id="169" final="t">
+      <trans_list length="7">
+        <t>-128 8 168 96</t>
+        <t>9 9 169 x</t>
+        <t>10 12 168 96</t>
+        <t>13 13 169 x</t>
+        <t>14 31 168 96</t>
+        <t>32 32 169 x</t>
+        <t>33 127 168 96</t>
+      </trans_list>
+      </state>
+
+      <state id="170" final="t">
+      <trans_list length="7">
+        <t>-128 9 4 x</t>
+        <t>10 10 4 1</t>
+        <t>11 33 4 x</t>
+        <t>34 34 171 x</t>
+        <t>35 91 4 x</t>
+        <t>92 92 5 x</t>
+        <t>93 127 4 x</t>
+      </trans_list>
+      </state>
+
+      <state id="171" final="t">
+      <trans_list length="3">
+        <t>-128 104 168 97</t>
+        <t>105 105 168 98</t>
+        <t>106 127 168 97</t>
+      </trans_list>
+      </state>
+
+      <state id="172" final="t">
+      <trans_list length="3">
+        <t>-128 9 6 x</t>
+        <t>10 10 168 4</t>
+        <t>11 127 6 x</t>
+      </trans_list>
+      </state>
+
+      <state id="173" final="t">
+      <trans_list length="13">
+        <t>-128 32 168 99</t>
+        <t>33 33 168 100</t>
+        <t>34 41 168 99</t>
+        <t>42 42 168 101</t>
+        <t>43 46 168 99</t>
+        <t>47 47 168 102</t>
+        <t>48 62 168 99</t>
+        <t>63 63 168 103</t>
+        <t>64 93 168 99</t>
+        <t>94 94 168 104</t>
+        <t>95 125 168 99</t>
+        <t>126 126 168 105</t>
+        <t>127 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="174" final="t">
+      <trans_list length="13">
+        <t>-128 32 168 99</t>
+        <t>33 33 168 106</t>
+        <t>34 41 168 99</t>
+        <t>42 42 168 107</t>
+        <t>43 46 168 99</t>
+        <t>47 47 168 108</t>
+        <t>48 62 168 99</t>
+        <t>63 63 168 109</t>
+        <t>64 93 168 99</t>
+        <t>94 94 168 110</t>
+        <t>95 125 168 99</t>
+        <t>126 126 168 111</t>
+        <t>127 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="175" final="t">
+      <trans_list length="7">
+        <t>-128 9 7 x</t>
+        <t>10 10 7 1</t>
+        <t>11 38 7 x</t>
+        <t>39 39 171 x</t>
+        <t>40 91 7 x</t>
+        <t>92 92 8 x</t>
+        <t>93 127 7 x</t>
+      </trans_list>
+      </state>
+
+      <state id="176" final="t">
+      <trans_list length="3">
+        <t>-128 41 168 99</t>
+        <t>42 42 168 112</t>
+        <t>43 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="177" final="t">
+      <trans_list length="5">
+        <t>-128 44 168 99</t>
+        <t>45 45 168 113</t>
+        <t>46 61 168 99</t>
+        <t>62 62 168 114</t>
+        <t>63 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="178" final="t">
+      <trans_list length="3">
+        <t>-128 45 168 99</t>
+        <t>46 46 168 115</t>
+        <t>47 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="179" final="t">
+      <trans_list length="5">
+        <t>-128 47 168 116</t>
+        <t>48 57 180 x</t>
+        <t>58 119 168 116</t>
+        <t>120 120 9 x</t>
+        <t>121 127 168 116</t>
+      </trans_list>
+      </state>
+
+      <state id="180" final="t">
+      <trans_list length="3">
+        <t>-128 47 168 116</t>
+        <t>48 57 180 x</t>
+        <t>58 127 168 116</t>
+      </trans_list>
+      </state>
+
+      <state id="181" final="t">
+      <trans_list length="7">
+        <t>-128 47 168 117</t>
+        <t>48 57 181 x</t>
+        <t>58 64 168 117</t>
+        <t>65 70 181 x</t>
+        <t>71 96 168 117</t>
+        <t>97 102 181 x</t>
+        <t>103 127 168 117</t>
+      </trans_list>
+      </state>
+
+      <state id="182" final="t">
+      <trans_list length="4">
+        <t>-128 60 168 99</t>
+        <t>61 61 168 118</t>
+        <t>62 62 183 x</t>
+        <t>63 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="183" final="t">
+      <trans_list length="3">
+        <t>-128 61 168 119</t>
+        <t>62 62 168 120</t>
+        <t>63 127 168 119</t>
+      </trans_list>
+      </state>
+
+      <state id="184" final="t">
+      <trans_list length="15">
+        <t>-128 32 168 99</t>
+        <t>33 33 168 121</t>
+        <t>34 41 168 99</t>
+        <t>42 42 168 122</t>
+        <t>43 46 168 99</t>
+        <t>47 47 168 123</t>
+        <t>48 57 168 99</t>
+        <t>58 58 168 124</t>
+        <t>59 61 168 99</t>
+        <t>62 62 185 x</t>
+        <t>63 93 168 99</t>
+        <t>94 94 168 125</t>
+        <t>95 125 168 99</t>
+        <t>126 126 168 126</t>
+        <t>127 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="185" final="t">
+      <trans_list length="11">
+        <t>-128 32 168 127</t>
+        <t>33 33 168 128</t>
+        <t>34 41 168 127</t>
+        <t>42 42 168 129</t>
+        <t>43 46 168 127</t>
+        <t>47 47 168 130</t>
+        <t>48 93 168 127</t>
+        <t>94 94 168 131</t>
+        <t>95 125 168 127</t>
+        <t>126 126 168 132</t>
+        <t>127 127 168 127</t>
+      </trans_list>
+      </state>
+
+      <state id="186" final="t">
+      <trans_list length="13">
+        <t>-128 32 168 99</t>
+        <t>33 33 168 133</t>
+        <t>34 41 168 99</t>
+        <t>42 42 168 134</t>
+        <t>43 46 168 99</t>
+        <t>47 47 168 135</t>
+        <t>48 62 168 99</t>
+        <t>63 63 168 136</t>
+        <t>64 93 168 99</t>
+        <t>94 94 168 137</t>
+        <t>95 125 168 99</t>
+        <t>126 126 168 138</t>
+        <t>127 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="187" final="t">
+      <trans_list length="11">
+        <t>-128 32 168 99</t>
+        <t>33 33 168 139</t>
+        <t>34 41 168 99</t>
+        <t>42 42 168 140</t>
+        <t>43 46 168 99</t>
+        <t>47 47 168 141</t>
+        <t>48 93 168 99</t>
+        <t>94 94 168 142</t>
+        <t>95 125 168 99</t>
+        <t>126 126 168 143</t>
+        <t>127 127 168 99</t>
+      </trans_list>
+      </state>
+
+      <state id="188" final="t">
+      <trans_list length="9">
+        <t>-128 47 168 144</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 144</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 144</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 144</t>
+        <t>97 122 188 95</t>
+        <t>123 127 168 144</t>
+      </trans_list>
+      </state>
+
+      <state id="189" final="t">
+      <trans_list length="3">
+        <t>-128 93 168 145</t>
+        <t>94 94 168 146</t>
+        <t>95 127 168 145</t>
+      </trans_list>
+      </state>
+
+      <state id="190" final="t">
+      <trans_list length="13">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 110 188 95</t>
+        <t>111 111 191 x</t>
+        <t>112 113 188 95</t>
+        <t>114 114 192 x</t>
+        <t>115 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="191" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 101 188 95</t>
+        <t>102 102 188 148</t>
+        <t>103 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="192" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 113 188 95</t>
+        <t>114 114 188 149</t>
+        <t>115 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="193" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 113 188 95</t>
+        <t>114 114 194 x</t>
+        <t>115 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="194" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 110 188 95</t>
+        <t>111 111 195 x</t>
+        <t>112 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="195" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 108 188 95</t>
+        <t>109 109 188 150</t>
+        <t>110 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="196" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 100 188 95</t>
+        <t>101 101 197 x</t>
+        <t>102 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="197" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 113 188 95</t>
+        <t>114 114 198 x</t>
+        <t>115 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="198" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 113 188 95</t>
+        <t>114 114 188 151</t>
+        <t>115 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="199" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 110 188 95</t>
+        <t>111 111 188 152</t>
+        <t>112 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="200" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 103 188 95</t>
+        <t>104 104 201 x</t>
+        <t>105 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="201" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 100 188 95</t>
+        <t>101 101 202 x</t>
+        <t>102 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="202" final="t">
+      <trans_list length="11">
+        <t>-128 47 168 147</t>
+        <t>48 57 188 95</t>
+        <t>58 64 168 147</t>
+        <t>65 90 188 95</t>
+        <t>91 94 168 147</t>
+        <t>95 95 188 95</t>
+        <t>96 96 168 147</t>
+        <t>97 109 188 95</t>
+        <t>110 110 188 153</t>
+        <t>111 122 188 95</t>
+        <t>123 127 168 147</t>
+      </trans_list>
+      </state>
+
+      <state id="203" final="t">
+      <state_actions>6 7 x</state_actions>
+      <trans_list length="8">
+        <t>-128 9 203 154</t>
+        <t>10 10 203 155</t>
+        <t>11 33 203 154</t>
+        <t>34 34 203 156</t>
+        <t>35 90 203 154</t>
+        <t>91 91 203 157</t>
+        <t>92 92 204 x</t>
+        <t>93 127 203 154</t>
+      </trans_list>
+      </state>
+
+      <state id="204" final="t">
+      <trans_list length="14">
+        <t>-128 96 203 158</t>
+        <t>97 97 203 159</t>
+        <t>98 98 203 160</t>
+        <t>99 101 203 158</t>
+        <t>102 102 203 161</t>
+        <t>103 109 203 158</t>
+        <t>110 110 203 162</t>
+        <t>111 113 203 158</t>
+        <t>114 114 203 163</t>
+        <t>115 115 203 158</t>
+        <t>116 116 203 164</t>
+        <t>117 117 203 158</t>
+        <t>118 118 203 165</t>
+        <t>119 127 203 158</t>
+      </trans_list>
+      </state>
+    </state_list>
+  </machine>
+</ragel_def>
+<ragel_def name="section_parse">
+  <alphtype>int</alphtype>
+  <machine>
+    <action_list length="5">
+      <action id="0" name="clear_words" line="97" col="21"><text> word = lit = 0; word_len = lit_len = 0; </text></action>
+      <action id="1" name="store_lit" line="98" col="19"><text> lit = tokdata; lit_len = toklen; </text></action>
+      <action id="2" name="incl_err" line="101" col="18"><text> scan_error() &lt;&lt; "bad include statement" &lt;&lt; endl; </text></action>
+      <action id="3" name="handle_include" line="105" col="2"><text>
+		#if 0	/* Everything up to the matching #endif is compiled out, so this action currently emits no code. */
+		char *inclSectionName = word;	/* word and lit are reset to 0 by the clear_words action. */
+		char *inclFileName = 0;
+
+		/* Fall back to the parser's section name and the current file when none was given. */
+		if ( inclSectionName == 0 )
+			inclSectionName = parser-&gt;sectionName;
+
+		if ( lit != 0 ) 
+			inclFileName = prepareFileName( lit, lit_len );
+		else
+			inclFileName = fileName;
+
+		/* Check for a recursive include structure. Add the current file/section
+		 * name then check if what we are including is already in the stack. */
+		includeStack.append( IncludeStackItem( fileName, parser-&gt;sectionName ) );
+
+		if ( recursiveInclude( inclFileName, inclSectionName ) )
+			scan_error() &lt;&lt; "include: this is a recursive include operation" &lt;&lt; endl;
+		else {
+			/* Open the input file for reading. */
+			ifstream *inFile = new ifstream( inclFileName );
+			if ( ! inFile-&gt;is_open() ) {
+				scan_error() &lt;&lt; "include: could not open " &lt;&lt; 
+						inclFileName &lt;&lt; " for reading" &lt;&lt; endl;
+			}	/* NOTE(review): no early exit after the error; the nested scan below still runs on the unopened stream. */
+
+			Scanner scanner( inclFileName, *inFile, output, parser,
+					inclSectionName, includeDepth+1 );	/* Nested scanner runs one include level deeper. */
+			scanner.do_scan( );
+			delete inFile;
+		}
+
+		/* Pop the entry appended above: remove the last element (len-1). */
+		includeStack.remove( -1 );
+		#endif	/* End of the disabled include handling. */
+	</text></action>
+      <action id="4" name="handle_token" line="152" col="2"><text>
+		InputLoc loc;	/* Location record passed to the parser together with the token. */
+
+		#ifdef PRINT_TOKENS	/* Debug trace of each token; compiled only when PRINT_TOKENS is defined. */
+		cerr &lt;&lt; "scanner:" &lt;&lt; line &lt;&lt; ":" &lt;&lt; column &lt;&lt; 
+				": sending token to the parser " &lt;&lt; Parser_lelNames[*p];
+		cerr &lt;&lt; " " &lt;&lt; toklen;
+		if ( tokdata != 0 )	/* tokdata may be null, in which case only the length is printed. */
+			cerr &lt;&lt; " " &lt;&lt; tokdata;
+		cerr &lt;&lt; endl;
+		#endif
+
+		loc.fileName = fileName;	/* Fill loc from the scanner's current file, line and column. */
+		loc.line = line;
+		loc.col = column;
+
+		parser-&gt;token( loc, type, tokdata, toklen );	/* Hand the token type, data and length, plus its location, to the parser. */
+	</text></action>
+    </action_list>
+    <action_table_list length="4">
+      <action_table id="0" length="1">2</action_table>
+      <action_table id="1" length="2">0 1</action_table>
+      <action_table id="2" length="1">3</action_table>
+      <action_table id="3" length="1">4</action_table>
+    </action_table_list>
+    <start_state>3</start_state>
+    <error_state>0</error_state>
+    <entry_points>
+      <entry name="main">3</entry>
+    </entry_points>
+    <state_list length="4">
+      <state id="0">
+      <trans_list length="0">
+      </trans_list>
+      </state>
+
+      <state id="1">
+      <state_actions>x x 0</state_actions>
+      <trans_list length="3">
+        <t>-2147483648 131 x 0</t>
+        <t>132 132 2 1</t>
+        <t>133 2147483647 x 0</t>
+      </trans_list>
+      </state>
+
+      <state id="2">
+      <state_actions>x x 0</state_actions>
+      <trans_list length="3">
+        <t>-2147483648 58 x 0</t>
+        <t>59 59 3 2</t>
+        <t>60 2147483647 x 0</t>
+      </trans_list>
+      </state>
+
+      <state id="3" final="t">
+      <trans_list length="3">
+        <t>-2147483648 128 3 3</t>
+        <t>129 129 1 x</t>
+        <t>130 2147483647 3 3</t>
+      </trans_list>
+      </state>
+    </state_list>
+  </machine>
+</ragel_def>
+<host line="1" col="1">/*
+ *  Copyright 2006-2007 Adrian Thurston &lt;thurston@cs.queensu.ca&gt;
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include &lt;iostream&gt;
+#include &lt;fstream&gt;
+#include &lt;string.h&gt;
+
+#include "colm.h"
+#include "lmscan.h"
+#include "lmparse.h"
+#include "parsedata.h"
+#include "avltree.h"
+#include "vector.h"
+
+//#define PRINT_TOKENS
+
+using std::ifstream;
+using std::istream;
+using std::ostream;
+using std::cout;
+using std::cerr;
+using std::endl;
+
+</host>
+<write def_name="section_parse" line="45" col="2"><arg>data</arg></write>
+<host line="46">
+
+void Scanner::sectionParseInit()
+{
+	</host>
+<write def_name="section_parse" line="50" col="5"><arg>init</arg></write>
+<host line="51">}
+
+ostream &amp;Scanner::scan_error()
+{
+	/* Maintain the error count. */
+	gblErrorCount += 1;
+	cerr &lt;&lt; fileName &lt;&lt; ":" &lt;&lt; line &lt;&lt; ":" &lt;&lt; column &lt;&lt; ": ";
+	return cerr;
+}
+
+bool Scanner::recursiveInclude( char *inclFileName, char *inclSectionName )
+{
+	for ( IncludeStack::Iter si = includeStack; si.lte(); si++ ) {
+		if ( strcmp( si-&gt;fileName, inclFileName ) == 0 &amp;&amp;
+				strcmp( si-&gt;sectionName, inclSectionName ) == 0 )
+		{
+			return true;
+		}
+	}
+	return false;	
+}
+
+void Scanner::updateCol()
+{
+	char *from = lastnl;
+	if ( from == 0 )
+		from = tokstart;
+	//cerr &lt;&lt; "adding " &lt;&lt; tokend - from &lt;&lt; " to column" &lt;&lt; endl;
+	column += tokend - from;
+	lastnl = 0;
+}
+
+void Scanner::token( int type, char c )
+{
+	token( type, &amp;c, &amp;c + 1 );
+}
+
+void Scanner::token( int type )
+{
+	token( type, 0, 0 );
+}
+
+</host>
+<host line="178">
+
+void Scanner::token( int type, char *start, char *end )
+{
+	char *tokdata = 0;
+	int toklen = 0;
+	int *p = &amp;type;
+	int *pe = &amp;type + 1;
+
+	if ( start != 0 ) {
+		toklen = end-start;
+		tokdata = new char[toklen+1];
+		memcpy( tokdata, start, toklen );
+		tokdata[toklen] = 0;
+	}
+
+	</host>
+<write def_name="section_parse" line="196" col="3"><arg>exec</arg></write>
+<host line="197">
+
+	updateCol();
+}
+
+void Scanner::endSection( )
+{
+	/* Execute the eof actions for the section parser. */
+	</host>
+<write def_name="section_parse" line="207" col="3"><arg>eof</arg></write>
+<host line="208">
+}
+
+</host>
+<host line="516">
+
+</host>
+<write def_name="rlscan" line="518" col="4"><arg>data</arg></write>
+<host line="519">
+void Scanner::do_scan()
+{
+	int bufsize = 8;
+	char *buf = new char[bufsize];
+	const char last_char = 0;
+	int cs, act, have = 0;
+	int top, stack[32];
+	bool execute = true;
+
+	sectionParseInit();
+	</host>
+<write def_name="rlscan" line="530" col="5"><arg>init</arg></write>
+<host line="531">
+	while ( execute ) {
+		char *p = buf + have;
+		int space = bufsize - have;
+
+		if ( space == 0 ) {
+			/* We filled up the buffer trying to scan a token. Grow it. */
+			bufsize = bufsize * 2;
+			char *newbuf = new char[bufsize];
+
+			/* Recompute p and space. */
+			p = newbuf + have;
+			space = bufsize - have;
+
+			/* Patch up pointers possibly in use. */
+			if ( tokstart != 0 )
+				tokstart = newbuf + ( tokstart - buf );
+			tokend = newbuf + ( tokend - buf );
+
+			/* Copy the new buffer in. */
+			memcpy( newbuf, buf, have );
+			delete[] buf;
+			buf = newbuf;
+		}
+
+		input.read( p, space );
+		int len = input.gcount();
+
+		/* If we see eof then append the EOF char. */
+	 	if ( len == 0 ) {
+			p[0] = last_char, len = 1;
+			execute = false;
+		}
+
+		char *pe = p + len;
+		</host>
+<write def_name="rlscan" line="566" col="6"><arg>exec</arg></write>
+<host line="567">
+		/* Check if we failed. */
+		if ( cs == rlscan_error ) {
+			/* Machine failed before finding a token. I'm not yet sure if this
+			 * is reachable. */
+			scan_error() &lt;&lt; "scanner error" &lt;&lt; endl;
+			exit(1);
+		}
+
+		/* Decide if we need to preserve anything. */
+		char *preserve = tokstart;
+
+		/* Now set up the prefix. */
+		if ( preserve == 0 )
+			have = 0;
+		else {
+			/* There is data that needs to be shifted over. */
+			have = pe - preserve;
+			memmove( buf, preserve, have );
+			unsigned int shiftback = preserve - buf;
+			if ( tokstart != 0 )
+				tokstart -= shiftback;
+			tokend -= shiftback;
+
+			preserve = buf;
+		}
+	}
+	delete[] buf;
+
+	InputLoc loc;
+	loc.fileName = "&lt;EOF&gt;";
+	loc.line = line;
+	loc.col = 1;
+	parser-&gt;token( loc, _eof, 0, 0 );
+}
+
+void scan( char *fileName, istream &amp;input, ostream &amp;output )
+{
+	Scanner scanner( fileName, input, output, 0, 0, 0 );
+}
+</host>
+</ragel>
diff --git a/test/xml/xml.lm b/test/xml/xml.lm
new file mode 100644
index 00000000..c8749bab
--- /dev/null
+++ b/test/xml/xml.lm
@@ -0,0 +1,167 @@
+#
+# Definitions
+#
+
+rl xml_digit / (0x30..0x39) /
+
+rl base_char / 0x41..0x5A | 0x61..0x7A /
+
+rl char / 0x9 | 0xA | 0xD | 0x20..0x7f /
+
+rl letter / base_char /
+
+rl name_char / letter | digit | '.' | '-' | '_' | ':' | 0xb7 /
+
+rl name / (letter | '_' | ':') name_char* /
+
+#
+# Reference definitions. These appear in the 
+# top level and also in strings.
+#
+
+rl entity_ref_pat / '&' name ';' /
+# Character references are decimal (&#NNN;) or hexadecimal (&#xHHH;).
+rl char_ref_pat / '&#' [0-9]+ ';' | '&#x' [0-9a-fA-F]+ ';' /
+
+#
+# Single quotes.
+#
+lex sq
+{
+	token sq_close /'\''/
+
+	# References in single quotes
+	token sq_entity_ref /entity_ref_pat/
+	token sq_char_ref /char_ref_pat/
+
+	token sq_data / [^<&']+ /
+
+	def sq_item 
+		[ sq_data ]
+	|	[ sq_entity_ref ]
+	|	[ sq_char_ref ]
+
+	# The opening quote belongs to the tag region. 
+	def sq_string 
+		[ '\'' sq_item* sq_close ]
+}
+
+#
+# Double quotes.
+#
+lex dq
+{
+	token dq_close /'"'/
+
+	# References in double quotes
+	token dq_entity_ref /entity_ref_pat/
+	token dq_char_ref /char_ref_pat/
+
+	token dq_data / [^<&"]+ /
+
+	def dq_item 
+		[ dq_data ]
+	|	[ dq_entity_ref ]
+	|	[ dq_char_ref ]
+
+	# The opening quote belongs to the tag region. 
+	def dq_string 
+		[ '"' dq_item* dq_close ]
+}
+
+#
+# Tag elements. 
+#
+lex tag
+{
+	literal '\'', '\"', '=', '\/', '>'
+
+	# Within this region whitespace is not significant.
+	ignore xml_space / (0x20 | 0x9 | 0xD | 0xA)+ /
+
+	#
+	# Attributes
+	#
+	token attr_name / name /
+}
+
+#
+# Top Level
+#
+lex start
+{
+	#
+	# Comments
+	#
+
+	# Cannot contain '--'
+	rl char_no_dash / char - '-' /
+	token comment / '<!--' ( char_no_dash | '-' char_no_dash )* '-->' /
+
+
+	# Opening a tag.
+	literal '<'
+
+	#
+	# Character Data
+	#
+
+	token cdata / '<![CDATA[' char* :> ']]>'/
+	token char_data / [^<&]+ /
+	token entity_ref /entity_ref_pat/
+	token char_ref /char_ref_pat/
+}
+
+
+def attribute_value 
+	[ sq_string ]
+|	[ dq_string ]
+
+def attribute 
+	[ attr_name '=' attribute_value ]
+
+def empty_tag 
+	[ '<' attr_name attribute* '/' '>' ]
+
+def close_tag 
+	[ '<' '/' attr_name '>' ]
+
+def open_tag 
+	[ '<' attr_name attribute* '>' ]
+
+def tag 
+	[open_tag content close_tag]
+
+def content_item 
+	[tag]
+|	[empty_tag]
+|	[char_data]
+|	[entity_ref]
+|	[char_ref]
+|	[cdata]
+|	[comment]
+
+def content 
+	[content_item*]
+
+def document 
+	[content]
+
+def start 
+	[document]
+	{
+		for Switch:tag in lhs {
+			if match Switch
+					["<lm_switch>" SwitchContent:content "</lm_switch>"]
+			{
+				print( 'SWITCH\n' )
+				for Text:tag in SwitchContent {
+					if match Text
+							["<text>" TextContent:content "</text>"]
+					{
+						print( ' ', TextContent, '\n' )
+					}
+				}
+			}
+		}
+	}
diff --git a/version.mk b/version.mk
new file mode 100644
index 00000000..8272a624
--- /dev/null
+++ b/version.mk
@@ -0,0 +1,2 @@
+VERSION = 0.1.0
+PUBDATE = June 2008
-- 
cgit v1.2.1

-- 
cgit v1.2.1


From f37a1daa7fad185883204c9125c1eb2c1723e364 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 1 Nov 2008 18:03:10 +0000
Subject: Moved the headers and code from common/ into colm/.

---
 Makefile.in        |   2 +-
 colm/Makefile.in   |  16 ++-
 colm/buffer.h      |  55 +++++++++++
 colm/common.cpp    | 257 ++++++++++++++++++++++++++++++++++++++++++++++++
 colm/common.h      | 283 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 colm/config.h.in   |  50 ++++++++++
 colm/pcheck.h      |  48 +++++++++
 common/Makefile.in |  67 -------------
 common/buffer.h    |  55 -----------
 common/common.cpp  | 257 ------------------------------------------------
 common/common.h    | 283 -----------------------------------------------------
 common/config.h.in |  50 ----------
 common/pcheck.h    |  48 ---------
 configure          |   7 +-
 configure.in       |   4 +-
 15 files changed, 711 insertions(+), 771 deletions(-)
 create mode 100644 colm/buffer.h
 create mode 100644 colm/common.cpp
 create mode 100644 colm/common.h
 create mode 100644 colm/config.h.in
 create mode 100644 colm/pcheck.h
 delete mode 100644 common/Makefile.in
 delete mode 100644 common/buffer.h
 delete mode 100644 common/common.cpp
 delete mode 100644 common/common.h
 delete mode 100644 common/config.h.in
 delete mode 100644 common/pcheck.h

diff --git a/Makefile.in b/Makefile.in
index 26e4b879..f14d2473 100644
--- a/Makefile.in
+++ b/Makefile.in
@@ -19,7 +19,7 @@
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
-BUILD_SUBDIRS = common colm
+BUILD_SUBDIRS = colm
 ALL_SUBDIRS = $(BUILD_SUBDIRS) test
 
 #*************************************
diff --git a/colm/Makefile.in b/colm/Makefile.in
index 61b57867..21dba83c 100644
--- a/colm/Makefile.in
+++ b/colm/Makefile.in
@@ -18,7 +18,7 @@
 #   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
-INCS += -I../common -I../aapl
+INCS += -I../aapl
 DEFS +=
 
 CFLAGS += -g -Wall -Wwrite-strings
@@ -28,6 +28,7 @@ LDFLAGS +=
 CC_SRCS = \
 	compile.cpp \
 	bytecode.cpp \
+	tree.cpp \
 	fsmrun.cpp \
 	pdarun.cpp \
 	input.cpp \
@@ -54,18 +55,21 @@ CC_SRCS = \
 	closure.cpp \
 	fsmap.cpp \
 	dotgen.cpp \
-	tree.cpp
+	common.cpp
 
 RUNTIME_SRC = fsmrun.cpp pdarun.cpp bytecode.cpp list.cpp \
 	map.cpp string.cpp input.cpp tree.cpp
-GEN_SRC = lmscan.cpp lmparse.h lmparse.cpp 
+GEN_SRC = version.h lmscan.cpp lmparse.h lmparse.cpp 
 
 RUNTIME = runtime.a
 
-LIBS = ../common/common.a
+LIBS = 
 
 #*************************************
 
+# Get the version info.
+include ../version.mk
+
 PREFIX = @prefix@
 
 BUILD_PARSERS = @BUILD_PARSERS@
@@ -87,6 +91,10 @@ colm: $(GEN_SRC) $(OBJS) $(LIBS)
 $(RUNTIME): $(RUNTIME_OBJS)
 	ar -cr $@ $(RUNTIME_OBJS)
 
+version.h: ../version.mk
+	echo '#define VERSION "$(VERSION)"' > version.h
+	echo '#define PUBDATE "$(PUBDATE)"' >> version.h
+
 ifeq ($(BUILD_PARSERS),true)
 
 lmparse.h: lmparse.kh
diff --git a/colm/buffer.h b/colm/buffer.h
new file mode 100644
index 00000000..99c4e82d
--- /dev/null
+++ b/colm/buffer.h
@@ -0,0 +1,55 @@
+/*
+ *  Copyright 2003 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _BUFFER_H
+#define _BUFFER_H
+
+#define BUFFER_INITIAL_SIZE 4096
+
+/* An automatically grown buffer for collecting tokens. Always reuses space;
+ * never down resizes. Aborts the program if memory cannot be obtained. */
+struct Buffer
+{
+	Buffer() : data((char*) malloc( BUFFER_INITIAL_SIZE )),
+		allocated(BUFFER_INITIAL_SIZE), length(0) { if ( data == 0 ) abort(); }
+	~Buffer() { free(data); }
+
+	/* Append one character, doubling the storage first when it is full. */
+	void append( char p )
+	{
+		if ( length == allocated ) {
+			/* Keep the old block until realloc is known to have succeeded. */
+			char *grown = (char*) realloc( data, allocated * 2 );
+			if ( grown == 0 )
+				abort();
+			data = grown, allocated *= 2;
+		}
+		data[length++] = p;
+	}
+
+	void clear() { length = 0; }	/* Forget the contents, keep the storage. */
+
+	char *data;
+	int allocated;
+	int length;
+};
+
+#endif /* _BUFFER_H */
diff --git a/colm/common.cpp b/colm/common.cpp
new file mode 100644
index 00000000..e6b0a70b
--- /dev/null
+++ b/colm/common.cpp
@@ -0,0 +1,257 @@
+/*
+ *  Copyright 2006-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "pcheck.h"
+#include "common.h"
+#include <assert.h>
+
+HostType hostTypesC[] =	/* Row fields: data1, data2, isSigned, minVal, maxVal, size. */
+{
+	{ "char",     0,       (CHAR_MIN != 0), CHAR_MIN, CHAR_MAX, sizeof(char) },  /* plain char may be unsigned */
+	{ "unsigned", "char",  false,  0,         UCHAR_MAX,  sizeof(unsigned char) },
+	{ "short",    0,       true,   SHRT_MIN,  SHRT_MAX,   sizeof(short) },
+	{ "unsigned", "short", false,  0,         USHRT_MAX,  sizeof(unsigned short) },
+	{ "int",      0,       true,   INT_MIN,   INT_MAX,    sizeof(int) },
+	{ "unsigned", "int",   false,  0,         UINT_MAX,   sizeof(unsigned int) },
+	{ "long",     0,       true,   LONG_MIN,  LONG_MAX,   sizeof(long) },
+	{ "unsigned", "long",  false,  0,         ULONG_MAX,  sizeof(unsigned long) }
+};
+
+HostType hostTypesD[] =
+{
+	{ "byte",     0,  true,   SCHAR_MIN, SCHAR_MAX,   1 },  /* signed 8-bit whatever the build host's char is */
+	{ "ubyte",    0,  false,  0,         UCHAR_MAX,   1 },
+	{ "char",     0,  false,  0,         UCHAR_MAX,   1 },
+	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
+	{ "ushort",   0,  false,  0,         USHRT_MAX,   2 },
+	{ "wchar",    0,  false,  0,         USHRT_MAX,   2 },
+	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
+	{ "uint",     0,  false,  0,         UINT_MAX,    4 },
+	{ "dchar",    0,  false,  0,         UINT_MAX,    4 }
+};
+
+HostType hostTypesJava[] = 
+{
+	{ "byte",     0,  true,   SCHAR_MIN, SCHAR_MAX,   1 },  /* signed 8-bit whatever the build host's char is */
+	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
+	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
+	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
+};
+
+HostType hostTypesRuby[] = 
+{
+	{ "byte",     0,  true,   SCHAR_MIN, SCHAR_MAX,   1 },  /* kept in step with the Java table */
+	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
+	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
+	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
+};
+
+HostLang hostLangC =    { hostTypesC,    8, hostTypesC+0,    true };	/* table, entry count, default alphabet type, explicitUnsigned */
+HostLang hostLangD =    { hostTypesD,    9, hostTypesD+2,    true };
+HostLang hostLangJava = { hostTypesJava, 4, hostTypesJava+2, false };
+HostLang hostLangRuby = { hostTypesRuby, 4, hostTypesRuby+2, false };
+
+HostLang *hostLang = &hostLangC;	/* Host language in effect; C unless changed. */
+HostLangType hostLangType = CCode;
+
+/* Construct a new parameter checker for paramSpec. Scanning begins at
+ * argv[1]; parameter and parameterArg stay zero until check() sets them. */
+ParamCheck::ParamCheck( const char *paramSpec, int argc,  const char **argv )
+:
+	parameterArg(0), parameter(0),
+	state(noparam),
+	argOffset(0), curArg(0), iCurArg(1),
+	paramSpec(paramSpec), 
+	argc(argc), 
+	argv(argv)
+{
+}
+
+/* Check a single option. Returns false once the arg list is used up. Otherwise
+ * returns true with state set to match (parameter and parameterArg filled in),
+ * invalid (unknown option or missing argument) or noparam (plain arg in curArg). */
+bool ParamCheck::check()
+{
+	bool requiresParam;
+
+	if ( iCurArg >= argc ) {            /* Off the end of the arg list. */
+		state = noparam;
+		return false;
+	}
+
+	if ( argOffset != 0 && *argOffset == 0 ) {
+		/* We are at the end of an arg string. */
+		iCurArg += 1;
+		if ( iCurArg >= argc ) {
+			state = noparam;
+			return false;
+		}
+		argOffset = 0;
+	}
+
+	if ( argOffset == 0 ) {
+		/* Set the current arg. */
+		curArg = argv[iCurArg];
+
+		/* We are at the beginning of an arg string. */
+		if ( argv[iCurArg] == 0 ||        /* Argv[iCurArg] is null. */
+			 argv[iCurArg][0] != '-' ||   /* Not a param. */
+			 argv[iCurArg][1] == 0 ) {    /* Only a dash. */
+			parameter = 0;
+			parameterArg = 0;
+
+			iCurArg += 1;
+			state = noparam;
+			return true;
+		}
+		argOffset = argv[iCurArg] + 1;
+	}
+
+	/* Get the arg char. */
+	char argChar = *argOffset;
+	
+	/* Loop over all the parms and look for a match. */
+	const char *pSpec = paramSpec;
+	while ( *pSpec != 0 ) {
+		char pSpecChar = *pSpec;
+
+		/* If there is a ':' following the char then
+		 * it requires a parm.  If a parm is required
+		 * then move ahead two in the parmspec. Otherwise
+		 * move ahead one in the parm spec. */
+		if ( pSpec[1] == ':' ) {
+			requiresParam = true;
+			pSpec += 2;
+		}
+		else {
+			requiresParam = false;
+			pSpec += 1;
+		}
+
+		/* Do we have a match. */
+		if ( argChar == pSpecChar ) {
+			if ( requiresParam ) {
+				if ( argOffset[1] == 0 ) {
+					/* The param must follow. */
+					if ( iCurArg + 1 == argc ) {
+						/* We are the last arg so there
+						 * cannot be a parameter to it. */
+						parameter = argChar;
+						parameterArg = 0;
+						iCurArg += 1;
+						argOffset = 0;
+						state = invalid;
+						return true;
+					}
+					else {
+						/* the parameter to the arg is the next arg. */
+						parameter = pSpecChar;
+						parameterArg = argv[iCurArg + 1];
+						iCurArg += 2;
+						argOffset = 0;
+						state = match;
+						return true;
+					}
+				}
+				else {
+					/* The param for the arg is built in. */
+					parameter = pSpecChar;
+					parameterArg = argOffset + 1;
+					iCurArg += 1;
+					argOffset = 0;
+					state = match;
+					return true;
+				}
+			}
+			else {
+				/* Good, we matched the parm and no
+				 * arg is required. */
+				parameter = pSpecChar;
+				parameterArg = 0;
+				argOffset += 1;
+				state = match;
+				return true;
+			}
+		}
+	}
+
+	/* We did not find a match. Bad Argument. */
+	parameter = argChar;
+	parameterArg = 0;
+	argOffset += 1;
+	state = invalid;
+	return true;
+}
+
+/* Scans a string looking for the file extension. If there is a file
+ * extension then pointer returned points to inside the string
+ * passed in, at the dot. Otherwise returns null. */
+const char *findFileExtension( const char *stemFile )
+{
+	/* Begin one past the last character rather than on it. With an empty
+	 * string the loop below is then skipped, where starting on the last
+	 * character would form the invalid pointer stemFile - 1 and read it. */
+	const char *ppos = stemFile + strlen(stemFile);
+
+	/* Scan backwards from the end looking for the first dot. */
+	while ( ppos != stemFile ) {
+		ppos--;
+
+		/* Getting to the beginning of the string means we did not find an
+		 * extension. A dot in the first position does not count as one. */
+		if ( ppos == stemFile )
+			return 0;
+
+		/* If we hit a / before a dot then there is no extension. Done. */
+		if ( *ppos == '/' )
+			return 0;
+
+		if ( *ppos == '.' )
+			return ppos;
+	}
+
+	/* Only the empty string gets here. */
+	return 0;
+}
+
+/* Build a file name by swapping the extension of stemFile for suffix. When
+ * stemFile has no extension the suffix is simply appended. The result is
+ * allocated with new[]; releasing it is left to the caller. */
+char *fileNameFromStem( const char *stemFile, const char *suffix )
+{
+	int stemLen = strlen( stemFile );
+	assert( stemLen > 0 );
+
+	/* Keep only the part of the stem that precedes the extension's dot. */
+	const char *ext = findFileExtension( stemFile );
+	if ( ext )
+		stemLen = ext - stemFile;
+
+	/* Room for the kept stem, the suffix and the terminating null. */
+	char *fileName = new char[ stemLen + strlen( suffix ) + 1 ];
+
+	/* strcpy supplies the terminator that strncpy leaves off. */
+	strncpy( fileName, stemFile, stemLen );
+	strcpy( fileName + stemLen, suffix );
+	return fileName;
+}
+
+
diff --git a/colm/common.h b/colm/common.h
new file mode 100644
index 00000000..53ce443d
--- /dev/null
+++ b/colm/common.h
@@ -0,0 +1,283 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _COMMON_H
+#define _COMMON_H
+
+#include <fstream>
+#include <climits>
+
+enum MarkType
+{
+	MarkEnter,
+	MarkLeave
+};
+
+typedef unsigned long long Size;
+
+struct Key
+{
+private:
+	long key;	/* Raw value; keyOps->isSigned decides how it is compared. */
+
+public:
+	friend inline Key operator+(const Key key1, const Key key2);
+	friend inline Key operator-(const Key key1, const Key key2);
+	friend inline Key operator/(const Key key1, const Key key2);
+	friend inline long operator&(const Key key1, const Key key2);
+
+	friend inline bool operator<( const Key key1, const Key key2 );
+	friend inline bool operator<=( const Key key1, const Key key2 );
+	friend inline bool operator>( const Key key1, const Key key2 );
+	friend inline bool operator>=( const Key key1, const Key key2 );
+	friend inline bool operator==( const Key key1, const Key key2 );
+	friend inline bool operator!=( const Key key1, const Key key2 );
+
+	friend struct KeyOps;
+	
+	Key( ) {}	/* Leaves key uninitialized. */
+	Key( const Key &key ) : key(key.key) {}
+	Key( long key ) : key(key) {}
+
+	/* Returns the value used to represent the key. This value must be
+	 * interpreted based on signedness. */
+	long getVal() const { return key; };
+
+	/* Returns the key cast to a long long. This form of the key does not
+	 * require any signedness interpretation. */
+	long long getLongLong() const;
+
+	bool isUpper() const { return ( 'A' <= key && key <= 'Z' ); }
+	bool isLower() const { return ( 'a' <= key && key <= 'z' ); }
+	bool isPrintable() const { return ( 32 <= key && key < 127 ); }
+
+	Key toUpper() const	/* No range check is made on key. */
+		{ return Key( 'A' + ( key - 'a' ) ); }
+	Key toLower() const	/* No range check is made on key. */
+		{ return Key( 'a' + ( key - 'A' ) ); }
+
+	void operator+=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key += other.key;
+	}
+
+	void operator-=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key -= other.key;
+	}
+
+	void operator|=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key |= other.key;
+	}
+
+	/* Decrement and increment. Needed only for ranges. */
+	inline void decrement();
+	inline void increment();
+};
+
+struct HostType
+{
+	char *data1;           /* First word of the type name, e.g. "unsigned". */
+	char *data2;           /* Second word of the name, null for one-word names. */
+	bool isSigned;
+	long long minVal;      /* Smallest value of the type. */
+	long long maxVal;      /* Largest value of the type. */
+	unsigned int size;     /* Size of the type in bytes. */
+};
+
+struct HostLang
+{
+	HostType *hostTypes;        /* Table of the language's integer types. */
+	int numHostTypes;           /* Number of entries in hostTypes. */
+	HostType *defaultAlphType;  /* Entry of hostTypes used as the default alphabet type. */
+	bool explicitUnsigned;      /* NOTE(review): meaning not visible here; true for C and D, false for Java and Ruby. */
+};
+
+
+/* Target language. */
+enum HostLangType
+{
+	CCode,
+	DCode,
+	JavaCode,
+	RubyCode
+};
+
+extern HostLang *hostLang;
+extern HostLangType hostLangType;
+
+extern HostLang hostLangC;
+extern HostLang hostLangD;
+extern HostLang hostLangJava;
+extern HostLang hostLangRuby;
+
+/* An abstraction of the key operators that manages key operations such as
+ * comparison and increment according to the signedness of the key. */
+struct KeyOps
+{
+	/* Default to signed alphabet. */
+	KeyOps() : isSigned(true), alphType(0) {}
+
+	/* Signedness chosen by the caller. alphType is cleared so that it is
+	 * never left uninitialized; minKey and maxKey are not set here. */
+	KeyOps( bool isSigned ) 
+		:isSigned(isSigned), alphType(0) {}
+
+	bool isSigned;
+	Key minKey, maxKey;
+	HostType *alphType;
+
+	/* Adopt alphType as the alphabet type: take over its signedness and use
+	 * its minVal and maxVal as minKey and maxKey. */
+	void setAlphType( HostType *alphType )
+	{
+		this->alphType = alphType;
+		isSigned = alphType->isSigned;
+		if ( isSigned ) {
+			minKey = (long) alphType->minVal;
+			maxKey = (long) alphType->maxVal;
+		}
+		else {
+			minKey = (long) (unsigned long) alphType->minVal; 
+			maxKey = (long) (unsigned long) alphType->maxVal;
+		}
+	}
+
+	/* Number of keys in the inclusive range key1..key2. */
+	Size span( Key key1, Key key2 )
+	{
+		return isSigned ? 
+			(unsigned long long)(
+				(long long)key2.key - 
+				(long long)key1.key + 1) : 
+			(unsigned long long)(
+				(unsigned long)key2.key) - 
+				(unsigned long long)((unsigned long)key1.key) + 1;
+	}
+
+	/* Number of keys in the alphabet, from minKey through maxKey. */
+	Size alphSize() { return span( minKey, maxKey ); }
+
+	/* First type of hostLang, in table order, that can hold maxVal, or null. */
+	HostType *typeSubsumes( long long maxVal )
+	{
+		for ( int i = 0; i < hostLang->numHostTypes; i++ )
+			if ( maxVal <= hostLang->hostTypes[i].maxVal )
+				return hostLang->hostTypes + i;
+		return 0;
+	}
+
+	/* As above, but when isSigned is set only signed types are considered. */
+	HostType *typeSubsumes( bool isSigned, long long maxVal )
+	{
+		for ( int i = 0; i < hostLang->numHostTypes; i++ )
+			if ( ( !isSigned || hostLang->hostTypes[i].isSigned ) &&
+					maxVal <= hostLang->hostTypes[i].maxVal )
+				return hostLang->hostTypes + i;
+		return 0;
+	}
+};
+
+extern KeyOps *keyOps;
+
+/* Ordering comparisons. The stored value is compared as a signed long when
+ * keyOps->isSigned is set and as an unsigned long otherwise. */
+inline bool operator<( const Key key1, const Key key2 )
+{
+	if ( keyOps->isSigned ) return key1.key < key2.key;
+	return (unsigned long)key1.key < (unsigned long)key2.key;
+}
+
+inline bool operator<=( const Key key1, const Key key2 )
+{
+	if ( keyOps->isSigned ) return key1.key <= key2.key;
+	return (unsigned long)key1.key <= (unsigned long)key2.key;
+}
+
+inline bool operator>( const Key key1, const Key key2 )
+{
+	if ( keyOps->isSigned ) return key1.key > key2.key;
+	return (unsigned long)key1.key > (unsigned long)key2.key;
+}
+
+inline bool operator>=( const Key key1, const Key key2 )
+{
+	if ( keyOps->isSigned ) return key1.key >= key2.key;
+	return (unsigned long)key1.key >= (unsigned long)key2.key;
+}
+
+/* Equality looks only at the stored value, so it does not depend on the
+ * signedness. */
+inline bool operator==( const Key key1, const Key key2 )
+	{ return key1.key == key2.key; }
+
+inline bool operator!=( const Key key1, const Key key2 )
+	{ return key1.key != key2.key; }
+
+/* Step the key down by one. Needed only for ranges. */
+inline void Key::decrement()
+{
+	key = keyOps->isSigned ? key - 1 : ((unsigned long)key)-1;
+}
+
+/* Step the key up by one. Needed only for ranges. */
+inline void Key::increment()
+{
+	key = keyOps->isSigned ? key+1 : ((unsigned long)key)+1;
+}
+
+inline long long Key::getLongLong() const	/* Widens per keyOps->isSigned. */
+{
+	return keyOps->isSigned ? (long long)key : (long long)(unsigned long)key;
+}
+
+inline Key operator+(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned; this is plain long addition. */
+	return Key( key1.key + key2.key );
+}
+
+inline Key operator-(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned; this is plain long subtraction. */
+	return Key( key1.key - key2.key );
+}
+
+inline long operator&(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. Note the result is a long, not a Key. */
+	return key1.key & key2.key;
+}
+
+inline Key operator/(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned; this is plain long division. */
+	return key1.key / key2.key;
+}
+
+const char *findFileExtension( const char *stemFile );
+char *fileNameFromStem( const char *stemFile, const char *suffix );
+
+#endif /* _COMMON_H */
diff --git a/colm/config.h.in b/colm/config.h.in
new file mode 100644
index 00000000..c370f3b6
--- /dev/null
+++ b/colm/config.h.in
@@ -0,0 +1,50 @@
+/*
+ *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _CONFIG_H
+#define _CONFIG_H
+
+/* Programs. */
+#undef GDC
+#undef GOBJC
+#undef CXX
+#undef CC
+#undef JAVAC
+#undef TXL
+#undef RUBY
+
+/* Configuration */
+#undef COLM_LOG
+#undef COLM_LOG_BYTECODE
+#undef COLM_LOG_PARSE
+#undef COLM_LOG_MATCH
+#undef COLM_LOG_COMPILE
+
+/* If COLM_LOG is defined then turn on all logging options. */
+#ifdef COLM_LOG
+#define COLM_LOG_BYTECODE 1
+#define COLM_LOG_PARSE 1
+#define COLM_LOG_MATCH 1
+#define COLM_LOG_COMPILE 1
+#endif
+
+
+#endif /* _CONFIG_H */
diff --git a/colm/pcheck.h b/colm/pcheck.h
new file mode 100644
index 00000000..df3706c2
--- /dev/null
+++ b/colm/pcheck.h
@@ -0,0 +1,48 @@
+/*
+ *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ */
+
+/*  This file is part of Ragel.
+ *
+ *  Ragel is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Ragel is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Ragel; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _PCHECK_H
+#define _PCHECK_H
+
+class ParamCheck
+{
+public:
+	ParamCheck( const char *paramSpec, int argc, const char **argv );
+
+	bool check();             /* Examine the next option; false when args run out. */
+
+	const char *parameterArg; /* The argument to the parameter, or null. */
+	char parameter;           /* The parameter (option character) matched. */
+	enum { match, invalid, noparam } state;
+
+	const char *argOffset;    /* If we are reading params inside an
+	                           * arg this points to the offset. */
+
+	const char *curArg;       /* Pointer to the current arg. */
+	int iCurArg;              /* Index of the current arg. */
+
+private:
+	const char *paramSpec;    /* Parameter spec supplied by the coder. */
+	int argc;                 /* Argument data from the command line. */
+	const char **argv;
+};
+
+#endif /* _PCHECK_H */
diff --git a/common/Makefile.in b/common/Makefile.in
deleted file mode 100644
index 47dc3567..00000000
--- a/common/Makefile.in
+++ /dev/null
@@ -1,67 +0,0 @@
-#
-#   Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
-#
-
-#   This file is part of Ragel.
-#
-#   Ragel is free software; you can redistribute it and/or modify
-#   it under the terms of the GNU General Public License as published by
-#   the Free Software Foundation; either version 2 of the License, or
-#   (at your option) any later version.
-#
-#   Ragel is distributed in the hope that it will be useful,
-#   but WITHOUT ANY WARRANTY; without even the implied warranty of
-#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#   GNU General Public License for more details.
-#
-#   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
-#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
-
-INCS += 
-DEFS +=
-
-CFLAGS += -g -Wall
-LDFLAGS +=
-
-CC_SRCS = common.cpp
-
-GEN_SRC = version.h
-
-#*************************************
-
-# Programs
-CXX = @CXX@
-
-# Get objects and dependencies from sources.
-OBJS = $(CC_SRCS:%.cpp=%.o)
-DEPS = $(CC_SRCS:%.cpp=.%.d)
-
-# Get the version info.
-include ../version.mk
-
-# rules
-
-all: common.a
-
-common.a: $(GEN_SRC) $(OBJS)
-	ar -cr $@ $(OBJS) 
-
-version.h: ../version.mk
-	echo '#define VERSION "$(VERSION)"' > version.h
-	echo '#define PUBDATE "$(PUBDATE)"' >> version.h
-
-%.o: %.cpp
-	@$(CXX) -M $(DEFS) $(INCS) $< > .$*.d
-	$(CXX) -c $(CFLAGS) $(DEFS) $(INCS) -o $@ $<
-
-distclean: clean
-	rm -f Makefile config.h
-
-clean:
-	rm -f tags version.h .*.d *.o common.a
-
-install:
-	@true
-
--include $(DEPS)
diff --git a/common/buffer.h b/common/buffer.h
deleted file mode 100644
index 99c4e82d..00000000
--- a/common/buffer.h
+++ /dev/null
@@ -1,55 +0,0 @@
-/*
- *  Copyright 2003 Adrian Thurston <thurston@cs.queensu.ca>
- */
-
-/*  This file is part of Ragel.
- *
- *  Ragel is free software; you can redistribute it and/or modify
- *  it under the terms of the GNU General Public License as published by
- *  the Free Software Foundation; either version 2 of the License, or
- *  (at your option) any later version.
- * 
- *  Ragel is distributed in the hope that it will be useful,
- *  but WITHOUT ANY WARRANTY; without even the implied warranty of
- *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- *  GNU General Public License for more details.
- * 
- *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
- *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
- */
-
-#ifndef _BUFFER_H
-#define _BUFFER_H
-
-#define BUFFER_INITIAL_SIZE 4096
-
-/* An automatically grown buffer for collecting tokens. Always reuses space;
- * never down resizes. */
-struct Buffer
-{
-	Buffer()
-	{
-		data = (char*) malloc( BUFFER_INITIAL_SIZE );
-		allocated = BUFFER_INITIAL_SIZE;
-		length = 0;
-	}
-	~Buffer() { free(data); }
-
-	void append( char p )
-	{
-		if ( length == allocated ) {
-			allocated *= 2;
-			data = (char*) realloc( data, allocated );
-		}
-		data[length++] = p;
-	}
-		
-	void clear() { length = 0; }
-
-	char *data;
-	int allocated;
-	int length;
-};
-
-#endif /* _BUFFER_H */
diff --git a/common/common.cpp b/common/common.cpp
deleted file mode 100644
index e6b0a70b..00000000
--- a/common/common.cpp
+++ /dev/null
@@ -1,257 +0,0 @@
-/*
- *  Copyright 2006-2007 Adrian Thurston <thurston@cs.queensu.ca>
- */
-
-/*  This file is part of Ragel.
- *
- *  Ragel is free software; you can redistribute it and/or modify
- *  it under the terms of the GNU General Public License as published by
- *  the Free Software Foundation; either version 2 of the License, or
- *  (at your option) any later version.
- * 
- *  Ragel is distributed in the hope that it will be useful,
- *  but WITHOUT ANY WARRANTY; without even the implied warranty of
- *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- *  GNU General Public License for more details.
- * 
- *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
- *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
- */
-
-#include "pcheck.h"
-#include "common.h"
-#include <assert.h>
-
-HostType hostTypesC[] =
-{
-	{ "char",     0,       true,   CHAR_MIN,  CHAR_MAX,   sizeof(char) },
-	{ "unsigned", "char",  false,  0,         UCHAR_MAX,  sizeof(unsigned char) },
-	{ "short",    0,       true,   SHRT_MIN,  SHRT_MAX,   sizeof(short) },
-	{ "unsigned", "short", false,  0,         USHRT_MAX,  sizeof(unsigned short) },
-	{ "int",      0,       true,   INT_MIN,   INT_MAX,    sizeof(int) },
-	{ "unsigned", "int",   false,  0,         UINT_MAX,   sizeof(unsigned int) },
-	{ "long",     0,       true,   LONG_MIN,  LONG_MAX,   sizeof(long) },
-	{ "unsigned", "long",  false,  0,         ULONG_MAX,  sizeof(unsigned long) }
-};
-
-HostType hostTypesD[] =
-{
-	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
-	{ "ubyte",    0,  false,  0,         UCHAR_MAX,   1 },
-	{ "char",     0,  false,  0,         UCHAR_MAX,   1 },
-	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
-	{ "ushort",   0,  false,  0,         USHRT_MAX,   2 },
-	{ "wchar",    0,  false,  0,         USHRT_MAX,   2 },
-	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
-	{ "uint",     0,  false,  0,         UINT_MAX,    4 },
-	{ "dchar",    0,  false,  0,         UINT_MAX,    4 }
-};
-
-HostType hostTypesJava[] = 
-{
-	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
-	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
-	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
-	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
-};
-
-HostType hostTypesRuby[] = 
-{
-	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
-	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
-	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
-	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
-};
-
-HostLang hostLangC =    { hostTypesC,    8, hostTypesC+0,    true };
-HostLang hostLangD =    { hostTypesD,    9, hostTypesD+2,    true };
-HostLang hostLangJava = { hostTypesJava, 4, hostTypesJava+2, false };
-HostLang hostLangRuby = { hostTypesRuby, 4, hostTypesRuby+2, false };
-
-HostLang *hostLang = &hostLangC;
-HostLangType hostLangType = CCode;
-
-/* Construct a new parameter checker with for paramSpec. */
-ParamCheck::ParamCheck( const char *paramSpec, int argc,  const char **argv )
-:
-	state(noparam),
-	argOffset(0),
-	curArg(0),
-	iCurArg(1),
-	paramSpec(paramSpec), 
-	argc(argc), 
-	argv(argv)
-{
-}
-
-/* Check a single option. Returns the index of the next parameter.  Sets p to
- * the arg character if valid, 0 otherwise.  Sets parg to the parameter arg if
- * there is one, NULL otherwise. */
-bool ParamCheck::check()
-{
-	bool requiresParam;
-
-	if ( iCurArg >= argc ) {            /* Off the end of the arg list. */
-		state = noparam;
-		return false;
-	}
-
-	if ( argOffset != 0 && *argOffset == 0 ) {
-		/* We are at the end of an arg string. */
-		iCurArg += 1;
-		if ( iCurArg >= argc ) {
-			state = noparam;
-			return false;
-		}
-		argOffset = 0;
-	}
-
-	if ( argOffset == 0 ) {
-		/* Set the current arg. */
-		curArg = argv[iCurArg];
-
-		/* We are at the beginning of an arg string. */
-		if ( argv[iCurArg] == 0 ||        /* Argv[iCurArg] is null. */
-			 argv[iCurArg][0] != '-' ||   /* Not a param. */
-			 argv[iCurArg][1] == 0 ) {    /* Only a dash. */
-			parameter = 0;
-			parameterArg = 0;
-
-			iCurArg += 1;
-			state = noparam;
-			return true;
-		}
-		argOffset = argv[iCurArg] + 1;
-	}
-
-	/* Get the arg char. */
-	char argChar = *argOffset;
-	
-	/* Loop over all the parms and look for a match. */
-	const char *pSpec = paramSpec;
-	while ( *pSpec != 0 ) {
-		char pSpecChar = *pSpec;
-
-		/* If there is a ':' following the char then
-		 * it requires a parm.  If a parm is required
-		 * then move ahead two in the parmspec. Otherwise
-		 * move ahead one in the parm spec. */
-		if ( pSpec[1] == ':' ) {
-			requiresParam = true;
-			pSpec += 2;
-		}
-		else {
-			requiresParam = false;
-			pSpec += 1;
-		}
-
-		/* Do we have a match. */
-		if ( argChar == pSpecChar ) {
-			if ( requiresParam ) {
-				if ( argOffset[1] == 0 ) {
-					/* The param must follow. */
-					if ( iCurArg + 1 == argc ) {
-						/* We are the last arg so there
-						 * cannot be a parameter to it. */
-						parameter = argChar;
-						parameterArg = 0;
-						iCurArg += 1;
-						argOffset = 0;
-						state = invalid;
-						return true;
-					}
-					else {
-						/* the parameter to the arg is the next arg. */
-						parameter = pSpecChar;
-						parameterArg = argv[iCurArg + 1];
-						iCurArg += 2;
-						argOffset = 0;
-						state = match;
-						return true;
-					}
-				}
-				else {
-					/* The param for the arg is built in. */
-					parameter = pSpecChar;
-					parameterArg = argOffset + 1;
-					iCurArg += 1;
-					argOffset = 0;
-					state = match;
-					return true;
-				}
-			}
-			else {
-				/* Good, we matched the parm and no
-				 * arg is required. */
-				parameter = pSpecChar;
-				parameterArg = 0;
-				argOffset += 1;
-				state = match;
-				return true;
-			}
-		}
-	}
-
-	/* We did not find a match. Bad Argument. */
-	parameter = argChar;
-	parameterArg = 0;
-	argOffset += 1;
-	state = invalid;
-	return true;
-}
-
-/* Scans a string looking for the file extension. If there is a file
- * extension then pointer returned points to inside the string
- * passed in. Otherwise returns null. */
-const char *findFileExtension( const char *stemFile )
-{
-	const char *ppos = stemFile + strlen(stemFile) - 1;
-
-	/* Scan backwards from the end looking for the first dot.
-	 * If we encounter a '/' before the first dot, then stop the scan. */
-	while ( 1 ) {
-		/* If we found a dot or got to the beginning of the string then
-		 * we are done. */
-		if ( ppos == stemFile || *ppos == '.' )
-			break;
-
-		/* If we hit a / then there is no extension. Done. */
-		if ( *ppos == '/' ) {
-			ppos = stemFile;
-			break;
-		}
-		ppos--;
-	} 
-
-	/* If we got to the front of the string then bail we 
-	 * did not find an extension  */
-	if ( ppos == stemFile )
-		ppos = 0;
-
-	return ppos;
-}
-
-/* Make a file name from a stem. Removes the old filename suffix and
- * replaces it with a new one. Returns a newed up string. */
-char *fileNameFromStem( const char *stemFile, const char *suffix )
-{
-	int len = strlen( stemFile );
-	assert( len > 0 );
-
-	/* Get the extension. */
-	const char *ppos = findFileExtension( stemFile );
-
-	/* If an extension was found, then shorten what we think the len is. */
-	if ( ppos != 0 )
-		len = ppos - stemFile;
-
-	/* Make the return string from the stem and the suffix. */
-	char *retVal = new char[ len + strlen( suffix ) + 1 ];
-	strncpy( retVal, stemFile, len );
-	strcpy( retVal + len, suffix );
-
-	return retVal;
-}
-
-
diff --git a/common/common.h b/common/common.h
deleted file mode 100644
index 53ce443d..00000000
--- a/common/common.h
+++ /dev/null
@@ -1,283 +0,0 @@
-/*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
- */
-
-/*  This file is part of Ragel.
- *
- *  Ragel is free software; you can redistribute it and/or modify
- *  it under the terms of the GNU General Public License as published by
- *  the Free Software Foundation; either version 2 of the License, or
- *  (at your option) any later version.
- * 
- *  Ragel is distributed in the hope that it will be useful,
- *  but WITHOUT ANY WARRANTY; without even the implied warranty of
- *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- *  GNU General Public License for more details.
- * 
- *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
- *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
- */
-
-#ifndef _COMMON_H
-#define _COMMON_H
-
-#include <fstream>
-#include <climits>
-
-enum MarkType
-{
-	MarkEnter,
-	MarkLeave
-};
-
-typedef unsigned long long Size;
-
-struct Key
-{
-private:
-	long key;
-
-public:
-	friend inline Key operator+(const Key key1, const Key key2);
-	friend inline Key operator-(const Key key1, const Key key2);
-	friend inline Key operator/(const Key key1, const Key key2);
-	friend inline long operator&(const Key key1, const Key key2);
-
-	friend inline bool operator<( const Key key1, const Key key2 );
-	friend inline bool operator<=( const Key key1, const Key key2 );
-	friend inline bool operator>( const Key key1, const Key key2 );
-	friend inline bool operator>=( const Key key1, const Key key2 );
-	friend inline bool operator==( const Key key1, const Key key2 );
-	friend inline bool operator!=( const Key key1, const Key key2 );
-
-	friend struct KeyOps;
-	
-	Key( ) {}
-	Key( const Key &key ) : key(key.key) {}
-	Key( long key ) : key(key) {}
-
-	/* Returns the value used to represent the key. This value must be
-	 * interpreted based on signedness. */
-	long getVal() const { return key; };
-
-	/* Returns the key casted to a long long. This form of the key does not
-	 * require and signedness interpretation. */
-	long long getLongLong() const;
-
-	bool isUpper() const { return ( 'A' <= key && key <= 'Z' ); }
-	bool isLower() const { return ( 'a' <= key && key <= 'z' ); }
-	bool isPrintable() const { return ( 32 <= key && key < 127 ); }
-
-	Key toUpper() const
-		{ return Key( 'A' + ( key - 'a' ) ); }
-	Key toLower() const
-		{ return Key( 'a' + ( key - 'A' ) ); }
-
-	void operator+=( const Key other )
-	{
-		/* FIXME: must be made aware of isSigned. */
-		key += other.key;
-	}
-
-	void operator-=( const Key other )
-	{
-		/* FIXME: must be made aware of isSigned. */
-		key -= other.key;
-	}
-
-	void operator|=( const Key other )
-	{
-		/* FIXME: must be made aware of isSigned. */
-		key |= other.key;
-	}
-
-	/* Decrement. Needed only for ranges. */
-	inline void decrement();
-	inline void increment();
-};
-
-struct HostType
-{
-	char *data1;
-	char *data2;
-	bool isSigned;
-	long long minVal;
-	long long maxVal;
-	unsigned int size;
-};
-
-struct HostLang
-{
-	HostType *hostTypes;
-	int numHostTypes;
-	HostType *defaultAlphType;
-	bool explicitUnsigned;
-};
-
-
-/* Target language. */
-enum HostLangType
-{
-	CCode,
-	DCode,
-	JavaCode,
-	RubyCode
-};
-
-extern HostLang *hostLang;
-extern HostLangType hostLangType;
-
-extern HostLang hostLangC;
-extern HostLang hostLangD;
-extern HostLang hostLangJava;
-extern HostLang hostLangRuby;
-
-/* An abstraction of the key operators that manages key operations such as
- * comparison and increment according the signedness of the key. */
-struct KeyOps
-{
-	/* Default to signed alphabet. */
-	KeyOps() :
-		isSigned(true),
-		alphType(0)
-	{}
-
-	/* Default to signed alphabet. */
-	KeyOps( bool isSigned ) 
-		:isSigned(isSigned) {}
-
-	bool isSigned;
-	Key minKey, maxKey;
-	HostType *alphType;
-
-	void setAlphType( HostType *alphType )
-	{
-		this->alphType = alphType;
-		isSigned = alphType->isSigned;
-		if ( isSigned ) {
-			minKey = (long) alphType->minVal;
-			maxKey = (long) alphType->maxVal;
-		}
-		else {
-			minKey = (long) (unsigned long) alphType->minVal; 
-			maxKey = (long) (unsigned long) alphType->maxVal;
-		}
-	}
-
-	/* Compute the distance between two keys. */
-	Size span( Key key1, Key key2 )
-	{
-		return isSigned ? 
-			(unsigned long long)(
-				(long long)key2.key - 
-				(long long)key1.key + 1) : 
-			(unsigned long long)(
-				(unsigned long)key2.key) - 
-				(unsigned long long)((unsigned long)key1.key) + 1;
-	}
-
-	Size alphSize()
-		{ return span( minKey, maxKey ); }
-
-	HostType *typeSubsumes( long long maxVal )
-	{
-		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
-			if ( maxVal <= hostLang->hostTypes[i].maxVal )
-				return hostLang->hostTypes + i;
-		}
-		return 0;
-	}
-
-	HostType *typeSubsumes( bool isSigned, long long maxVal )
-	{
-		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
-			if ( ( isSigned && hostLang->hostTypes[i].isSigned || !isSigned ) &&
-					maxVal <= hostLang->hostTypes[i].maxVal )
-				return hostLang->hostTypes + i;
-		}
-		return 0;
-	}
-};
-
-extern KeyOps *keyOps;
-
-inline bool operator<( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ? key1.key < key2.key : 
-		(unsigned long)key1.key < (unsigned long)key2.key;
-}
-
-inline bool operator<=( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ?  key1.key <= key2.key : 
-		(unsigned long)key1.key <= (unsigned long)key2.key;
-}
-
-inline bool operator>( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ? key1.key > key2.key : 
-		(unsigned long)key1.key > (unsigned long)key2.key;
-}
-
-inline bool operator>=( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ? key1.key >= key2.key : 
-		(unsigned long)key1.key >= (unsigned long)key2.key;
-}
-
-inline bool operator==( const Key key1, const Key key2 )
-{
-	return key1.key == key2.key;
-}
-
-inline bool operator!=( const Key key1, const Key key2 )
-{
-	return key1.key != key2.key;
-}
-
-/* Decrement. Needed only for ranges. */
-inline void Key::decrement()
-{
-	key = keyOps->isSigned ? key - 1 : ((unsigned long)key)-1;
-}
-
-/* Increment. Needed only for ranges. */
-inline void Key::increment()
-{
-	key = keyOps->isSigned ? key+1 : ((unsigned long)key)+1;
-}
-
-inline long long Key::getLongLong() const
-{
-	return keyOps->isSigned ? (long long)key : (long long)(unsigned long)key;
-}
-
-inline Key operator+(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return Key( key1.key + key2.key );
-}
-
-inline Key operator-(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return Key( key1.key - key2.key );
-}
-
-inline long operator&(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return key1.key & key2.key;
-}
-
-inline Key operator/(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return key1.key / key2.key;
-}
-
-const char *findFileExtension( const char *stemFile );
-char *fileNameFromStem( const char *stemFile, const char *suffix );
-
-#endif /* _COMMON_H */
diff --git a/common/config.h.in b/common/config.h.in
deleted file mode 100644
index c370f3b6..00000000
--- a/common/config.h.in
+++ /dev/null
@@ -1,50 +0,0 @@
-/*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
- */
-
-/*  This file is part of Ragel.
- *
- *  Ragel is free software; you can redistribute it and/or modify
- *  it under the terms of the GNU General Public License as published by
- *  the Free Software Foundation; either version 2 of the License, or
- *  (at your option) any later version.
- * 
- *  Ragel is distributed in the hope that it will be useful,
- *  but WITHOUT ANY WARRANTY; without even the implied warranty of
- *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- *  GNU General Public License for more details.
- * 
- *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
- *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
- */
-
-#ifndef _CONFIG_H
-#define _CONFIG_H
-
-/* Programs. */
-#undef GDC
-#undef GOBJC
-#undef CXX
-#undef CC
-#undef JAVAC
-#undef TXL
-#undef RUBY
-
-/* Configuration */
-#undef COLM_LOG
-#undef COLM_LOG_BYTECODE
-#undef COLM_LOG_PARSE
-#undef COLM_LOG_MATCH
-#undef COLM_LOG_COMPILE
-
-/* If COLM_LOG is defined then turn on all logging options. */
-#ifdef COLM_LOG
-#define COLM_LOG_BYTECODE 1
-#define COLM_LOG_PARSE 1
-#define COLM_LOG_MATCH 1
-#define COLM_LOG_COMPILE 1
-#endif
-
-
-#endif /* _CONFIG_H */
diff --git a/common/pcheck.h b/common/pcheck.h
deleted file mode 100644
index df3706c2..00000000
--- a/common/pcheck.h
+++ /dev/null
@@ -1,48 +0,0 @@
-/*
- *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
- */
-
-/*  This file is part of Ragel.
- *
- *  Ragel is free software; you can redistribute it and/or modify
- *  it under the terms of the GNU General Public License as published by
- *  the Free Software Foundation; either version 2 of the License, or
- *  (at your option) any later version.
- * 
- *  Ragel is distributed in the hope that it will be useful,
- *  but WITHOUT ANY WARRANTY; without even the implied warranty of
- *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- *  GNU General Public License for more details.
- * 
- *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
- *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
- */
-
-#ifndef _PCHECK_H
-#define _PCHECK_H
-
-class ParamCheck
-{
-public:
-	ParamCheck( const char *paramSpec, int argc, const char **argv );
-
-	bool check();
-
-	const char *parameterArg; /* The argument to the parameter. */
-	char parameter;     /* The parameter matched. */
-	enum { match, invalid, noparam } state;
-
-	const char *argOffset;    /* If we are reading params inside an
-	                     * arg this points to the offset. */
-
-	const char *curArg;       /* Pointer to the current arg. */
-	int iCurArg;        /* Index to the current arg. */
-
-private:
-	const char *paramSpec;    /* Parameter spec supplied by the coder. */
-	int argc;           /* Arguement data from the command line. */
-	const char **argv;
-};
-
-#endif /* _PCHECK_H */
diff --git a/configure b/configure
index be493813..0b75c81e 100755
--- a/configure
+++ b/configure
@@ -1649,7 +1649,7 @@ ac_link='$CC -o conftest$ac_exeext $CFLAGS $CPPFLAGS $LDFLAGS conftest.$ac_ext $
 ac_compiler_gnu=$ac_cv_c_compiler_gnu
 
 
-ac_config_headers="$ac_config_headers common/config.h"
+ac_config_headers="$ac_config_headers colm/config.h"
 
 
 BUILD_PARSERS=true
@@ -3120,7 +3120,7 @@ fi
 
 fi # BUILD_PARSERS
 
-ac_config_files="$ac_config_files Makefile common/Makefile colm/Makefile"
+ac_config_files="$ac_config_files Makefile colm/Makefile"
 
 cat >confcache <<\_ACEOF
 # This file is a shell script that caches the results of configure
@@ -3674,9 +3674,8 @@ cat >>$CONFIG_STATUS <<\_ACEOF
 for ac_config_target in $ac_config_targets
 do
   case $ac_config_target in
-    "common/config.h") CONFIG_HEADERS="$CONFIG_HEADERS common/config.h" ;;
+    "colm/config.h") CONFIG_HEADERS="$CONFIG_HEADERS colm/config.h" ;;
     "Makefile") CONFIG_FILES="$CONFIG_FILES Makefile" ;;
-    "common/Makefile") CONFIG_FILES="$CONFIG_FILES common/Makefile" ;;
     "colm/Makefile") CONFIG_FILES="$CONFIG_FILES colm/Makefile" ;;
 
   *) { { echo "$as_me:$LINENO: error: invalid argument: $ac_config_target" >&5
diff --git a/configure.in b/configure.in
index 9a4d827d..575d2a7f 100644
--- a/configure.in
+++ b/configure.in
@@ -19,7 +19,7 @@ dnl   along with Colm; if not, write to the Free Software
 dnl   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
   
 AC_INIT(colm/main.cpp)
-AC_CONFIG_HEADER(common/config.h)
+AC_CONFIG_HEADER(colm/config.h)
 
 dnl Set to true if build system should generate parsers from ragel, kelbt, and
 dnl gperf sources. Set to false if generated files are included and not to be
@@ -74,6 +74,6 @@ fi
 fi # BUILD_PARSERS
 
 dnl write output files
-AC_OUTPUT(Makefile common/Makefile colm/Makefile)
+AC_OUTPUT(Makefile colm/Makefile)
 
 echo "configuration of colm complete"
-- 
cgit v1.2.1


From bc864c0e57f439ec24672de1918040ef8dfd7984 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 1 Nov 2008 19:34:16 +0000
Subject: Updated my email address. Fixed some GPL preambles: ragel -> colm.

---
 Makefile.in          |  2 +-
 aapl/astring.h       |  2 +-
 aapl/avlbasic.h      |  2 +-
 aapl/avlcommon.h     |  2 +-
 aapl/avlibasic.h     |  2 +-
 aapl/avlikeyless.h   |  2 +-
 aapl/avlimap.h       |  2 +-
 aapl/avlimel.h       |  2 +-
 aapl/avlimelkey.h    |  2 +-
 aapl/avliset.h       |  2 +-
 aapl/avlitree.h      |  2 +-
 aapl/avlkeyless.h    |  2 +-
 aapl/avlmap.h        |  2 +-
 aapl/avlmel.h        |  2 +-
 aapl/avlmelkey.h     |  2 +-
 aapl/avlset.h        |  2 +-
 aapl/avltree.h       |  2 +-
 aapl/bstcommon.h     |  2 +-
 aapl/bstmap.h        |  2 +-
 aapl/bstset.h        |  2 +-
 aapl/bsttable.h      |  2 +-
 aapl/bubblesort.h    |  2 +-
 aapl/compare.h       |  2 +-
 aapl/dlcommon.h      |  2 +-
 aapl/dlist.h         |  2 +-
 aapl/dlistmel.h      |  2 +-
 aapl/dlistval.h      |  2 +-
 aapl/insertsort.h    |  2 +-
 aapl/mergesort.h     |  2 +-
 aapl/quicksort.h     |  2 +-
 aapl/resize.h        |  2 +-
 aapl/sbstmap.h       |  2 +-
 aapl/sbstset.h       |  2 +-
 aapl/sbsttable.h     |  2 +-
 aapl/svector.h       |  2 +-
 aapl/table.h         |  2 +-
 aapl/vector.h        |  2 +-
 colm/Makefile.in     |  4 ++--
 colm/buffer.h        | 10 +++++-----
 colm/bytecode.cpp    |  2 +-
 colm/bytecode.h      |  2 +-
 colm/closure.cpp     |  2 +-
 colm/colm.h          |  2 +-
 colm/common.cpp      | 10 +++++-----
 colm/common.h        | 10 +++++-----
 colm/compile.cpp     |  2 +-
 colm/config.h.in     |  2 +-
 colm/dotgen.cpp      |  2 +-
 colm/dotgen.h        |  2 +-
 colm/fsmap.cpp       |  2 +-
 colm/fsmattach.cpp   |  2 +-
 colm/fsmbase.cpp     |  2 +-
 colm/fsmcodegen.cpp  |  2 +-
 colm/fsmcodegen.h    |  2 +-
 colm/fsmexec.cpp     |  2 +-
 colm/fsmgraph.cpp    |  2 +-
 colm/fsmgraph.h      |  2 +-
 colm/fsmmin.cpp      |  2 +-
 colm/fsmrun.cpp      |  2 +-
 colm/fsmrun.h        |  2 +-
 colm/fsmstate.cpp    |  2 +-
 colm/input.cpp       |  2 +-
 colm/input.h         |  2 +-
 colm/list.cpp        |  2 +-
 colm/lmparse.kh      |  2 +-
 colm/lmparse.kl      |  2 +-
 colm/lmscan.h        |  2 +-
 colm/lmscan.rl       |  2 +-
 colm/main.cpp        |  2 +-
 colm/map.cpp         |  2 +-
 colm/parsedata.cpp   |  2 +-
 colm/parsedata.h     |  2 +-
 colm/parsetree.cpp   |  2 +-
 colm/parsetree.h     |  2 +-
 colm/pcheck.h        | 10 +++++-----
 colm/pdabuild.cpp    |  2 +-
 colm/pdacodegen.cpp  |  2 +-
 colm/pdacodegen.h    |  2 +-
 colm/pdagraph.cpp    |  2 +-
 colm/pdagraph.h      |  2 +-
 colm/pdarun.cpp      |  2 +-
 colm/pdarun.h        |  2 +-
 colm/redbuild.cpp    |  2 +-
 colm/redbuild.h      |  2 +-
 colm/redfsm.cpp      |  2 +-
 colm/redfsm.h        |  2 +-
 colm/string.cpp      |  2 +-
 colm/tree.cpp        |  2 +-
 configure.in         |  2 +-
 test/Makefile        |  2 +-
 test/cxx/Makefile    |  2 +-
 test/diff/Makefile   |  2 +-
 test/dns/Makefile    |  2 +-
 test/html/Makefile   |  2 +-
 test/http/Makefile   |  2 +-
 test/python/Makefile |  2 +-
 test/ruby/Makefile   |  2 +-
 test/xml/Makefile    |  2 +-
 test/xml/xml.in      |  2 +-
 99 files changed, 116 insertions(+), 116 deletions(-)

diff --git a/Makefile.in b/Makefile.in
index f14d2473..c16f4e8d 100644
--- a/Makefile.in
+++ b/Makefile.in
@@ -1,5 +1,5 @@
 #
-#   Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Colm.
diff --git a/aapl/astring.h b/aapl/astring.h
index 37cc0cc4..251e9139 100644
--- a/aapl/astring.h
+++ b/aapl/astring.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlbasic.h b/aapl/avlbasic.h
index 780ef07a..ed826f38 100644
--- a/aapl/avlbasic.h
+++ b/aapl/avlbasic.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlcommon.h b/aapl/avlcommon.h
index fca4ea4f..6cb0b89a 100644
--- a/aapl/avlcommon.h
+++ b/aapl/avlcommon.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlibasic.h b/aapl/avlibasic.h
index a48faaa8..b916f742 100644
--- a/aapl/avlibasic.h
+++ b/aapl/avlibasic.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlikeyless.h b/aapl/avlikeyless.h
index 559b75af..0c606089 100644
--- a/aapl/avlikeyless.h
+++ b/aapl/avlikeyless.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002, 2003 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002, 2003 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlimap.h b/aapl/avlimap.h
index 38bfff75..c207dc52 100644
--- a/aapl/avlimap.h
+++ b/aapl/avlimap.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlimel.h b/aapl/avlimel.h
index 9442a997..bceddcd4 100644
--- a/aapl/avlimel.h
+++ b/aapl/avlimel.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlimelkey.h b/aapl/avlimelkey.h
index faa56e83..52d3a409 100644
--- a/aapl/avlimelkey.h
+++ b/aapl/avlimelkey.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avliset.h b/aapl/avliset.h
index cf5be365..9594e7d7 100644
--- a/aapl/avliset.h
+++ b/aapl/avliset.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlitree.h b/aapl/avlitree.h
index b053c96f..28394bb1 100644
--- a/aapl/avlitree.h
+++ b/aapl/avlitree.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlkeyless.h b/aapl/avlkeyless.h
index 30805136..fecf8bda 100644
--- a/aapl/avlkeyless.h
+++ b/aapl/avlkeyless.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002, 2003 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002, 2003 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlmap.h b/aapl/avlmap.h
index e4e15662..378613cd 100644
--- a/aapl/avlmap.h
+++ b/aapl/avlmap.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlmel.h b/aapl/avlmel.h
index 7bfad3b7..6d0deb7d 100644
--- a/aapl/avlmel.h
+++ b/aapl/avlmel.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlmelkey.h b/aapl/avlmelkey.h
index 9261cc83..5a66c9c2 100644
--- a/aapl/avlmelkey.h
+++ b/aapl/avlmelkey.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avlset.h b/aapl/avlset.h
index 224ee59f..579378a3 100644
--- a/aapl/avlset.h
+++ b/aapl/avlset.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/avltree.h b/aapl/avltree.h
index cf153595..2aa8e15f 100644
--- a/aapl/avltree.h
+++ b/aapl/avltree.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/bstcommon.h b/aapl/bstcommon.h
index bd390cdc..888717f3 100644
--- a/aapl/bstcommon.h
+++ b/aapl/bstcommon.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/bstmap.h b/aapl/bstmap.h
index 5154b86c..30c8e3c5 100644
--- a/aapl/bstmap.h
+++ b/aapl/bstmap.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/bstset.h b/aapl/bstset.h
index ce710ee0..4a0f88ee 100644
--- a/aapl/bstset.h
+++ b/aapl/bstset.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/bsttable.h b/aapl/bsttable.h
index 9898ebff..4e4babc3 100644
--- a/aapl/bsttable.h
+++ b/aapl/bsttable.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/bubblesort.h b/aapl/bubblesort.h
index 20e0f6f4..bcc2fb6a 100644
--- a/aapl/bubblesort.h
+++ b/aapl/bubblesort.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/compare.h b/aapl/compare.h
index 3d547b51..22937e9b 100644
--- a/aapl/compare.h
+++ b/aapl/compare.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/dlcommon.h b/aapl/dlcommon.h
index 5ce9bd30..91dff25f 100644
--- a/aapl/dlcommon.h
+++ b/aapl/dlcommon.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/dlist.h b/aapl/dlist.h
index eaf3e5d5..e34c8da4 100644
--- a/aapl/dlist.h
+++ b/aapl/dlist.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/dlistmel.h b/aapl/dlistmel.h
index 34331393..17de5432 100644
--- a/aapl/dlistmel.h
+++ b/aapl/dlistmel.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/dlistval.h b/aapl/dlistval.h
index 6f249995..4fcf33fa 100644
--- a/aapl/dlistval.h
+++ b/aapl/dlistval.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/insertsort.h b/aapl/insertsort.h
index eb3e2649..94aef7b2 100644
--- a/aapl/insertsort.h
+++ b/aapl/insertsort.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/mergesort.h b/aapl/mergesort.h
index d017511f..68b84260 100644
--- a/aapl/mergesort.h
+++ b/aapl/mergesort.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001, 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/quicksort.h b/aapl/quicksort.h
index 9bb96efd..bb6941ef 100644
--- a/aapl/quicksort.h
+++ b/aapl/quicksort.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/resize.h b/aapl/resize.h
index 24edc16e..9e8491aa 100644
--- a/aapl/resize.h
+++ b/aapl/resize.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/sbstmap.h b/aapl/sbstmap.h
index 9436a472..e3975a1c 100644
--- a/aapl/sbstmap.h
+++ b/aapl/sbstmap.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/sbstset.h b/aapl/sbstset.h
index fe8ddf6c..3487ee75 100644
--- a/aapl/sbstset.h
+++ b/aapl/sbstset.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/sbsttable.h b/aapl/sbsttable.h
index 100b87ec..348f1fd0 100644
--- a/aapl/sbsttable.h
+++ b/aapl/sbsttable.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/svector.h b/aapl/svector.h
index db3a5656..7dcae62c 100644
--- a/aapl/svector.h
+++ b/aapl/svector.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002, 2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/table.h b/aapl/table.h
index c1f2b7bd..c218281b 100644
--- a/aapl/table.h
+++ b/aapl/table.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001, 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/aapl/vector.h b/aapl/vector.h
index 835607b1..5e7f9e57 100644
--- a/aapl/vector.h
+++ b/aapl/vector.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002, 2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Aapl.
diff --git a/colm/Makefile.in b/colm/Makefile.in
index 21dba83c..3f9a3a0c 100644
--- a/colm/Makefile.in
+++ b/colm/Makefile.in
@@ -1,5 +1,5 @@
 #
-#   Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Colm.
@@ -115,7 +115,7 @@ endif
 	$(CXX) -c $(CFLAGS) $(DEFS) $(INCS) -o $@ $<
 
 distclean: clean
-	rm -f Makefile 
+	rm -f Makefile config.h
 
 ifeq ($(BUILD_PARSERS),true)
 EXTRA_CLEAN = $(GEN_SRC)
diff --git a/colm/buffer.h b/colm/buffer.h
index 99c4e82d..9039ad4b 100644
--- a/colm/buffer.h
+++ b/colm/buffer.h
@@ -1,21 +1,21 @@
 /*
- *  Copyright 2003 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2003 Adrian Thurston <thurston@complang.org>
  */
 
-/*  This file is part of Ragel.
+/*  This file is part of Colm.
  *
- *  Ragel is free software; you can redistribute it and/or modify
+ *  Colm is free software; you can redistribute it and/or modify
  *  it under the terms of the GNU General Public License as published by
  *  the Free Software Foundation; either version 2 of the License, or
  *  (at your option) any later version.
  * 
- *  Ragel is distributed in the hope that it will be useful,
+ *  Colm is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  * 
  *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
+ *  along with Colm; if not, write to the Free Software
  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
  */
 
diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 30a76deb..8cd1b98b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 0bdcab99..885d2f4b 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/closure.cpp b/colm/closure.cpp
index 3a10d030..b3c17b1c 100644
--- a/colm/closure.cpp
+++ b/colm/closure.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2005 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2005 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/colm.h b/colm/colm.h
index 9d906c49..b3a1d21e 100644
--- a/colm/colm.h
+++ b/colm/colm.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/common.cpp b/colm/common.cpp
index e6b0a70b..8b262bb5 100644
--- a/colm/common.cpp
+++ b/colm/common.cpp
@@ -1,21 +1,21 @@
 /*
- *  Copyright 2006-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2006-2007 Adrian Thurston <thurston@complang.org>
  */
 
-/*  This file is part of Ragel.
+/*  This file is part of Colm.
  *
- *  Ragel is free software; you can redistribute it and/or modify
+ *  Colm is free software; you can redistribute it and/or modify
  *  it under the terms of the GNU General Public License as published by
  *  the Free Software Foundation; either version 2 of the License, or
  *  (at your option) any later version.
  * 
- *  Ragel is distributed in the hope that it will be useful,
+ *  Colm is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  * 
  *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
+ *  along with Colm; if not, write to the Free Software
  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
  */
 
diff --git a/colm/common.h b/colm/common.h
index 53ce443d..688e60ee 100644
--- a/colm/common.h
+++ b/colm/common.h
@@ -1,21 +1,21 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
-/*  This file is part of Ragel.
+/*  This file is part of Colm.
  *
- *  Ragel is free software; you can redistribute it and/or modify
+ *  Colm is free software; you can redistribute it and/or modify
  *  it under the terms of the GNU General Public License as published by
  *  the Free Software Foundation; either version 2 of the License, or
  *  (at your option) any later version.
  * 
- *  Ragel is distributed in the hope that it will be useful,
+ *  Colm is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  * 
  *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
+ *  along with Colm; if not, write to the Free Software
  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
  */
 
diff --git a/colm/compile.cpp b/colm/compile.cpp
index ebe1fbdc..c0c31721 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/config.h.in b/colm/config.h.in
index c370f3b6..4dc1ce02 100644
--- a/colm/config.h.in
+++ b/colm/config.h.in
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Ragel.
diff --git a/colm/dotgen.cpp b/colm/dotgen.cpp
index d362d714..fd8af6b8 100644
--- a/colm/dotgen.cpp
+++ b/colm/dotgen.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/dotgen.h b/colm/dotgen.h
index c0cd31e7..e370866c 100644
--- a/colm/dotgen.h
+++ b/colm/dotgen.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmap.cpp b/colm/fsmap.cpp
index d843474f..bf190888 100644
--- a/colm/fsmap.cpp
+++ b/colm/fsmap.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002-2004 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002-2004 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmattach.cpp b/colm/fsmattach.cpp
index 201cdd76..31783ae0 100644
--- a/colm/fsmattach.cpp
+++ b/colm/fsmattach.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmbase.cpp b/colm/fsmbase.cpp
index 6db6e8da..823a7858 100644
--- a/colm/fsmbase.cpp
+++ b/colm/fsmbase.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
index 025c6dce..027ac3b5 100644
--- a/colm/fsmcodegen.cpp
+++ b/colm/fsmcodegen.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmcodegen.h b/colm/fsmcodegen.h
index ff804e88..3fbdd32d 100644
--- a/colm/fsmcodegen.h
+++ b/colm/fsmcodegen.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmexec.cpp b/colm/fsmexec.cpp
index 80370890..6f152d56 100644
--- a/colm/fsmexec.cpp
+++ b/colm/fsmexec.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmgraph.cpp b/colm/fsmgraph.cpp
index 6b955ad6..9ea082f0 100644
--- a/colm/fsmgraph.cpp
+++ b/colm/fsmgraph.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001, 2002, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001, 2002, 2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmgraph.h b/colm/fsmgraph.h
index 9c002077..2ab979f5 100644
--- a/colm/fsmgraph.h
+++ b/colm/fsmgraph.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmmin.cpp b/colm/fsmmin.cpp
index 901659f5..3abc4e88 100644
--- a/colm/fsmmin.cpp
+++ b/colm/fsmmin.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 9edb584b..bf6b0ce8 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 43f8cc8c..4d0dc58f 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/fsmstate.cpp b/colm/fsmstate.cpp
index d9df91ad..ab5bd93a 100644
--- a/colm/fsmstate.cpp
+++ b/colm/fsmstate.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2002 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/input.cpp b/colm/input.cpp
index d9a3c7e0..5434b2d6 100644
--- a/colm/input.cpp
+++ b/colm/input.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007, 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007, 2008 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/input.h b/colm/input.h
index e8e6655b..3796c554 100644
--- a/colm/input.h
+++ b/colm/input.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007, 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007, 2008 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/list.cpp b/colm/list.cpp
index 5d0fc7f1..8671fd51 100644
--- a/colm/list.cpp
+++ b/colm/list.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/lmparse.kh b/colm/lmparse.kh
index 598edf84..bac8a62d 100644
--- a/colm/lmparse.kh
+++ b/colm/lmparse.kh
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index ef04b711..06d19aa0 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/lmscan.h b/colm/lmscan.h
index 06ad6deb..8aa0d6da 100644
--- a/colm/lmscan.h
+++ b/colm/lmscan.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/lmscan.rl b/colm/lmscan.rl
index 6bbc5d00..d772a887 100644
--- a/colm/lmscan.rl
+++ b/colm/lmscan.rl
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2006-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2006-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/main.cpp b/colm/main.cpp
index 2e78efd7..75940d46 100644
--- a/colm/main.cpp
+++ b/colm/main.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/map.cpp b/colm/map.cpp
index 6327b301..0a98ae5f 100644
--- a/colm/map.cpp
+++ b/colm/map.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2008 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 54b55b23..5aab7886 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 801956f0..c16a6a2e 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/parsetree.cpp b/colm/parsetree.cpp
index 86284867..438193ee 100644
--- a/colm/parsetree.cpp
+++ b/colm/parsetree.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/parsetree.h b/colm/parsetree.h
index aceefea1..c4c6c9e8 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/pcheck.h b/colm/pcheck.h
index df3706c2..5be60426 100644
--- a/colm/pcheck.h
+++ b/colm/pcheck.h
@@ -1,21 +1,21 @@
 /*
- *  Copyright 2001, 2002 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001, 2002 Adrian Thurston <thurston@complang.org>
  */
 
-/*  This file is part of Ragel.
+/*  This file is part of Colm.
  *
- *  Ragel is free software; you can redistribute it and/or modify
+ *  Colm is free software; you can redistribute it and/or modify
  *  it under the terms of the GNU General Public License as published by
  *  the Free Software Foundation; either version 2 of the License, or
  *  (at your option) any later version.
  * 
- *  Ragel is distributed in the hope that it will be useful,
+ *  Colm is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  * 
  *  You should have received a copy of the GNU General Public License
- *  along with Ragel; if not, write to the Free Software
+ *  along with Colm; if not, write to the Free Software
  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
  */
 
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 7d01deca..243d8fe1 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index fee17754..915cb6e5 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2003-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2003-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/pdacodegen.h b/colm/pdacodegen.h
index 79e6677c..216bd9e3 100644
--- a/colm/pdacodegen.h
+++ b/colm/pdacodegen.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/pdagraph.cpp b/colm/pdagraph.cpp
index 22c77dcc..72fd8dfc 100644
--- a/colm/pdagraph.cpp
+++ b/colm/pdagraph.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001, 2002, 2005 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001, 2002, 2005 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/pdagraph.h b/colm/pdagraph.h
index 8442ac10..fc0e5ef7 100644
--- a/colm/pdagraph.h
+++ b/colm/pdagraph.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2005 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2005 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 35a60446..04e2adef 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 7f633abe..84ab5682 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/redbuild.cpp b/colm/redbuild.cpp
index feec178f..b1789460 100644
--- a/colm/redbuild.cpp
+++ b/colm/redbuild.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2005-2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2005-2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/redbuild.h b/colm/redbuild.h
index 15c00ca2..2bc2b2f9 100644
--- a/colm/redbuild.h
+++ b/colm/redbuild.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2005, 2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2005, 2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/redfsm.cpp b/colm/redfsm.cpp
index 033bc131..31995c91 100644
--- a/colm/redfsm.cpp
+++ b/colm/redfsm.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/redfsm.h b/colm/redfsm.h
index 161df043..32310552 100644
--- a/colm/redfsm.h
+++ b/colm/redfsm.h
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2001-2006 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/string.cpp b/colm/string.cpp
index 84500f92..d2452862 100644
--- a/colm/string.cpp
+++ b/colm/string.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2007 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/colm/tree.cpp b/colm/tree.cpp
index f7f83c26..76c92ae3 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -1,5 +1,5 @@
 /*
- *  Copyright 2008 Adrian Thurston <thurston@cs.queensu.ca>
+ *  Copyright 2008 Adrian Thurston <thurston@complang.org>
  */
 
 /*  This file is part of Colm.
diff --git a/configure.in b/configure.in
index 575d2a7f..e1d898c7 100644
--- a/configure.in
+++ b/configure.in
@@ -1,5 +1,5 @@
 dnl 
-dnl   Copyright 2001-2008 Adrian Thurston <thurston@cs.queensu.ca>
+dnl   Copyright 2001-2008 Adrian Thurston <thurston@complang.org>
 dnl
 
 dnl   This file is part of Colm.
diff --git a/test/Makefile b/test/Makefile
index 8e420541..f86db51d 100644
--- a/test/Makefile
+++ b/test/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Ragel.
diff --git a/test/cxx/Makefile b/test/cxx/Makefile
index a775f8c7..c19f557b 100644
--- a/test/cxx/Makefile
+++ b/test/cxx/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Ragel.
diff --git a/test/diff/Makefile b/test/diff/Makefile
index 25a0b6d3..3e51996f 100644
--- a/test/diff/Makefile
+++ b/test/diff/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Ragel.
diff --git a/test/dns/Makefile b/test/dns/Makefile
index 27b04782..86e11071 100644
--- a/test/dns/Makefile
+++ b/test/dns/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2007 Adrian Thurston <thurston@complang.org>
 #
 
 SRC = $(wildcard *.lm)
diff --git a/test/html/Makefile b/test/html/Makefile
index 25a0b6d3..3e51996f 100644
--- a/test/html/Makefile
+++ b/test/html/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Ragel.
diff --git a/test/http/Makefile b/test/http/Makefile
index 25a0b6d3..3e51996f 100644
--- a/test/http/Makefile
+++ b/test/http/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Ragel.
diff --git a/test/python/Makefile b/test/python/Makefile
index eeab1e53..7ee4cbe7 100644
--- a/test/python/Makefile
+++ b/test/python/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2007 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2007 Adrian Thurston <thurston@complang.org>
 #
 
 
diff --git a/test/ruby/Makefile b/test/ruby/Makefile
index 22647b42..bb1a9fe3 100644
--- a/test/ruby/Makefile
+++ b/test/ruby/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2008 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2008 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Ragel.
diff --git a/test/xml/Makefile b/test/xml/Makefile
index 25a0b6d3..3e51996f 100644
--- a/test/xml/Makefile
+++ b/test/xml/Makefile
@@ -1,5 +1,5 @@
 #
-#   Copyright 2002-2006 Adrian Thurston <thurston@cs.queensu.ca>
+#   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
 #   This file is part of Ragel.
diff --git a/test/xml/xml.in b/test/xml/xml.in
index 3c024f80..22882c95 100644
--- a/test/xml/xml.in
+++ b/test/xml/xml.in
@@ -3741,7 +3741,7 @@
   </machine>
 </ragel_def>
 <host line="1" col="1">/*
- *  Copyright 2006-2007 Adrian Thurston &lt;thurston@cs.queensu.ca&gt;
+ *  Copyright 2006-2007 Adrian Thurston &lt;thurston@complang.org&gt;
  */
 
 /*  This file is part of Ragel.
-- 
cgit v1.2.1


From 9b670aed8f5ecbde13fe30da09eacf569f924002 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 1 Nov 2008 22:33:17 +0000
Subject: Const correctness fixes.

---
 colm/common.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/colm/common.h b/colm/common.h
index 688e60ee..faf7e203 100644
--- a/colm/common.h
+++ b/colm/common.h
@@ -99,8 +99,8 @@ public:
 
 struct HostType
 {
-	char *data1;
-	char *data2;
+	const char *data1;
+	const char *data2;
 	bool isSigned;
 	long long minVal;
 	long long maxVal;
-- 
cgit v1.2.1


From 6451201175074b9aba0a9d0dc0ebe89647225cdd Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 1 Nov 2008 23:17:53 +0000
Subject: some organization improvements

---
 colm/Makefile.in   |   2 +-
 colm/colm.h        |   2 +-
 colm/common.cpp    | 257 ------------------------------------------------
 colm/common.h      | 283 -----------------------------------------------------
 colm/fsmcodegen.h  |   2 +-
 colm/fsmgraph.h    |   2 +-
 colm/keyops.h      | 283 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 colm/main.cpp      |  66 ++++++++++++-
 colm/parsedata.cpp |  37 -------
 colm/parsedata.h   |   2 +-
 colm/pcheck.cpp    | 154 +++++++++++++++++++++++++++++
 colm/redfsm.h      |   2 +-
 12 files changed, 508 insertions(+), 584 deletions(-)
 delete mode 100644 colm/common.cpp
 delete mode 100644 colm/common.h
 create mode 100644 colm/keyops.h
 create mode 100644 colm/pcheck.cpp

diff --git a/colm/Makefile.in b/colm/Makefile.in
index 3f9a3a0c..11616d65 100644
--- a/colm/Makefile.in
+++ b/colm/Makefile.in
@@ -55,7 +55,7 @@ CC_SRCS = \
 	closure.cpp \
 	fsmap.cpp \
 	dotgen.cpp \
-	common.cpp
+	pcheck.cpp
 
 RUNTIME_SRC = fsmrun.cpp pdarun.cpp bytecode.cpp list.cpp \
 	map.cpp string.cpp input.cpp tree.cpp
diff --git a/colm/colm.h b/colm/colm.h
index b3a1d21e..6ae9fc68 100644
--- a/colm/colm.h
+++ b/colm/colm.h
@@ -30,7 +30,7 @@
 
 #include "config.h"
 #include "avltree.h"
-#include "common.h"
+#include "keyops.h"
 
 #define PROGNAME "colm"
 
diff --git a/colm/common.cpp b/colm/common.cpp
deleted file mode 100644
index 8b262bb5..00000000
--- a/colm/common.cpp
+++ /dev/null
@@ -1,257 +0,0 @@
-/*
- *  Copyright 2006-2007 Adrian Thurston <thurston@complang.org>
- */
-
-/*  This file is part of Colm.
- *
- *  Colm is free software; you can redistribute it and/or modify
- *  it under the terms of the GNU General Public License as published by
- *  the Free Software Foundation; either version 2 of the License, or
- *  (at your option) any later version.
- * 
- *  Colm is distributed in the hope that it will be useful,
- *  but WITHOUT ANY WARRANTY; without even the implied warranty of
- *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- *  GNU General Public License for more details.
- * 
- *  You should have received a copy of the GNU General Public License
- *  along with Colm; if not, write to the Free Software
- *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
- */
-
-#include "pcheck.h"
-#include "common.h"
-#include <assert.h>
-
-HostType hostTypesC[] =
-{
-	{ "char",     0,       true,   CHAR_MIN,  CHAR_MAX,   sizeof(char) },
-	{ "unsigned", "char",  false,  0,         UCHAR_MAX,  sizeof(unsigned char) },
-	{ "short",    0,       true,   SHRT_MIN,  SHRT_MAX,   sizeof(short) },
-	{ "unsigned", "short", false,  0,         USHRT_MAX,  sizeof(unsigned short) },
-	{ "int",      0,       true,   INT_MIN,   INT_MAX,    sizeof(int) },
-	{ "unsigned", "int",   false,  0,         UINT_MAX,   sizeof(unsigned int) },
-	{ "long",     0,       true,   LONG_MIN,  LONG_MAX,   sizeof(long) },
-	{ "unsigned", "long",  false,  0,         ULONG_MAX,  sizeof(unsigned long) }
-};
-
-HostType hostTypesD[] =
-{
-	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
-	{ "ubyte",    0,  false,  0,         UCHAR_MAX,   1 },
-	{ "char",     0,  false,  0,         UCHAR_MAX,   1 },
-	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
-	{ "ushort",   0,  false,  0,         USHRT_MAX,   2 },
-	{ "wchar",    0,  false,  0,         USHRT_MAX,   2 },
-	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
-	{ "uint",     0,  false,  0,         UINT_MAX,    4 },
-	{ "dchar",    0,  false,  0,         UINT_MAX,    4 }
-};
-
-HostType hostTypesJava[] = 
-{
-	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
-	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
-	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
-	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
-};
-
-HostType hostTypesRuby[] = 
-{
-	{ "byte",     0,  true,   CHAR_MIN,  CHAR_MAX,    1 },
-	{ "short",    0,  true,   SHRT_MIN,  SHRT_MAX,    2 },
-	{ "char",     0,  false,  0,         USHRT_MAX,   2 },
-	{ "int",      0,  true,   INT_MIN,   INT_MAX,     4 },
-};
-
-HostLang hostLangC =    { hostTypesC,    8, hostTypesC+0,    true };
-HostLang hostLangD =    { hostTypesD,    9, hostTypesD+2,    true };
-HostLang hostLangJava = { hostTypesJava, 4, hostTypesJava+2, false };
-HostLang hostLangRuby = { hostTypesRuby, 4, hostTypesRuby+2, false };
-
-HostLang *hostLang = &hostLangC;
-HostLangType hostLangType = CCode;
-
-/* Construct a new parameter checker with for paramSpec. */
-ParamCheck::ParamCheck( const char *paramSpec, int argc,  const char **argv )
-:
-	state(noparam),
-	argOffset(0),
-	curArg(0),
-	iCurArg(1),
-	paramSpec(paramSpec), 
-	argc(argc), 
-	argv(argv)
-{
-}
-
-/* Check a single option. Returns the index of the next parameter.  Sets p to
- * the arg character if valid, 0 otherwise.  Sets parg to the parameter arg if
- * there is one, NULL otherwise. */
-bool ParamCheck::check()
-{
-	bool requiresParam;
-
-	if ( iCurArg >= argc ) {            /* Off the end of the arg list. */
-		state = noparam;
-		return false;
-	}
-
-	if ( argOffset != 0 && *argOffset == 0 ) {
-		/* We are at the end of an arg string. */
-		iCurArg += 1;
-		if ( iCurArg >= argc ) {
-			state = noparam;
-			return false;
-		}
-		argOffset = 0;
-	}
-
-	if ( argOffset == 0 ) {
-		/* Set the current arg. */
-		curArg = argv[iCurArg];
-
-		/* We are at the beginning of an arg string. */
-		if ( argv[iCurArg] == 0 ||        /* Argv[iCurArg] is null. */
-			 argv[iCurArg][0] != '-' ||   /* Not a param. */
-			 argv[iCurArg][1] == 0 ) {    /* Only a dash. */
-			parameter = 0;
-			parameterArg = 0;
-
-			iCurArg += 1;
-			state = noparam;
-			return true;
-		}
-		argOffset = argv[iCurArg] + 1;
-	}
-
-	/* Get the arg char. */
-	char argChar = *argOffset;
-	
-	/* Loop over all the parms and look for a match. */
-	const char *pSpec = paramSpec;
-	while ( *pSpec != 0 ) {
-		char pSpecChar = *pSpec;
-
-		/* If there is a ':' following the char then
-		 * it requires a parm.  If a parm is required
-		 * then move ahead two in the parmspec. Otherwise
-		 * move ahead one in the parm spec. */
-		if ( pSpec[1] == ':' ) {
-			requiresParam = true;
-			pSpec += 2;
-		}
-		else {
-			requiresParam = false;
-			pSpec += 1;
-		}
-
-		/* Do we have a match. */
-		if ( argChar == pSpecChar ) {
-			if ( requiresParam ) {
-				if ( argOffset[1] == 0 ) {
-					/* The param must follow. */
-					if ( iCurArg + 1 == argc ) {
-						/* We are the last arg so there
-						 * cannot be a parameter to it. */
-						parameter = argChar;
-						parameterArg = 0;
-						iCurArg += 1;
-						argOffset = 0;
-						state = invalid;
-						return true;
-					}
-					else {
-						/* the parameter to the arg is the next arg. */
-						parameter = pSpecChar;
-						parameterArg = argv[iCurArg + 1];
-						iCurArg += 2;
-						argOffset = 0;
-						state = match;
-						return true;
-					}
-				}
-				else {
-					/* The param for the arg is built in. */
-					parameter = pSpecChar;
-					parameterArg = argOffset + 1;
-					iCurArg += 1;
-					argOffset = 0;
-					state = match;
-					return true;
-				}
-			}
-			else {
-				/* Good, we matched the parm and no
-				 * arg is required. */
-				parameter = pSpecChar;
-				parameterArg = 0;
-				argOffset += 1;
-				state = match;
-				return true;
-			}
-		}
-	}
-
-	/* We did not find a match. Bad Argument. */
-	parameter = argChar;
-	parameterArg = 0;
-	argOffset += 1;
-	state = invalid;
-	return true;
-}
-
-/* Scans a string looking for the file extension. If there is a file
- * extension then pointer returned points to inside the string
- * passed in. Otherwise returns null. */
-const char *findFileExtension( const char *stemFile )
-{
-	const char *ppos = stemFile + strlen(stemFile) - 1;
-
-	/* Scan backwards from the end looking for the first dot.
-	 * If we encounter a '/' before the first dot, then stop the scan. */
-	while ( 1 ) {
-		/* If we found a dot or got to the beginning of the string then
-		 * we are done. */
-		if ( ppos == stemFile || *ppos == '.' )
-			break;
-
-		/* If we hit a / then there is no extension. Done. */
-		if ( *ppos == '/' ) {
-			ppos = stemFile;
-			break;
-		}
-		ppos--;
-	} 
-
-	/* If we got to the front of the string then bail we 
-	 * did not find an extension  */
-	if ( ppos == stemFile )
-		ppos = 0;
-
-	return ppos;
-}
-
-/* Make a file name from a stem. Removes the old filename suffix and
- * replaces it with a new one. Returns a newed up string. */
-char *fileNameFromStem( const char *stemFile, const char *suffix )
-{
-	int len = strlen( stemFile );
-	assert( len > 0 );
-
-	/* Get the extension. */
-	const char *ppos = findFileExtension( stemFile );
-
-	/* If an extension was found, then shorten what we think the len is. */
-	if ( ppos != 0 )
-		len = ppos - stemFile;
-
-	/* Make the return string from the stem and the suffix. */
-	char *retVal = new char[ len + strlen( suffix ) + 1 ];
-	strncpy( retVal, stemFile, len );
-	strcpy( retVal + len, suffix );
-
-	return retVal;
-}
-
-
diff --git a/colm/common.h b/colm/common.h
deleted file mode 100644
index faf7e203..00000000
--- a/colm/common.h
+++ /dev/null
@@ -1,283 +0,0 @@
-/*
- *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
- */
-
-/*  This file is part of Colm.
- *
- *  Colm is free software; you can redistribute it and/or modify
- *  it under the terms of the GNU General Public License as published by
- *  the Free Software Foundation; either version 2 of the License, or
- *  (at your option) any later version.
- * 
- *  Colm is distributed in the hope that it will be useful,
- *  but WITHOUT ANY WARRANTY; without even the implied warranty of
- *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- *  GNU General Public License for more details.
- * 
- *  You should have received a copy of the GNU General Public License
- *  along with Colm; if not, write to the Free Software
- *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
- */
-
-#ifndef _COMMON_H
-#define _COMMON_H
-
-#include <fstream>
-#include <climits>
-
-enum MarkType
-{
-	MarkEnter,
-	MarkLeave
-};
-
-typedef unsigned long long Size;
-
-struct Key
-{
-private:
-	long key;
-
-public:
-	friend inline Key operator+(const Key key1, const Key key2);
-	friend inline Key operator-(const Key key1, const Key key2);
-	friend inline Key operator/(const Key key1, const Key key2);
-	friend inline long operator&(const Key key1, const Key key2);
-
-	friend inline bool operator<( const Key key1, const Key key2 );
-	friend inline bool operator<=( const Key key1, const Key key2 );
-	friend inline bool operator>( const Key key1, const Key key2 );
-	friend inline bool operator>=( const Key key1, const Key key2 );
-	friend inline bool operator==( const Key key1, const Key key2 );
-	friend inline bool operator!=( const Key key1, const Key key2 );
-
-	friend struct KeyOps;
-	
-	Key( ) {}
-	Key( const Key &key ) : key(key.key) {}
-	Key( long key ) : key(key) {}
-
-	/* Returns the value used to represent the key. This value must be
-	 * interpreted based on signedness. */
-	long getVal() const { return key; };
-
-	/* Returns the key casted to a long long. This form of the key does not
-	 * require and signedness interpretation. */
-	long long getLongLong() const;
-
-	bool isUpper() const { return ( 'A' <= key && key <= 'Z' ); }
-	bool isLower() const { return ( 'a' <= key && key <= 'z' ); }
-	bool isPrintable() const { return ( 32 <= key && key < 127 ); }
-
-	Key toUpper() const
-		{ return Key( 'A' + ( key - 'a' ) ); }
-	Key toLower() const
-		{ return Key( 'a' + ( key - 'A' ) ); }
-
-	void operator+=( const Key other )
-	{
-		/* FIXME: must be made aware of isSigned. */
-		key += other.key;
-	}
-
-	void operator-=( const Key other )
-	{
-		/* FIXME: must be made aware of isSigned. */
-		key -= other.key;
-	}
-
-	void operator|=( const Key other )
-	{
-		/* FIXME: must be made aware of isSigned. */
-		key |= other.key;
-	}
-
-	/* Decrement. Needed only for ranges. */
-	inline void decrement();
-	inline void increment();
-};
-
-struct HostType
-{
-	const char *data1;
-	const char *data2;
-	bool isSigned;
-	long long minVal;
-	long long maxVal;
-	unsigned int size;
-};
-
-struct HostLang
-{
-	HostType *hostTypes;
-	int numHostTypes;
-	HostType *defaultAlphType;
-	bool explicitUnsigned;
-};
-
-
-/* Target language. */
-enum HostLangType
-{
-	CCode,
-	DCode,
-	JavaCode,
-	RubyCode
-};
-
-extern HostLang *hostLang;
-extern HostLangType hostLangType;
-
-extern HostLang hostLangC;
-extern HostLang hostLangD;
-extern HostLang hostLangJava;
-extern HostLang hostLangRuby;
-
-/* An abstraction of the key operators that manages key operations such as
- * comparison and increment according the signedness of the key. */
-struct KeyOps
-{
-	/* Default to signed alphabet. */
-	KeyOps() :
-		isSigned(true),
-		alphType(0)
-	{}
-
-	/* Default to signed alphabet. */
-	KeyOps( bool isSigned ) 
-		:isSigned(isSigned) {}
-
-	bool isSigned;
-	Key minKey, maxKey;
-	HostType *alphType;
-
-	void setAlphType( HostType *alphType )
-	{
-		this->alphType = alphType;
-		isSigned = alphType->isSigned;
-		if ( isSigned ) {
-			minKey = (long) alphType->minVal;
-			maxKey = (long) alphType->maxVal;
-		}
-		else {
-			minKey = (long) (unsigned long) alphType->minVal; 
-			maxKey = (long) (unsigned long) alphType->maxVal;
-		}
-	}
-
-	/* Compute the distance between two keys. */
-	Size span( Key key1, Key key2 )
-	{
-		return isSigned ? 
-			(unsigned long long)(
-				(long long)key2.key - 
-				(long long)key1.key + 1) : 
-			(unsigned long long)(
-				(unsigned long)key2.key) - 
-				(unsigned long long)((unsigned long)key1.key) + 1;
-	}
-
-	Size alphSize()
-		{ return span( minKey, maxKey ); }
-
-	HostType *typeSubsumes( long long maxVal )
-	{
-		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
-			if ( maxVal <= hostLang->hostTypes[i].maxVal )
-				return hostLang->hostTypes + i;
-		}
-		return 0;
-	}
-
-	HostType *typeSubsumes( bool isSigned, long long maxVal )
-	{
-		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
-			if ( ( isSigned && hostLang->hostTypes[i].isSigned || !isSigned ) &&
-					maxVal <= hostLang->hostTypes[i].maxVal )
-				return hostLang->hostTypes + i;
-		}
-		return 0;
-	}
-};
-
-extern KeyOps *keyOps;
-
-inline bool operator<( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ? key1.key < key2.key : 
-		(unsigned long)key1.key < (unsigned long)key2.key;
-}
-
-inline bool operator<=( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ?  key1.key <= key2.key : 
-		(unsigned long)key1.key <= (unsigned long)key2.key;
-}
-
-inline bool operator>( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ? key1.key > key2.key : 
-		(unsigned long)key1.key > (unsigned long)key2.key;
-}
-
-inline bool operator>=( const Key key1, const Key key2 )
-{
-	return keyOps->isSigned ? key1.key >= key2.key : 
-		(unsigned long)key1.key >= (unsigned long)key2.key;
-}
-
-inline bool operator==( const Key key1, const Key key2 )
-{
-	return key1.key == key2.key;
-}
-
-inline bool operator!=( const Key key1, const Key key2 )
-{
-	return key1.key != key2.key;
-}
-
-/* Decrement. Needed only for ranges. */
-inline void Key::decrement()
-{
-	key = keyOps->isSigned ? key - 1 : ((unsigned long)key)-1;
-}
-
-/* Increment. Needed only for ranges. */
-inline void Key::increment()
-{
-	key = keyOps->isSigned ? key+1 : ((unsigned long)key)+1;
-}
-
-inline long long Key::getLongLong() const
-{
-	return keyOps->isSigned ? (long long)key : (long long)(unsigned long)key;
-}
-
-inline Key operator+(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return Key( key1.key + key2.key );
-}
-
-inline Key operator-(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return Key( key1.key - key2.key );
-}
-
-inline long operator&(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return key1.key & key2.key;
-}
-
-inline Key operator/(const Key key1, const Key key2)
-{
-	/* FIXME: must be made aware of isSigned. */
-	return key1.key / key2.key;
-}
-
-const char *findFileExtension( const char *stemFile );
-char *fileNameFromStem( const char *stemFile, const char *suffix );
-
-#endif /* _COMMON_H */
diff --git a/colm/fsmcodegen.h b/colm/fsmcodegen.h
index 3fbdd32d..06e998c3 100644
--- a/colm/fsmcodegen.h
+++ b/colm/fsmcodegen.h
@@ -25,7 +25,7 @@
 #include <iostream>
 #include <string>
 #include <stdio.h>
-#include "common.h"
+#include "keyops.h"
 #include "parsedata.h"
 #include "redfsm.h"
 
diff --git a/colm/fsmgraph.h b/colm/fsmgraph.h
index 2ab979f5..f898a3d6 100644
--- a/colm/fsmgraph.h
+++ b/colm/fsmgraph.h
@@ -23,7 +23,7 @@
 #define _FSMGRAPH_H
 
 #include <assert.h>
-#include "common.h"
+#include "keyops.h"
 #include "vector.h"
 #include "bstset.h"
 #include "compare.h"
diff --git a/colm/keyops.h b/colm/keyops.h
new file mode 100644
index 00000000..c9828cfd
--- /dev/null
+++ b/colm/keyops.h
@@ -0,0 +1,283 @@
+/*
+ *  Copyright 2001-2006 Adrian Thurston <thurston@complang.org>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#ifndef _KEYOPS_H
+#define _KEYOPS_H
+
+#include <fstream>
+#include <climits>
+
+enum MarkType
+{
+	MarkEnter,
+	MarkLeave
+};
+
+typedef unsigned long long Size;
+
+struct Key
+{
+private:
+	long key;
+
+public:
+	friend inline Key operator+(const Key key1, const Key key2);
+	friend inline Key operator-(const Key key1, const Key key2);
+	friend inline Key operator/(const Key key1, const Key key2);
+	friend inline long operator&(const Key key1, const Key key2);
+
+	friend inline bool operator<( const Key key1, const Key key2 );
+	friend inline bool operator<=( const Key key1, const Key key2 );
+	friend inline bool operator>( const Key key1, const Key key2 );
+	friend inline bool operator>=( const Key key1, const Key key2 );
+	friend inline bool operator==( const Key key1, const Key key2 );
+	friend inline bool operator!=( const Key key1, const Key key2 );
+
+	friend struct KeyOps;
+	
+	Key( ) {}
+	Key( const Key &key ) : key(key.key) {}
+	Key( long key ) : key(key) {}
+
+	/* Returns the value used to represent the key. This value must be
+	 * interpreted based on signedness. */
+	long getVal() const { return key; };
+
+	/* Returns the key cast to a long long. This form of the key does not
+	 * require any signedness interpretation. */
+	long long getLongLong() const;
+
+	bool isUpper() const { return ( 'A' <= key && key <= 'Z' ); }
+	bool isLower() const { return ( 'a' <= key && key <= 'z' ); }
+	bool isPrintable() const { return ( 32 <= key && key < 127 ); }
+
+	Key toUpper() const
+		{ return Key( 'A' + ( key - 'a' ) ); }
+	Key toLower() const
+		{ return Key( 'a' + ( key - 'A' ) ); }
+
+	void operator+=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key += other.key;
+	}
+
+	void operator-=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key -= other.key;
+	}
+
+	void operator|=( const Key other )
+	{
+		/* FIXME: must be made aware of isSigned. */
+		key |= other.key;
+	}
+
+	/* Decrement and increment. Needed only for ranges. */
+	inline void decrement();
+	inline void increment();
+};
+
+struct HostType
+{
+	const char *data1;
+	const char *data2;
+	bool isSigned;
+	long long minVal;
+	long long maxVal;
+	unsigned int size;
+};
+
+struct HostLang
+{
+	HostType *hostTypes;
+	int numHostTypes;
+	HostType *defaultAlphType;
+	bool explicitUnsigned;
+};
+
+
+/* Target language. */
+enum HostLangType
+{
+	CCode,
+	DCode,
+	JavaCode,
+	RubyCode
+};
+
+extern HostLang *hostLang;
+extern HostLangType hostLangType;
+
+extern HostLang hostLangC;
+extern HostLang hostLangD;
+extern HostLang hostLangJava;
+extern HostLang hostLangRuby;
+
+/* An abstraction of the key operators that manages key operations such as
+ * comparison and increment according to the signedness of the key. */
+struct KeyOps
+{
+	/* Default to signed alphabet, with no alphabet type selected yet. */
+	KeyOps() :
+		isSigned(true),
+		alphType(0)
+	{}
+
+	/* Caller-chosen signedness. alphType is nulled here too, so it never
+	 * holds an indeterminate pointer before setAlphType() is called. */
+	KeyOps( bool isSigned ) :isSigned(isSigned), alphType(0) {}
+
+	bool isSigned;
+	Key minKey, maxKey;
+	HostType *alphType;
+
+	void setAlphType( HostType *alphType )
+	{
+		this->alphType = alphType;
+		isSigned = alphType->isSigned;
+		if ( isSigned ) {
+			minKey = (long) alphType->minVal;
+			maxKey = (long) alphType->maxVal;
+		}
+		else {
+			minKey = (long) (unsigned long) alphType->minVal;
+			maxKey = (long) (unsigned long) alphType->maxVal;
+		}
+	}
+
+	/* Compute the distance between two keys. */
+	Size span( Key key1, Key key2 )
+	{
+		return isSigned ?
+			(unsigned long long)(
+				(long long)key2.key -
+				(long long)key1.key + 1) :
+			(unsigned long long)(
+				(unsigned long)key2.key) -
+				(unsigned long long)((unsigned long)key1.key) + 1;
+	}
+
+	/* Number of keys from minKey to maxKey, both ends included. */
+	Size alphSize() { return span( minKey, maxKey ); }
+
+	HostType *typeSubsumes( long long maxVal )
+	{
+		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
+			if ( maxVal <= hostLang->hostTypes[i].maxVal )
+				return hostLang->hostTypes + i;
+		}
+		return 0;
+	}
+
+	HostType *typeSubsumes( bool isSigned, long long maxVal )
+	{
+		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
+			if ( ( ( isSigned && hostLang->hostTypes[i].isSigned ) || !isSigned ) &&
+					maxVal <= hostLang->hostTypes[i].maxVal )
+				return hostLang->hostTypes + i;
+		}
+		return 0;
+	}
+};
+
+extern KeyOps *keyOps;
+
+inline bool operator<( const Key key1, const Key key2 )
+{
+	return keyOps->isSigned ? key1.key < key2.key : 
+		(unsigned long)key1.key < (unsigned long)key2.key;
+}
+
+inline bool operator<=( const Key key1, const Key key2 )
+{
+	return keyOps->isSigned ?  key1.key <= key2.key : 
+		(unsigned long)key1.key <= (unsigned long)key2.key;
+}
+
+inline bool operator>( const Key key1, const Key key2 )
+{
+	return keyOps->isSigned ? key1.key > key2.key : 
+		(unsigned long)key1.key > (unsigned long)key2.key;
+}
+
+inline bool operator>=( const Key key1, const Key key2 )
+{
+	return keyOps->isSigned ? key1.key >= key2.key : 
+		(unsigned long)key1.key >= (unsigned long)key2.key;
+}
+
+inline bool operator==( const Key key1, const Key key2 )
+{
+	return key1.key == key2.key;
+}
+
+inline bool operator!=( const Key key1, const Key key2 )
+{
+	return key1.key != key2.key;
+}
+
+/* Decrement. Needed only for ranges. */
+inline void Key::decrement()
+{
+	key = keyOps->isSigned ? key - 1 : ((unsigned long)key)-1;
+}
+
+/* Increment. Needed only for ranges. */
+inline void Key::increment()
+{
+	key = keyOps->isSigned ? key+1 : ((unsigned long)key)+1;
+}
+
+inline long long Key::getLongLong() const
+{
+	return keyOps->isSigned ? (long long)key : (long long)(unsigned long)key;
+}
+
+inline Key operator+(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. */
+	return Key( key1.key + key2.key );
+}
+
+inline Key operator-(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. */
+	return Key( key1.key - key2.key );
+}
+
+inline long operator&(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. */
+	return key1.key & key2.key;
+}
+
+inline Key operator/(const Key key1, const Key key2)
+{
+	/* FIXME: must be made aware of isSigned. */
+	return key1.key / key2.key;
+}
+
+const char *findFileExtension( const char *stemFile );
+char *fileNameFromStem( const char *stemFile, const char *suffix );
+
+#endif /* _KEYOPS_H */
diff --git a/colm/main.cpp b/colm/main.cpp
index 75940d46..8b8ac853 100644
--- a/colm/main.cpp
+++ b/colm/main.cpp
@@ -32,7 +32,7 @@
 #include "pcheck.h"
 #include "vector.h"
 #include "version.h"
-#include "common.h"
+#include "keyops.h"
 #include "parsedata.h"
 #include "vector.h"
 #include "version.h"
@@ -82,6 +82,16 @@ void version();
 /* Total error count. */
 int gblErrorCount = 0;
 
+HostType hostTypesC[] =
+{
+	{ "char",     0,       true,   CHAR_MIN,  CHAR_MAX,   sizeof(char) },
+};
+/* Entry count is computed from the table so the two can never disagree. */
+HostLang hostLangC = { hostTypesC, sizeof(hostTypesC)/sizeof(hostTypesC[0]), hostTypesC+0, true };
+
+HostLang *hostLang = &hostLangC;
+HostLangType hostLangType = CCode;
+
 /* Print the opening to an error in the input, then return the error ostream. */
 ostream &error( const InputLoc &loc )
 {
@@ -153,6 +163,60 @@ void version()
 			"Copyright (c) 2007, 2008 by Adrian Thurston" << endl;
 }
 
+/* Scans a string looking for the file extension. If there is a file
+ * extension then pointer returned points to the '.' inside the string
+ * passed in. Otherwise returns null. An empty string has no extension
+ * and also yields null. */
+const char *findFileExtension( const char *stemFile )
+{
+	/* Start one past the last character, not on it: for an empty string
+	 * "end - 1" would point before the buffer and be dereferenced. */
+	const char *ppos = stemFile + strlen(stemFile);
+
+	/* Scan backwards from the end looking for the first dot.
+	 * If we encounter a '/' before the first dot, then stop the scan.
+	 * The first character is never examined: a dot in that position is
+	 * not treated as the start of an extension. */
+	while ( ppos > stemFile + 1 ) {
+		ppos--;
+
+		/* If we found a dot then we are done. */
+		if ( *ppos == '.' )
+			return ppos;
+
+		/* If we hit a / then there is no extension. Done. */
+		if ( *ppos == '/' )
+			break;
+	}
+
+	/* We got to the front of the string or to a path separator
+	 * without finding a dot, so there is no extension. */
+	return 0;
+}
+
+/* Build a file name by swapping the extension of stemFile for suffix. The
+ * result is allocated with new[]; freeing it is left to the caller. */
+char *fileNameFromStem( const char *stemFile, const char *suffix )
+{
+	int stemLen = strlen( stemFile );
+	assert( stemLen > 0 );
+
+	/* Keep only the part in front of the extension, when there is one. */
+	const char *ext = findFileExtension( stemFile );
+	if ( ext != 0 )
+		stemLen = ext - stemFile;
+
+	/* Room for the kept stem, the suffix and the terminating null. */
+	char *result = new char[ stemLen + strlen( suffix ) + 1 ];
+
+	/* strncpy copies exactly stemLen chars and does not terminate; the
+	 * strcpy of the suffix right behind it supplies the terminator. */
+	strncpy( result, stemFile, stemLen );
+	strcpy( result + stemLen, suffix );
+	return result;
+}
+
+
 /* Invoked by the parser when the root element is opened. */
 void openOutput( )
 {
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 5aab7886..92957327 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -707,43 +707,6 @@ void ParseData::initGraphDict( )
 	createBuiltin( "empty", BT_Empty );
 }
 
-/* Set the alphabet type. If the types are not valid returns false. */
-bool ParseData::setAlphType( char *s1, char *s2 )
-{
-	bool valid = false;
-	for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
-		if ( strcmp( s1, hostLang->hostTypes[i].data1 ) == 0 && 
-				hostLang->hostTypes[i].data2 != 0 && 
-				strcmp( s2, hostLang->hostTypes[i].data2 ) == 0 )
-		{
-			valid = true;
-			userAlphType = hostLang->hostTypes + i;
-			break;
-		}
-	}
-
-	alphTypeSet = true;
-	return valid;
-}
-
-/* Set the alphabet type. If the types are not valid returns false. */
-bool ParseData::setAlphType( char *s1 )
-{
-	bool valid = false;
-	for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
-		if ( strcmp( s1, hostLang->hostTypes[i].data1 ) == 0 && 
-				hostLang->hostTypes[i].data2 == 0 )
-		{
-			valid = true;
-			userAlphType = hostLang->hostTypes + i;
-			break;
-		}
-	}
-
-	alphTypeSet = true;
-	return valid;
-}
-
 /* Initialize the key operators object that will be referenced by all fsms
  * created. */
 void ParseData::initKeyOps( )
diff --git a/colm/parsedata.h b/colm/parsedata.h
index c16a6a2e..12a1e07d 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -35,7 +35,7 @@
 #include "fsmgraph.h"
 #include "compare.h"
 #include "vector.h"
-#include "common.h"
+#include "keyops.h"
 #include "parsetree.h"
 #include "astring.h"
 #include "pdagraph.h"
diff --git a/colm/pcheck.cpp b/colm/pcheck.cpp
new file mode 100644
index 00000000..ee1985c7
--- /dev/null
+++ b/colm/pcheck.cpp
@@ -0,0 +1,154 @@
+/*
+ *  Copyright 2006-2007 Adrian Thurston <thurston@complang.org>
+ */
+
+/*  This file is part of Colm.
+ *
+ *  Colm is free software; you can redistribute it and/or modify
+ *  it under the terms of the GNU General Public License as published by
+ *  the Free Software Foundation; either version 2 of the License, or
+ *  (at your option) any later version.
+ * 
+ *  Colm is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU General Public License for more details.
+ * 
+ *  You should have received a copy of the GNU General Public License
+ *  along with Colm; if not, write to the Free Software
+ *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+ */
+
+#include "pcheck.h"
+#include <assert.h>
+
+/* Construct a new parameter checker for paramSpec. */
+ParamCheck::ParamCheck( const char *paramSpec, int argc,  const char **argv )
+:
+	state(noparam),
+	argOffset(0),
+	curArg(0),
+	iCurArg(1),
+	paramSpec(paramSpec), 
+	argc(argc), 
+	argv(argv)
+{
+}
+
+/* Check a single option. Returns false once the arg list is exhausted, true
+ * otherwise. Sets parameter to the option character (0 for a non-option arg),
+ * parameterArg to the option's argument or null, and state to the outcome. */
+bool ParamCheck::check()
+{
+	bool requiresParam;
+
+	if ( iCurArg >= argc ) {            /* Off the end of the arg list. */
+		state = noparam;
+		return false;
+	}
+
+	if ( argOffset != 0 && *argOffset == 0 ) {
+		/* We are at the end of an arg string. */
+		iCurArg += 1;
+		if ( iCurArg >= argc ) {
+			state = noparam;
+			return false;
+		}
+		argOffset = 0;
+	}
+
+	if ( argOffset == 0 ) {
+		/* Set the current arg. */
+		curArg = argv[iCurArg];
+
+		/* We are at the beginning of an arg string. */
+		if ( argv[iCurArg] == 0 ||        /* Argv[iCurArg] is null. */
+			 argv[iCurArg][0] != '-' ||   /* Not a param. */
+			 argv[iCurArg][1] == 0 ) {    /* Only a dash. */
+			parameter = 0;
+			parameterArg = 0;
+
+			iCurArg += 1;
+			state = noparam;
+			return true;
+		}
+		argOffset = argv[iCurArg] + 1;
+	}
+
+	/* Get the arg char. */
+	char argChar = *argOffset;
+	
+	/* Loop over all the parms and look for a match. */
+	const char *pSpec = paramSpec;
+	while ( *pSpec != 0 ) {
+		char pSpecChar = *pSpec;
+
+		/* If there is a ':' following the char then
+		 * it requires a parm.  If a parm is required
+		 * then move ahead two in the parmspec. Otherwise
+		 * move ahead one in the parm spec. */
+		if ( pSpec[1] == ':' ) {
+			requiresParam = true;
+			pSpec += 2;
+		}
+		else {
+			requiresParam = false;
+			pSpec += 1;
+		}
+
+		/* Do we have a match. */
+		if ( argChar == pSpecChar ) {
+			if ( requiresParam ) {
+				if ( argOffset[1] == 0 ) {
+					/* The param must follow. */
+					if ( iCurArg + 1 == argc ) {
+						/* We are the last arg so there
+						 * cannot be a parameter to it. */
+						parameter = argChar;
+						parameterArg = 0;
+						iCurArg += 1;
+						argOffset = 0;
+						state = invalid;
+						return true;
+					}
+					else {
+						/* the parameter to the arg is the next arg. */
+						parameter = pSpecChar;
+						parameterArg = argv[iCurArg + 1];
+						iCurArg += 2;
+						argOffset = 0;
+						state = match;
+						return true;
+					}
+				}
+				else {
+					/* The param for the arg is built in. */
+					parameter = pSpecChar;
+					parameterArg = argOffset + 1;
+					iCurArg += 1;
+					argOffset = 0;
+					state = match;
+					return true;
+				}
+			}
+			else {
+				/* Good, we matched the parm and no
+				 * arg is required. */
+				parameter = pSpecChar;
+				parameterArg = 0;
+				argOffset += 1;
+				state = match;
+				return true;
+			}
+		}
+	}
+
+	/* We did not find a match. Bad Argument. */
+	parameter = argChar;
+	parameterArg = 0;
+	argOffset += 1;
+	state = invalid;
+	return true;
+}
+
+
diff --git a/colm/redfsm.h b/colm/redfsm.h
index 32310552..d5d5a03f 100644
--- a/colm/redfsm.h
+++ b/colm/redfsm.h
@@ -25,7 +25,7 @@
 #include <assert.h>
 #include <string.h>
 #include <string>
-#include "common.h"
+#include "keyops.h"
 #include "vector.h"
 #include "dlist.h"
 #include "compare.h"
-- 
cgit v1.2.1


From 8036f23c96d6f0dea1a25fde68fbb18ac4793b9f Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 1 Nov 2008 23:34:59 +0000
Subject: Added a pointer to Program to FsmRun.

---
 colm/bytecode.cpp  |  4 ++--
 colm/fsmrun.cpp    | 59 +++++++++++++++++++++++++++---------------------------
 colm/fsmrun.h      |  3 ++-
 colm/parsedata.cpp |  2 +-
 4 files changed, 35 insertions(+), 33 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 8cd1b98b..8c25079d 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -156,7 +156,7 @@ Stream *open_stream_file( Program *prg, FILE *file )
 	res->id = LEL_ID_STREAM;
 	res->file = file;
 	res->in = new InputStreamFile( file );
-	res->scanner = new FsmRun( prg->rtd->fsmTables );
+	res->scanner = new FsmRun( prg );
 	res->scanner->attachInputStream( res->in );
 	return res;
 }
@@ -166,7 +166,7 @@ Stream *open_stream_fd( Program *prg, long fd )
 	Stream *res = (Stream*)prg->mapElPool.allocate();
 	res->id = LEL_ID_STREAM;
 	res->in = new InputStreamFD( fd );
-	res->scanner = new FsmRun( prg->rtd->fsmTables );
+	res->scanner = new FsmRun( prg );
 	res->scanner->attachInputStream( res->in );
 	return res;
 }
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index bf6b0ce8..8eb2101b 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -42,8 +42,9 @@ void operator<<( ostream &out, exit_object & )
 	exit(1);
 }
 
-FsmRun::FsmRun( FsmTables *tables ) :
-	tables(tables),
+FsmRun::FsmRun( Program *prg ) :
+	prg(prg),
+	tables(prg->rtd->fsmTables),
 	parser(0),
 	position(0)
 {
@@ -213,7 +214,7 @@ void FsmRun::queueBack( Kid *input )
 void FsmRun::sendBackIgnore( Kid *ignore )
 {
 	/* Ignore tokens are queued in reverse order. */
-	while ( tree_is_ignore( parser->prg, ignore ) ) {
+	while ( tree_is_ignore( prg, ignore ) ) {
 		#ifdef COLM_LOG_PARSE
 		LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
 		cerr << "sending back: " << lelInfo[ignore->tree->id].name;
@@ -232,7 +233,7 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 		/* Check for reverse code. */
 		Alg *alg = ignore->tree->alg;
 		if ( alg != 0 && alg->flags & AF_HAS_RCODE ) {
-			Execution execution( parser->prg, parser->reverseCode, 
+			Execution execution( prg, parser->reverseCode, 
 					parser, 0, 0, 0 );
 
 			/* Do the reverse exeuction. */
@@ -273,7 +274,7 @@ void FsmRun::sendBack( Kid *input )
 
 	/* Check for reverse code. */
 	if ( alg->flags & AF_HAS_RCODE ) {
-		Execution execution( parser->prg, parser->reverseCode, 
+		Execution execution( prg, parser->reverseCode, 
 				parser, 0, 0, 0 );
 
 		/* Do the reverse exeuction. */
@@ -282,7 +283,7 @@ void FsmRun::sendBack( Kid *input )
 	}
 
 	/* Always push back the ignore text. */
-	sendBackIgnore( tree_ignore( parser->prg, input->tree ) );
+	sendBackIgnore( tree_ignore( prg, input->tree ) );
 
 	/* If eof was just sent back remember that it needs to be sent again. */
 	if ( input->tree->id == parser->tables->gbl->eofId )
@@ -292,12 +293,12 @@ void FsmRun::sendBack( Kid *input )
 	Tree *lastBound = parser->bindings.top();
 	if ( lastBound == input->tree ) {
 		parser->bindings.pop();
-		tree_downref( parser->prg, input->tree );
+		tree_downref( prg, input->tree );
 	}
 
 	/* Downref the tree that was sent back and free the kid. */
-	tree_downref( parser->prg, input->tree );
-	parser->prg->kidPool.free( input );
+	tree_downref( prg, input->tree );
+	prg->kidPool.free( input );
 }
 
 void FsmRun::sendEOF( )
@@ -306,14 +307,14 @@ void FsmRun::sendEOF( )
 	cerr << "token: _EOF" << endl;
 	#endif
 
-	Kid *input = parser->prg->kidPool.allocate();
-	input->tree = parser->prg->treePool.allocate();
-	input->tree->alg = parser->prg->algPool.allocate();
+	Kid *input = prg->kidPool.allocate();
+	input->tree = prg->treePool.allocate();
+	input->tree->alg = prg->algPool.allocate();
 
 	input->tree->refs = 1;
 	input->tree->id = parser->tables->gbl->eofId;
 
-	bool ctxDepParsing = parser->prg->ctxDepParsing;
+	bool ctxDepParsing = prg->ctxDepParsing;
 	long frameId = parser->tables->gbl->regionInfo[region].eofFrameId;
 	if ( ctxDepParsing && frameId >= 0 ) {
 		#ifdef COLM_LOG_PARSE
@@ -323,7 +324,7 @@ void FsmRun::sendEOF( )
 		Code *code = parser->tables->gbl->frameInfo[frameId].code;
 	
 		/* Execute the translation. */
-		Execution execution( parser->prg, parser->reverseCode, 
+		Execution execution( prg, parser->reverseCode, 
 				parser, code, 0, 0 );
 		execution.execute( parser->root );
 
@@ -360,7 +361,7 @@ void FsmRun::sendQueuedTokens()
 			#endif
 			
 			parser->ignore( send->tree );
-			parser->prg->kidPool.free( send );
+			prg->kidPool.free( send );
 		}
 		else {
 			#ifdef COLM_LOG_PARSE
@@ -378,12 +379,12 @@ void FsmRun::sendToken( long id )
 	cerr << "token: " << parser->tables->gbl->lelInfo[id].name << endl;
 	#endif
 
-	bool ctxDepParsing = parser->prg->ctxDepParsing;
+	bool ctxDepParsing = prg->ctxDepParsing;
 	LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
 
 	/* Copy the token data. */
 	long length = p-tokstart;
-	Head *tokdata = string_alloc_const( parser->prg, tokstart, length );
+	Head *tokdata = string_alloc_const( prg, tokstart, length );
 
 	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
 		translateLangEl( id, tokdata, false, 0 );
@@ -415,7 +416,7 @@ void FsmRun::sendNamedLangEl()
 	/* Copy the token data. */
 	Head *tokdata = 0;
 	if ( data != 0 )
-		tokdata = string_alloc_new( parser->prg, data, length );
+		tokdata = string_alloc_new( prg, data, length );
 
 	makeToken( klangEl->id, tokdata, true, bindId );
 }
@@ -458,11 +459,11 @@ void FsmRun::translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindI
 	p = tokstart;
 
 	/* Execute the translation. */
-	Execution execution( parser->prg, parser->reverseCode, 
+	Execution execution( prg, parser->reverseCode, 
 			parser, code, 0, tokdata );
 	execution.execute( parser->root );
 
-	string_free( parser->prg, tokdata );
+	string_free( prg, tokdata );
 
 	set_AF_GROUP_MEM();
 }
@@ -471,12 +472,12 @@ void FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 {
 	/* Make the token object. */
 	long objectLength = parser->tables->gbl->lelInfo[id].objectLength;
-	Kid *attrs = alloc_attrs( parser->prg, objectLength );
+	Kid *attrs = alloc_attrs( prg, objectLength );
 
 	Kid *input = 0;
-	input = parser->prg->kidPool.allocate();
-	input->tree = parser->prg->treePool.allocate();
-	input->tree->alg = parser->prg->algPool.allocate();
+	input = prg->kidPool.allocate();
+	input->tree = prg->treePool.allocate();
+	input->tree->alg = prg->algPool.allocate();
 
 	if ( namedLangEl )
 		input->tree->alg->flags |= AF_NAMED;
@@ -491,9 +492,9 @@ void FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 	/* Set attributes for the labelled components. */
 	for ( int i = 0; i < 32; i++ ) {
 		if ( mark_leave[i] != 0 ) {
-			Head *data = string_alloc_new( parser->prg, 
+			Head *data = string_alloc_new( prg, 
 					mark_enter[i], mark_leave[i] - mark_enter[i] );
-			set_attr( input->tree, i, construct_string( parser->prg, data ) );
+			set_attr( input->tree, i, construct_string( prg, data ) );
 			tree_upref( get_attr( input->tree, i ) );
 		}
 	}
@@ -614,9 +615,9 @@ void FsmRun::sendIgnore( long id )
 	#endif
 
 	/* Make the ignore string. */
-	Head *ignoreStr = string_alloc_const( parser->prg, tokstart, length );
+	Head *ignoreStr = string_alloc_const( prg, tokstart, length );
 	
-	Tree *tree = parser->prg->treePool.allocate();
+	Tree *tree = prg->treePool.allocate();
 	tree->refs = 1;
 	tree->id = id;
 	tree->tokdata = ignoreStr;
@@ -677,7 +678,7 @@ Head *FsmRun::extractToken( long length )
 	if ( tokstart + length > pe )
 		cerr << "NOT ENOUGH DATA TO FETCH TOKEN" << endp;
 
-	Head *tokdata = string_alloc_const( parser->prg, tokstart, length );
+	Head *tokdata = string_alloc_const( prg, tokstart, length );
 	p = tokstart + length;
 	tokstart = 0;
 
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 4d0dc58f..1637c259 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -83,7 +83,7 @@ struct RunBuf
 
 struct FsmRun
 {
-	FsmRun( FsmTables *tables );
+	FsmRun( Program *prg );
 	~FsmRun();
 
 	void set_AF_GROUP_MEM();
@@ -113,6 +113,7 @@ struct FsmRun
 
 	void execute();
 
+	Program *prg;
 	FsmTables *tables;
 	PdaRun *parser;
 	InputStream *inputStream;
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 92957327..348d5f85 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1627,8 +1627,8 @@ void ParseData::makePatternParsers()
 
 void ParseData::parsePatterns()
 {
-	FsmRun fsmRun( runtimeData->fsmTables );
 	Program program( false, runtimeData );
+	FsmRun fsmRun( &program );
 
 	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
 		//cerr << "parsing replacement: " << repl->data << endl;
-- 
cgit v1.2.1


From 5b919dce01b8f6c1df5507905fb318f5ca7d8a2c Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 2 Nov 2008 00:03:19 +0000
Subject: We cannot always clear the rcode at the end of a full commit. We have
 to compute when it is safe to do so.

Need to set the fsmRun->parser field before invoking a full parse undo.
---
 colm/bytecode.cpp | 4 ++--
 colm/fsmrun.cpp   | 7 +++++--
 colm/pdarun.cpp   | 6 ++++--
 3 files changed, 11 insertions(+), 6 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 8c25079d..d418aedc 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -1963,7 +1963,7 @@ again:
 		default: {
 			cerr << "UNKNOWN INSTRUCTION: " << (ulong)instr[-1] << 
 					" -- reverse code downref" << endl;
-			exit(1);
+			assert(false);
 			break;
 		}
 	}
@@ -4084,7 +4084,7 @@ again:
 		default: {
 			cerr << "UNKNOWN INSTRUCTION: " << (ulong)instr[-1] << 
 					" -- something is wrong" << endl;
-			exit(1);
+			assert(false);
 			break;
 		}
 	}
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 8eb2101b..d4726d87 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -82,8 +82,6 @@ void FsmRun::streamPush( const char *data, long length )
 		assert(false);
 	}
 	else {
-		cerr << "case 3" << endl;
-
 		/* Send back the second half of the current run buffer. */
 		RunBuf *dup = new RunBuf;
 		memcpy( dup, runBuf, sizeof(RunBuf) );
@@ -717,8 +715,13 @@ long PdaRun::undoParse( Tree *tree, CodeVect *rev )
 	numRetry += 1;
 	allReverseCode.transfer( *rev );
 
+	PdaRun *prevParser = fsmRun->parser;
+	fsmRun->parser = this;
+
 	parseToken( 0 );
 
+	fsmRun->parser = prevParser;
+
 	assert( stackTop->next == 0 );
 
 	prg->algPool.free( stackTop->tree->alg );
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 04e2adef..3980c6b9 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -260,8 +260,10 @@ void PdaRun::commit()
 	 * was when we started. */
 	assert( sp == root );
 
-	/* Now clear all the rcode. */
-	rcode_downref_all( root, prg, &allReverseCode );
+	/* We cannot always clear all the rcode here. We may need to backup over
+	 * the parse statement. In the future we should compute when it is safe to
+	 * do so, but for now just leave everything until later. */
+	//rcode_downref_all( root, prg, &allReverseCode );
 }
 
 
-- 
cgit v1.2.1


From ea23064878be6c7bae8c9e1caee6dae23c7c8192 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 2 Nov 2008 00:06:31 +0000
Subject: strip empty lines

---
 test/cxx/preproc | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/test/cxx/preproc b/test/cxx/preproc
index 14e8fe6b..ed708599 100755
--- a/test/cxx/preproc
+++ b/test/cxx/preproc
@@ -1,4 +1,4 @@
 #!/bin/bash
 #
 
-g++ -E -undef -D'__attribute__(xyz)=' "$@" | sed 's/#.*$//'
+g++ -E -undef -D'__attribute__(xyz)=' "$@" | sed 's/#.*$//' | grep -v '^[ \t]*$'
-- 
cgit v1.2.1


From 10baa7815cc93ca8655c99454ce6b10e1f8b8f73 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 2 Nov 2008 16:29:57 +0000
Subject: The makeToken function now returns a new token, which must be sent by
 the caller.

---
 colm/fsmrun.cpp | 12 ++++++++----
 colm/fsmrun.h   |  5 +++--
 2 files changed, 11 insertions(+), 6 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index d4726d87..f159340f 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -46,6 +46,8 @@ FsmRun::FsmRun( Program *prg ) :
 	prg(prg),
 	tables(prg->rtd->fsmTables),
 	parser(0),
+	line(1),
+	col(1),
 	position(0)
 {
 }
@@ -389,7 +391,8 @@ void FsmRun::sendToken( long id )
 		sendQueuedTokens();
 	}
 	else {
-		makeToken( id, tokdata, false, 0 );
+		Kid *input = makeToken( id, tokdata, false, 0 );
+		sendLangEl( input );
 		assert( parser->queue == 0 );
 	}
 
@@ -416,7 +419,8 @@ void FsmRun::sendNamedLangEl()
 	if ( data != 0 )
 		tokdata = string_alloc_new( prg, data, length );
 
-	makeToken( klangEl->id, tokdata, true, bindId );
+	Kid *input = makeToken( klangEl->id, tokdata, true, bindId );
+	sendLangEl( input );
 }
 
 void FsmRun::set_AF_GROUP_MEM()
@@ -466,7 +470,7 @@ void FsmRun::translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindI
 	set_AF_GROUP_MEM();
 }
 
-void FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
+Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 {
 	/* Make the token object. */
 	long objectLength = parser->tables->gbl->lelInfo[id].objectLength;
@@ -503,7 +507,7 @@ void FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 		tree_upref( input->tree );
 	}
 
-	sendLangEl( input );
+	return input;
 }
 
 /* Send back the accumulated ignore tokens. */
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 1637c259..6ff49a0d 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -89,7 +89,7 @@ struct FsmRun
 	void set_AF_GROUP_MEM();
 
 	void sendLangEl( Kid *input );
-	void makeToken( int id, Head *tokdata, bool namedLangEl, int bindId );
+	Kid *makeToken( int id, Head *tokdata, bool namedLangEl, int bindId );
 	void translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindId );
 	void sendNamedLangEl();
 	void sendEOF();
@@ -119,13 +119,14 @@ struct FsmRun
 	InputStream *inputStream;
 
 	/* FsmRun State. */
-	int region, cs, act;
+	long region, cs, act;
 	char *tokstart, *tokend;
 	char *p, *pe, *peof;
 	bool eofSent;
 	RunBuf *runBuf;
 	bool gotoResume;
 	long position;
+	long line, col;
 	char *mark_enter[32];
 	char *mark_leave[32];
 };
-- 
cgit v1.2.1


From 481afc32eef7ff1f1701d709e1dd59698deb404d Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 2 Nov 2008 17:14:58 +0000
Subject: The parse-wide reverse code stack is now dynamically allocated so it
 can be transferred out of the PdaRun structure when parsing is complete.

Added a couple missing tree downrefs for stream objects.
---
 colm/bytecode.cpp | 39 +++++++++++++++++++++------------------
 colm/bytecode.h   |  2 +-
 colm/fsmrun.cpp   |  6 +++---
 colm/fsmrun.h     |  2 +-
 colm/pdarun.cpp   |  4 +++-
 colm/pdarun.h     |  4 ++--
 6 files changed, 31 insertions(+), 26 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index d418aedc..41886e75 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -324,18 +324,18 @@ Tree *parse( Tree **&sp, Program *prg, Stream *stream,
 	tree_upref( tree );
 	parser.clean();
 
-	cv = new CodeVect;
-	cv->transfer( parser.allReverseCode );
+	/* Return the reverse code. */
+	cv = parser.allReverseCode;
 	return tree;
 }
 
-Tree *undo_parse( Tree **&sp, Program *prg, Stream *stream, 
+void undo_parse( Tree **&sp, Program *prg, Stream *stream, 
 		long parserId, Tree *tree, CodeVect *rev )
 {
 	PdaTables *tables = prg->rtd->parsers[parserId];
 	PdaRun parser( sp, prg, tables, stream->scanner, 0 );
 	parser.undoParse( tree, rev );
-	return 0;
+	delete rev;
 }
 
 Tree *stream_pull( Program *prg, Stream *stream, Tree *length )
@@ -1726,7 +1726,7 @@ void Program::run()
 
 	if ( rtd->rootCodeLen > 0 ) {
 		CodeVect reverseCode;
-		CodeVect allReverseCode;
+		CodeVect *allReverseCode = new CodeVect;
 		Execution execution( this, reverseCode, 0, rtd->rootCode, 0, 0 );
 		execution.execute( root );
 
@@ -1737,7 +1737,8 @@ void Program::run()
 
 		bool hasrcode = makeReverseCode( allReverseCode, reverseCode );
 		if ( hasrcode )
-			rcode_downref( root, this, allReverseCode.data );
+			rcode_downref( root, this, allReverseCode->data );
+		delete allReverseCode;
 	}
 }
 
@@ -1777,6 +1778,7 @@ void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *rev )
 		/* Backup over it. */
 		rev->tabLen -= len + 4;
 	}
+	delete rev;
 }
 
 void rcode_downref( Tree **stack_root, Program *prg, Code *instr )
@@ -1825,7 +1827,7 @@ again:
 			cerr << "IN_STREAM_PUSH_BKT" << endl;
 			#endif
 
-			// FIXME: Implement
+			tree_downref( prg, stream );
 			break;
 		}
 		case IN_LOAD_GLOBAL_BKT: {
@@ -1989,7 +1991,7 @@ void Execution::execute( Tree **root )
 	assert( sp == root );
 }
 
-bool makeReverseCode( CodeVect &all, CodeVect &reverseCode )
+bool makeReverseCode( CodeVect *all, CodeVect &reverseCode )
 {
 	/* Do we need to revert the left hand side? */
 
@@ -1997,7 +1999,7 @@ bool makeReverseCode( CodeVect &all, CodeVect &reverseCode )
 	if ( reverseCode.length() == 0 )
 		return false;
 
-	long prevAllLength = all.length();
+	long prevAllLength = all->length();
 
 	/* Go backwards, group by group, through the reverse code. Push each group
 	 * to the global reverse code stack. */
@@ -2006,13 +2008,13 @@ bool makeReverseCode( CodeVect &all, CodeVect &reverseCode )
 		p--;
 		long len = *p;
 		p = p - len;
-		all.append( p, len );
+		all->append( p, len );
 	}
 
 	/* Stop, then place a total length in the global stack. */
-	all.append( IN_STOP );
-	long length = all.length() - prevAllLength;
-	all.appendWord( length );
+	all->append( IN_STOP );
+	long length = all->length() - prevAllLength;
+	all->appendWord( length );
 
 	/* Clear the revere code buffer. */
 	reverseCode.tabLen = 0;
@@ -2020,16 +2022,16 @@ bool makeReverseCode( CodeVect &all, CodeVect &reverseCode )
 	return true;
 }
 
-void Execution::rexecute( Tree **root, Code *rcode, CodeVect &allRev )
+void Execution::rexecute( Tree **root, CodeVect *allRev )
 {
 	/* Read the length */
-	Code *prcode = allRev.data + allRev.length() - 4;
+	Code *prcode = allRev->data + allRev->length() - 4;
 	Word len;
 	read_word_p( len, prcode );
 
 	/* Find the start of block. */
-	long start = allRev.length() - len - 4;
-	prcode = allRev.data + start;
+	long start = allRev->length() - len - 4;
+	prcode = allRev->data + start;
 
 	/* Execute it. */
 	Tree **sp = root;
@@ -2037,7 +2039,7 @@ void Execution::rexecute( Tree **root, Code *rcode, CodeVect &allRev )
 	assert( sp == root );
 
 	/* Backup over it. */
-	allRev.tabLen -= len + 4;
+	allRev->tabLen -= len + 4;
 }
 
 void Execution::execute( Tree **&sp, Code *instr )
@@ -3079,6 +3081,7 @@ again:
 			#endif
 
 			undo_stream_push( sp, prg, (Stream*)stream, len );
+			tree_downref( prg, stream );
 			break;
 		}
 		case IN_PARSE_BKT: {
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 885d2f4b..d3ccd1d7 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -607,7 +607,7 @@ struct Execution
 	long rcodeUnitLen;
 
 	void execute( Tree **root );
-	void rexecute( Tree **root, Code *revcode, CodeVect &allRev );
+	void rexecute( Tree **root, CodeVect *allRev );
 	void execute( Tree **&sp, Code *instr );
 	void rdownref( Code *instr );
 };
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index f159340f..6d55c567 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -237,7 +237,7 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 					parser, 0, 0, 0 );
 
 			/* Do the reverse exeuction. */
-			execution.rexecute( parser->root, 0, parser->allReverseCode );
+			execution.rexecute( parser->root, parser->allReverseCode );
 			alg->flags &= ~AF_HAS_RCODE;
 		}
 
@@ -278,7 +278,7 @@ void FsmRun::sendBack( Kid *input )
 				parser, 0, 0, 0 );
 
 		/* Do the reverse exeuction. */
-		execution.rexecute( parser->root, 0, parser->allReverseCode );
+		execution.rexecute( parser->root, parser->allReverseCode );
 		alg->flags &= ~AF_HAS_RCODE;
 	}
 
@@ -717,7 +717,7 @@ long PdaRun::undoParse( Tree *tree, CodeVect *rev )
 	top->tree = tree;
 	stackTop = top;
 	numRetry += 1;
-	allReverseCode.transfer( *rev );
+	allReverseCode = rev;
 
 	PdaRun *prevParser = fsmRun->parser;
 	fsmRun->parser = this;
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 6ff49a0d..a0fcbd7c 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -125,8 +125,8 @@ struct FsmRun
 	bool eofSent;
 	RunBuf *runBuf;
 	bool gotoResume;
-	long position;
 	long line, col;
+	long position;
 	char *mark_enter[32];
 	char *mark_leave[32];
 };
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 3980c6b9..66c9312d 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -85,6 +85,8 @@ void PdaRun::init()
 
 	/* Bindings are indexed at 1. Need a no-binding. */
 	bindings.push(0);
+
+	allReverseCode = new CodeVect;
 }
 
 long PdaRun::stackTopTarget()
@@ -559,7 +561,7 @@ parseError:
 				Execution execution( prg, reverseCode, this, 0, 0, 0 );
 
 				/* Do the reverse exeuction. */
-				execution.rexecute( root, 0, allReverseCode );
+				execution.rexecute( root, allReverseCode );
 				alg->flags &= ~AF_HAS_RCODE;
 			}
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 84ab5682..afac5d77 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -436,7 +436,7 @@ struct PdaTables
 	RuntimeData *gbl;
 };
 
-bool makeReverseCode( CodeVect &all, CodeVect &reverseCode );
+bool makeReverseCode( CodeVect *all, CodeVect &reverseCode );
 
 typedef Vector<Tree*> Bindings;
 
@@ -495,7 +495,7 @@ struct PdaRun
 
 	/* Reused. */
 	CodeVect reverseCode;
-	CodeVect allReverseCode;
+	CodeVect *allReverseCode;
 
 	bool stopParsing;
 	long stopTarget;
-- 
cgit v1.2.1


From a781b54819c0e128790f8a40ecc80830fa268421 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 3 Nov 2008 04:44:04 +0000
Subject: Added svn:ignore properties for test directories. Ragel -> Colm in
 the license headers. Added the mediawiki grammar (a work in progress).

---
 test/Makefile               |  10 +--
 test/cxx/Makefile           |   8 +-
 test/diff/Makefile          |   8 +-
 test/html/Makefile          |   8 +-
 test/http/Makefile          |   8 +-
 test/mediawiki/Makefile     |  43 ++++++++++
 test/mediawiki/garticle.rl  | 133 ++++++++++++++++++++++++++++++
 test/mediawiki/mediawiki.lm | 196 ++++++++++++++++++++++++++++++++++++++++++++
 test/mediawiki/pdump.rl     | 115 ++++++++++++++++++++++++++
 test/python/Makefile        |  15 ++++
 test/ruby/Makefile          |   8 +-
 test/xml/Makefile           |   8 +-
 12 files changed, 531 insertions(+), 29 deletions(-)
 create mode 100644 test/mediawiki/Makefile
 create mode 100644 test/mediawiki/garticle.rl
 create mode 100644 test/mediawiki/mediawiki.lm
 create mode 100644 test/mediawiki/pdump.rl

diff --git a/test/Makefile b/test/Makefile
index f86db51d..492bfaf2 100644
--- a/test/Makefile
+++ b/test/Makefile
@@ -2,26 +2,26 @@
 #   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
-#   This file is part of Ragel.
+#   This file is part of Colm.
 #
-#   Ragel is free software; you can redistribute it and/or modify
+#   Colm is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 #
-#   Ragel is distributed in the hope that it will be useful,
+#   Colm is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 #
 #   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
+#   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
 SRC = $(wildcard *.lm)
 BIN = $(SRC:%.lm=%.bin)
-SUBDIRS = xml python http dns diff html cxx ruby
+SUBDIRS = xml python http dns diff html cxx ruby mediawiki
 
 all: $(BIN) $(SUBDIRS)
 
diff --git a/test/cxx/Makefile b/test/cxx/Makefile
index c19f557b..9fb58795 100644
--- a/test/cxx/Makefile
+++ b/test/cxx/Makefile
@@ -2,20 +2,20 @@
 #   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
-#   This file is part of Ragel.
+#   This file is part of Colm.
 #
-#   Ragel is free software; you can redistribute it and/or modify
+#   Colm is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 #
-#   Ragel is distributed in the hope that it will be useful,
+#   Colm is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 #
 #   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
+#   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
diff --git a/test/diff/Makefile b/test/diff/Makefile
index 3e51996f..d647261a 100644
--- a/test/diff/Makefile
+++ b/test/diff/Makefile
@@ -2,20 +2,20 @@
 #   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
-#   This file is part of Ragel.
+#   This file is part of Colm.
 #
-#   Ragel is free software; you can redistribute it and/or modify
+#   Colm is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 #
-#   Ragel is distributed in the hope that it will be useful,
+#   Colm is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 #
 #   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
+#   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
diff --git a/test/html/Makefile b/test/html/Makefile
index 3e51996f..d647261a 100644
--- a/test/html/Makefile
+++ b/test/html/Makefile
@@ -2,20 +2,20 @@
 #   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
-#   This file is part of Ragel.
+#   This file is part of Colm.
 #
-#   Ragel is free software; you can redistribute it and/or modify
+#   Colm is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 #
-#   Ragel is distributed in the hope that it will be useful,
+#   Colm is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 #
 #   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
+#   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
diff --git a/test/http/Makefile b/test/http/Makefile
index 3e51996f..d647261a 100644
--- a/test/http/Makefile
+++ b/test/http/Makefile
@@ -2,20 +2,20 @@
 #   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
-#   This file is part of Ragel.
+#   This file is part of Colm.
 #
-#   Ragel is free software; you can redistribute it and/or modify
+#   Colm is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 #
-#   Ragel is distributed in the hope that it will be useful,
+#   Colm is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 #
 #   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
+#   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
diff --git a/test/mediawiki/Makefile b/test/mediawiki/Makefile
new file mode 100644
index 00000000..3e6bf661
--- /dev/null
+++ b/test/mediawiki/Makefile
@@ -0,0 +1,43 @@
+#
+#   Copyright 2008 Adrian Thurston <thurston@complang.org>
+#
+
+#   This file is part of Colm.
+#
+#   Colm is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Colm is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Colm; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
+
+SRC = $(wildcard *.lm)
+BIN = $(SRC:%.lm=%.bin)
+COLM = ../../colm/colm
+# NOTE(review): SRC and BIN are not referenced by any rule in this file.
+all: pdump garticle mediawiki.bin
+# Generate pdump.cpp from its Ragel source, then compile it.
+pdump.cpp: pdump.rl
+	ragel -G2 -o pdump.cpp pdump.rl
+
+pdump: pdump.cpp
+	g++ -O3 -Wall -o pdump pdump.cpp
+# garticle follows the same two steps as pdump.
+garticle.cpp: garticle.rl
+	ragel -G2 -o garticle.cpp garticle.rl
+
+garticle: garticle.cpp
+	g++ -O3 -Wall -o garticle garticle.cpp
+# Run $(COLM) (../../colm/colm) on mediawiki.lm.
+mediawiki.bin: mediawiki.lm
+	$(COLM) mediawiki.lm
+# Remove generated sources and built programs.
+clean:
+	rm -f mediawiki.cpp *.bin garticle.cpp garticle pdump.cpp pdump
diff --git a/test/mediawiki/garticle.rl b/test/mediawiki/garticle.rl
new file mode 100644
index 00000000..ca711a85
--- /dev/null
+++ b/test/mediawiki/garticle.rl
@@ -0,0 +1,133 @@
+#include <iostream>
+#include <fstream>
+
+using std::cout;
+using std::cerr;
+using std::endl;
+using std::ifstream;
+using std::ofstream;
+
+%%{
+	machine garticle;
+	write data;
+}%%
+
+
+int main( int argc, char **argv )
+{
+	std::ios::sync_with_stdio(false);
+	/* Prints the character data enclosed by <section> tags within one article of the dump. */
+	if ( argc != 5 ) {
+		cerr << "usage: garticle <dump-file> <article-index> <section> <article>" << endl;
+		return -1;
+	}
+
+	char *dumpFile = argv[1];
+	char *articleIndex = argv[2];
+	char *section = argv[3];
+	char *article = argv[4];
+
+	ifstream dump( dumpFile );
+	if ( !dump.is_open() ) {
+		cerr << "error: unable to open " << dumpFile << " for reading" << endl;
+		return -1;
+	}
+
+	ifstream index( articleIndex );
+	if ( !index.is_open() ) {
+		cerr << "error: unable to open " << articleIndex << " for reading" << endl;
+		return -1;
+	}
+	/* Consecutive long longs at slot <article> of the index give the byte range to load. */
+	long long articleNum = atoll(article);
+	index.seekg( articleNum * sizeof(long long) );
+	long long start = 0, end = 0;
+	if ( !index.read( (char*)&start, sizeof(long long) ) || !index.read( (char*)&end, sizeof(long long) ) || end < start ) {
+		cerr << "error: no usable index entry for article " << article << endl;
+		return -1;
+	}
+	long long len = end - start;
+	char *buf = new char[len];
+	dump.seekg( start-5 ); // NOTE(review): reason for the 5-byte backoff is not visible here; confirm
+	dump.read( buf, len );
+
+	char tn[2048];
+	long ptn = 0;
+	bool emit = false;
+	/* Scan only what was actually read, so a short read never exposes uninitialized bytes. */
+	char *p = buf, *pe = buf + dump.gcount();
+	int cs;
+
+	%%{
+		newline = '\n';
+		sp = [ \t\n\r];
+
+		name = [a-zA-Z:_0-9]+;
+
+		# Tag names, copied into tn; over-long names are truncated to fit.
+		tag_name = name
+			>{ ptn = 0; }
+			${ if ( ptn < (long)sizeof(tn) - 1 ) tn[ptn++] = *p; }
+			%{ tn[ptn++] = 0; }
+			;
+
+		attr_name = name;
+
+		# Attributes
+		attr_val = '"' ( [^"\\] | newline | ( '\\' any ) )* '"';
+		attr = attr_name '=' attr_val;
+		attrs = ( sp attr )*;
+
+		action maybe_open {
+			if ( strcmp( tn, section ) == 0 )
+				emit = true;
+		}
+
+		action maybe_close {
+			if ( strcmp( tn, section ) == 0 )
+				emit = false;
+		}
+
+		# Tags
+		tag = '<' tag_name %maybe_open attrs sp? ( '>' | '/>' );
+		close_tag = '</' tag_name %maybe_close '>';
+
+		# Character data, not spaces and not tag starts.
+		char_data_char = ^('<'|'&');
+		char_data = char_data_char+
+			${ 
+				if ( emit )
+					cout << *p;
+			} ;
+
+		defined_entities =
+			'quot' %{if (emit) cout << '"';} |
+			'amp' %{if (emit) cout << '&';} |
+			'apos' %{if (emit) cout << '\'';} |
+			'lt' %{if (emit) cout << '<';} |
+			'gt' %{if (emit) cout << '>';};
+
+		entity_ref = '&' defined_entities ';';
+
+		main := ( 
+				tag |
+				close_tag |
+				entity_ref |
+				char_data
+			)*
+			;
+
+		write init;
+		write exec;
+	}%%
+	delete[] buf; // the scan is finished; nothing below touches the buffer
+	if ( cs < garticle_first_final ) {
+		cerr << endl << endl << "garticle: error parsing dump file" << endl;
+		return 1;
+	}
+
+	/* Terminate the emitted text with a newline. */
+	cout << endl;
+
+	return 0;
+}
diff --git a/test/mediawiki/mediawiki.lm b/test/mediawiki/mediawiki.lm
new file mode 100644
index 00000000..e8dd3a27
--- /dev/null
+++ b/test/mediawiki/mediawiki.lm
@@ -0,0 +1,196 @@
+def open_item
+	str type
+	int num
+	[]
+
+list open_stack [open_item]
+global open_stack OpenStack = construct open_stack []
+open_item Sentinal = construct open_item( type: '** SENTINAL **', num: 1 ) []
+OpenStack.push( Sentinal )
+
+lex start
+{
+	token stray_close //
+
+	token ocurly /'{'+/
+	{
+		open_item OI = construct open_item( type: '{', num: match_length ) []
+		OpenStack.push( OI )
+		int i = 0
+		while ( i < match_length ) {
+			send( make_token( typeid ocurly, pull(stdin, 1 ) ) )
+			i = i + 1
+		}
+	}
+
+	token ccurly1 //
+	token ccurly2 //
+	token ccurly3 //
+	token missing_curly //
+
+	token tmp1 /'}'+/
+	{
+		if OpenStack.length > 0 && OpenStack.tail.type == '{' {
+			int length = 3
+			if ( length > match_length )
+				length = match_length
+
+			open_item Tail = OpenStack.pop()
+			if ( length > Tail.num )
+				length = Tail.num
+
+			if ( length == 1 )
+				send( make_token( typeid ccurly1, pull( stdin, 1 ) ) )
+			else if ( length == 2 )
+				send( make_token( typeid ccurly2, pull( stdin, 2 ) ) )
+			else if ( length == 3 )
+				send( make_token( typeid ccurly3, pull( stdin, 3 ) ) )
+
+			Tail.num = Tail.num - length
+
+			if ( Tail.num > 0 )
+				OpenStack.push( Tail )
+		}
+		else {
+			send( make_token( typeid stray_close, pull( stdin, match_length ) ) )
+		}
+	}
+	
+	token osquare /'['+/
+	{
+		open_item OI = construct open_item( type: '[', num: match_length ) []
+		OpenStack.push( OI )
+		int i = 0
+		while ( i < match_length ) {
+			send( make_token( typeid osquare, pull(stdin, 1 ) ) )
+			i = i + 1
+		}
+	}
+
+	token csquare1 //
+	token csquare2 //
+	token missing_square //
+
+	token tmp2 /']'+/
+	{
+		if OpenStack.length > 0 && OpenStack.tail.type == '[' {
+			int length = 2
+			if ( length > match_length )
+				length = match_length
+
+			open_item Tail = OpenStack.pop()
+			if ( length > Tail.num )
+				length = Tail.num
+
+			if ( length == 1 )
+				send( make_token( typeid csquare1, pull( stdin, 1 ) ) )
+			else if ( length == 2 )
+				send( make_token( typeid csquare2, pull( stdin, 2 ) ) )
+
+			Tail.num = Tail.num - length
+
+			if ( Tail.num > 0 )
+				OpenStack.push( Tail )
+		}
+		else {
+			send( make_token( typeid stray_close, pull( stdin, match_length ) ) )
+		}
+	}
+	
+	literal '|'
+	token char /any/
+
+	preeof {
+		while ( OpenStack.length > 0 ) {
+			open_item Tail = OpenStack.pop()
+			int i
+			if ( Tail.type == '{' ) {
+				i = 0
+				while ( i < Tail.num ) {
+					send( make_token( typeid missing_curly, '}' ) )
+					i = i + 1
+				}
+			}
+			else if ( Tail.type == '[' ) {
+				i = 0
+				while ( i < Tail.num ) {
+					send( make_token( typeid missing_square, ']' ) )
+					i = i + 1
+				}
+			}
+		}
+	}
+}
+
+#
+# Internal Links
+#
+
+
+lex el_prefix
+{
+	literal 'http:'
+	literal 'ftp:'
+	literal 'mailto:'
+}
+
+def el_prefix
+	['http:']
+|	['ftp:']
+|	['mailto:']
+
+def external_link
+	[osquare item* csquare1]
+
+def internal_link
+	[osquare osquare item* csquare2]
+
+def unclosed_square
+	[osquare item* missing_square]
+
+#
+# Templates
+#
+
+def sing_template
+	[ocurly item* ccurly1]
+
+def template
+	[ocurly ocurly item* ccurly2]
+
+def parameter
+	[ocurly ocurly ocurly item* ccurly3] 
+
+def unclosed_curly
+	[ocurly item* missing_curly]
+
+#
+# Template Parameters
+#
+
+
+def U1 []
+def U2 []
+def U3 []
+
+def item
+	[external_link]
+|	[internal_link]
+|	[unclosed_square]
+|	[sing_template]
+|	[template]
+|	[parameter]
+|	[unclosed_curly]
+|	[stray_close]
+|	[osquare]
+|	['|']
+|	[char]
+
+def start 
+	[item*]
+
+start S = parse start(stdin)
+for I: internal_link in S
+	print( I, '\n' )
+print_xml( S )
+#print_xml( OpenStack )
diff --git a/test/mediawiki/pdump.rl b/test/mediawiki/pdump.rl
new file mode 100644
index 00000000..8b19bf37
--- /dev/null
+++ b/test/mediawiki/pdump.rl
@@ -0,0 +1,115 @@
+#include <iostream>
+#include <fstream>
+
+using std::cout;
+using std::cerr;
+using std::endl;
+using std::ifstream;
+using std::ofstream;
+
+
+#define RBS 65536
+
+%%{
+	machine pdump;
+	write data;
+}%%
+
+int main( int argc, char **argv )	// pdump: scan <dump-file>, write page offsets to <article-index>
+{
+	std::ios::sync_with_stdio(false);
+
+	if ( argc != 3 ) {
+		cerr << "usage: pdump <dump-file> <article-index>" << endl;
+		return -1;
+	}
+
+	ifstream input( argv[1] );
+	if ( !input.is_open() ) {
+		cerr << "error: unable to open " << argv[1] << " for reading" << endl;
+		return -1;
+	}
+
+	ofstream output( argv[2] );
+	if ( !output.is_open() ) {
+		cerr << "error: unable to open " << argv[2] <<  " for writing" << endl;
+		return -1;
+	}
+
+	long cs;	// Ragel current state; initialized once, carried across buffer refills
+	%% write init;
+
+	long long line = 1;	// input line counter, reported on parse error
+	long long total = 0;	// bytes consumed by all previously processed chunks
+	static char buf[RBS];
+	while ( true ) {
+		if ( input.eof() )
+			break;
+
+		input.read( buf, RBS );
+		long ss = input.gcount();	// number of bytes actually read into buf
+
+		char *p = buf, *pe = buf + ss;	// scan range handed to the Ragel exec code
+
+		%%{
+
+		action newline { line++; }
+		newline = '\n'@newline;
+		any_nl = any | newline;
+
+		sp_char = [ \t\n\r];
+		sp = sp_char | newline;
+
+		# Tag names.
+		any_tag_name = [a-zA-Z:0-9]+ ;
+
+		page_tag_name = 'page'
+			%{
+				long inbuf = p - buf;	// offset of p within the current chunk
+				long long pos = total + inbuf;	// absolute byte offset within the dump
+				output.write( (char*)&pos, sizeof(long long) );	// index entry: raw long long bytes
+			};
+
+		tag_name = any_tag_name | page_tag_name;
+
+		attr_name = [a-zA-Z:0-9]+;
+
+		# Attributes
+		attr_val = '"' ( [^"\\] | newline | ( '\\' any_nl ) )* '"';
+		attr = attr_name '=' attr_val;
+		attrs = ( sp attr )*;
+
+		# Tags
+		tag = '<' tag_name attrs sp? ( '>' | '/>' );
+		close_tag = '</' any_tag_name '>';
+
+		# Character data, not spaces and not tag starts.
+		char_data_char = ^(sp_char | '<');
+		char_data = char_data_char+;
+
+		main := ( 
+				tag |
+				close_tag |
+				newline |
+				sp |
+				char_data
+			)*
+			;
+
+		write exec;
+
+		}%%
+
+		if ( cs == pdump_error ) {	// the machine entered its error state
+			cerr << "error:" << line << ": parse error" << endl;
+			return -1;
+		}
+
+		total += ss;	// advance the absolute offset past this chunk
+	}
+
+	input.close();
+	output.close();
+		
+	return 0;
+}
diff --git a/test/python/Makefile b/test/python/Makefile
index 7ee4cbe7..6ee0fde1 100644
--- a/test/python/Makefile
+++ b/test/python/Makefile
@@ -2,6 +2,21 @@
 #   Copyright 2007 Adrian Thurston <thurston@complang.org>
 #
 
+#   This file is part of Colm.
+#
+#   Colm is free software; you can redistribute it and/or modify
+#   it under the terms of the GNU General Public License as published by
+#   the Free Software Foundation; either version 2 of the License, or
+#   (at your option) any later version.
+#
+#   Colm is distributed in the hope that it will be useful,
+#   but WITHOUT ANY WARRANTY; without even the implied warranty of
+#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#   GNU General Public License for more details.
+#
+#   You should have received a copy of the GNU General Public License
+#   along with Colm; if not, write to the Free Software
+#   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 SRC = $(wildcard *.lm)
 BIN = $(SRC:%.lm=%.bin)
diff --git a/test/ruby/Makefile b/test/ruby/Makefile
index bb1a9fe3..16285a0a 100644
--- a/test/ruby/Makefile
+++ b/test/ruby/Makefile
@@ -2,20 +2,20 @@
 #   Copyright 2008 Adrian Thurston <thurston@complang.org>
 #
 
-#   This file is part of Ragel.
+#   This file is part of Colm.
 #
-#   Ragel is free software; you can redistribute it and/or modify
+#   Colm is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 #
-#   Ragel is distributed in the hope that it will be useful,
+#   Colm is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 #
 #   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
+#   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
diff --git a/test/xml/Makefile b/test/xml/Makefile
index 3e51996f..d647261a 100644
--- a/test/xml/Makefile
+++ b/test/xml/Makefile
@@ -2,20 +2,20 @@
 #   Copyright 2002-2006 Adrian Thurston <thurston@complang.org>
 #
 
-#   This file is part of Ragel.
+#   This file is part of Colm.
 #
-#   Ragel is free software; you can redistribute it and/or modify
+#   Colm is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 #
-#   Ragel is distributed in the hope that it will be useful,
+#   Colm is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 #
 #   You should have received a copy of the GNU General Public License
-#   along with Ragel; if not, write to the Free Software
+#   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
 
-- 
cgit v1.2.1


From 1f85b3e2bfad623a76022cc2dad22085d125d6c8 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 3 Nov 2008 17:20:10 +0000
Subject: Added a README with info on building, syntax highlighting and
 running.

---
 README | 43 +++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 43 insertions(+)
 create mode 100644 README

diff --git a/README b/README
new file mode 100644
index 00000000..a4119acc
--- /dev/null
+++ b/README
@@ -0,0 +1,43 @@
+BUILDING
+========
+
+Colm is currently supported only on Unix-like systems. It depends on the mmap
+function and it must be able to find g++ on the path.
+
+Building Colm from the source repository requires that you have ragel and kelbt
+installed. Building these two packages is straightforward. The usual
+./configure && make should be all that's needed. Alternatively, you may find
+packages for your system.
+
+http://www.complang.org/ragel/
+http://www.complang.org/kelbt/
+
+SYNTAX HIGHLIGHTING
+===================
+
+There is a vim syntax definition file colm.vim
+
+RUNNING
+=======
+
+The colm executable takes a Colm program and generates a .cpp file from it. It
+then compiles this program using g++. The g++ compile phase depends on include
+directories in the colm distribution, as well as a runtime library. Colm finds
+these using argv[0]:
+
+    -I dirname(argv[0])"../aapl"
+    -I dirname(argv[0])"../colm"
+    dirname(argv[0])"../colm/runtime.a"
+
+Therefore it is easiest to just run colm from the place it was built. This is
+temporary. In the future a proper install scheme will be provided.
+
+$ ./colm prog.lm
+
+Will produce:
+    prog.cpp
+    prog.bin
+
+The prog.bin program can then be run on some input:
+
+$ ./prog.bin < inputfile
-- 
cgit v1.2.1


From 131190487afd249d3871bea0c92246bfb628a499 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 3 Nov 2008 22:04:13 +0000
Subject: Improved management of tokstart. Don't leave it set through the
 processing of tokens. When a match is made extract the text then either
 advance over the text or leave the stream untouched (generation actions) and
 immediately reset tokstart.

---
 colm/fsmrun.cpp | 55 ++++++++++++++++++++-----------------------------------
 1 file changed, 20 insertions(+), 35 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 6d55c567..0515f1cc 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -382,15 +382,24 @@ void FsmRun::sendToken( long id )
 	bool ctxDepParsing = prg->ctxDepParsing;
 	LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
 
-	/* Copy the token data. */
+	/* Make the token data. */
 	long length = p-tokstart;
 	Head *tokdata = string_alloc_const( prg, tokstart, length );
 
 	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
+		/* We don't want the generation actions to automatically consume text
+		 * so reset p since the scanner leaves it at tokend. */
+		p = tokstart;
+		tokstart = 0;
+
 		translateLangEl( id, tokdata, false, 0 );
 		sendQueuedTokens();
 	}
 	else {
+		/* By default the match is consumed and this is what we need. Just
+		 * need to reset tokstart. */
+		tokstart = 0;
+
 		Kid *input = makeToken( id, tokdata, false, 0 );
 		sendLangEl( input );
 		assert( parser->queue == 0 );
@@ -439,13 +448,8 @@ void FsmRun::set_AF_GROUP_MEM()
 }
 
 /* 
- * Implmented:
- *  -shorten the match (possibly to zero length)
- *  -change the token to a new identifier 
- *  -change global state (it can, but it isn't reverted during backtracking).
- *
- * Not implemented:
- *  -invoke failure (and hence the backtracker)
+ * Not supported:
+ *  -invoke failure (the backtracker)
  */
 
 void FsmRun::translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindId )
@@ -458,8 +462,6 @@ void FsmRun::translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindI
 	Code *code = parser->tables->gbl->frameInfo[
 			parser->tables->gbl->lelInfo[id].frameId].code;
 	
-	p = tokstart;
-
 	/* Execute the translation. */
 	Execution execution( prg, parser->reverseCode, 
 			parser, code, 0, tokdata );
@@ -580,9 +582,6 @@ void FsmRun::sendLangEl( Kid *input )
 		}
 	}
 
-	/* Reset tokstart. */
-	tokstart = 0;
-
 	#ifdef COLM_LOG_PARSE
 	cerr << "new token region: " << 
 			parser->tables->gbl->regionInfo[region].name << endl;
@@ -610,14 +609,14 @@ void PdaRun::ignore( Tree *tree )
 
 void FsmRun::sendIgnore( long id )
 {
-	int length = p-tokstart;
-
 	#ifdef COLM_LOG_PARSE
 	cerr << "ignoring: " << parser->tables->gbl->lelInfo[id].name << endl;
 	#endif
 
 	/* Make the ignore string. */
+	int length = p - tokstart;
 	Head *ignoreStr = string_alloc_const( prg, tokstart, length );
+	tokstart = 0;
 	
 	Tree *tree = prg->treePool.allocate();
 	tree->refs = 1;
@@ -628,7 +627,6 @@ void FsmRun::sendIgnore( long id )
 	parser->ignore( tree );
 
 	/* Prepare for more scanning. */
-	tokstart = 0;
 	position += length;
 	region = parser->getNextRegion();
 	cs = tables->entryByRegion[region];
@@ -649,23 +647,11 @@ void FsmRun::emitToken( KlangEl *token )
 Head *FsmRun::extractToken( long length )
 {
 	/* How much do we have already? Tokstart may or may not be set. */
-	long have = 0;
-	if ( tokstart != 0 )
-		have = p - tokstart;
-	else
-		tokstart = p;
+	assert( tokstart == 0 );
 
 	/* The generated token length has been stuffed into tokdata. */
-	if ( tokstart + length > pe ) {
-		/* There is not enough data in the buffer to generate the token.
-		 * Shift data over and fill the buffer. */
-		if ( have > 0 ) {
-			/* There is data that needs to be shifted over. */
-			memmove( runBuf->buf, tokstart, have );
-			tokend -= (tokstart - runBuf->buf);
-			tokstart = runBuf->buf;
-		}
-		p = pe = runBuf->buf + have;
+	if ( p + length > pe ) {
+		p = pe = runBuf->buf;
 		peof = 0;
 
 		long space = runBuf->buf + FSM_BUFSIZE - pe;
@@ -677,12 +663,11 @@ Head *FsmRun::extractToken( long length )
 		pe = p + len;
 	}
 
-	if ( tokstart + length > pe )
+	if ( p + length > pe )
 		cerr << "NOT ENOUGH DATA TO FETCH TOKEN" << endp;
 
-	Head *tokdata = string_alloc_const( prg, tokstart, length );
-	p = tokstart + length;
-	tokstart = 0;
+	Head *tokdata = string_alloc_const( prg, p, length );
+	p += length;
 
 	return tokdata;
 }
-- 
cgit v1.2.1


From c67badc33e7be18137afe8a57b16607421a28fe7 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 3 Nov 2008 22:31:39 +0000
Subject: Some cleanup and a little bit of prep for moving to C as the target.

---
 colm/fsmrun.cpp | 39 ++++++++++++++++++++++++---------------
 colm/fsmrun.h   |  7 ++++---
 2 files changed, 28 insertions(+), 18 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 0515f1cc..07d4e2de 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -328,9 +328,11 @@ void FsmRun::sendEOF( )
 				parser, code, 0, 0 );
 		execution.execute( parser->root );
 
+		/* Mark generated tokens as belonging to a group. */
 		set_AF_GROUP_MEM();
 
-		sendQueuedTokens();
+		/* Send the generated tokens. */
+		send_queued_tokens( this, parser );
 	}
 
 	parser->send( input );
@@ -345,7 +347,7 @@ void FsmRun::sendEOF( )
 	cs = tables->entryByRegion[region];
 }
 
-void FsmRun::sendQueuedTokens()
+void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 {
 	while ( parser->queue != 0 ) {
 		/* Pull an item to send off the queue. */
@@ -361,14 +363,15 @@ void FsmRun::sendQueuedTokens()
 			#endif
 			
 			parser->ignore( send->tree );
-			prg->kidPool.free( send );
+			fsmRun->prg->kidPool.free( send );
 		}
 		else {
 			#ifdef COLM_LOG_PARSE
 			cerr << "sending queue item: " << 
 					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
 			#endif
-			sendLangEl( send );
+
+			send_handle_error( fsmRun, parser, send );
 		}
 	}
 }
@@ -392,8 +395,7 @@ void FsmRun::sendToken( long id )
 		p = tokstart;
 		tokstart = 0;
 
-		translateLangEl( id, tokdata, false, 0 );
-		sendQueuedTokens();
+		generationAction( id, tokdata, false, 0 );
 	}
 	else {
 		/* By default the match is consumed and this is what we need. Just
@@ -401,8 +403,7 @@ void FsmRun::sendToken( long id )
 		tokstart = 0;
 
 		Kid *input = makeToken( id, tokdata, false, 0 );
-		sendLangEl( input );
-		assert( parser->queue == 0 );
+		send_handle_error( this, parser, input );
 	}
 
 	memset( mark_leave, 0, sizeof(mark_leave) );
@@ -429,9 +430,11 @@ void FsmRun::sendNamedLangEl()
 		tokdata = string_alloc_new( prg, data, length );
 
 	Kid *input = makeToken( klangEl->id, tokdata, true, bindId );
-	sendLangEl( input );
+	send_handle_error( this, parser, input );
 }
 
+/* Sets the AF_GROUP_MEM so the backtracker can tell which tokens were sent
+ * generated from a single action. */
 void FsmRun::set_AF_GROUP_MEM()
 {
 	/* Set AF_GROUP_MEM now. */
@@ -452,13 +455,14 @@ void FsmRun::set_AF_GROUP_MEM()
  *  -invoke failure (the backtracker)
  */
 
-void FsmRun::translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindId )
+void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bindId )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "translating: " << 
+	cerr << "generation action: " << 
 			parser->tables->gbl->lelInfo[id].name << endl;
 	#endif
 
+	/* Find the code. */
 	Code *code = parser->tables->gbl->frameInfo[
 			parser->tables->gbl->lelInfo[id].frameId].code;
 	
@@ -467,9 +471,14 @@ void FsmRun::translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindI
 			parser, code, 0, tokdata );
 	execution.execute( parser->root );
 
+	/* Finished with the match text. */
 	string_free( prg, tokdata );
 
+	/* Mark generated tokens as belonging to a group. */
 	set_AF_GROUP_MEM();
+
+	/* Send the queued tokens. */
+	send_queued_tokens( this, parser );
 }
 
 Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
@@ -556,7 +565,7 @@ void PdaRun::send( Kid *input )
 	parseToken( input );
 }
 
-void FsmRun::sendLangEl( Kid *input )
+void send_handle_error( FsmRun *fsmRun, PdaRun *parser, Kid *input )
 {
 	long id = input->tree->id;
 
@@ -570,14 +579,14 @@ void FsmRun::sendLangEl( Kid *input )
 	}
 	else {
 		/* Set the current state from the next region. */
-		region = parser->getNextRegion();
-		cs = tables->entryByRegion[region];
+		fsmRun->region = parser->getNextRegion();
+		fsmRun->cs = fsmRun->tables->entryByRegion[fsmRun->region];
 
 		if ( parser->isParserStopFinished() ) {
 			#ifdef COLM_LOG_PARSE
 			cerr << "stopping the parse" << endl;
 			#endif
-			cs = tables->errorState;
+			fsmRun->cs = fsmRun->tables->errorState;
 			parser->stopParsing = true;
 		}
 	}
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index a0fcbd7c..2ba936fe 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -88,13 +88,11 @@ struct FsmRun
 
 	void set_AF_GROUP_MEM();
 
-	void sendLangEl( Kid *input );
 	Kid *makeToken( int id, Head *tokdata, bool namedLangEl, int bindId );
-	void translateLangEl( int id, Head *tokdata, bool namedLangEl, int bindId );
+	void generationAction( int id, Head *tokdata, bool namedLangEl, int bindId );
 	void sendNamedLangEl();
 	void sendEOF();
 	void sendIgnore( long id );
-	void sendQueuedTokens();
 	void sendToken( long id );
 
 	void sendBackIgnore( Kid *ignore );
@@ -131,4 +129,7 @@ struct FsmRun
 	char *mark_leave[32];
 };
 
+void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser );
+void send_handle_error( FsmRun *fsmRun, PdaRun *parser, Kid *input );
+
 #endif
-- 
cgit v1.2.1


From 6847f32f20b4c4f536374776f254db72197889e3 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 00:00:10 +0000
Subject: Track the current line and print it in PdaRun::parse_error().

---
 colm/fsmrun.cpp | 70 ++++++++++++++++++++++++++++++++++++---------------------
 colm/fsmrun.h   |  4 +---
 colm/pdarun.cpp |  7 +-----
 3 files changed, 47 insertions(+), 34 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 07d4e2de..23ec2242 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -47,7 +47,6 @@ FsmRun::FsmRun( Program *prg ) :
 	tables(prg->rtd->fsmTables),
 	parser(0),
 	line(1),
-	col(1),
 	position(0)
 {
 }
@@ -115,6 +114,28 @@ void FsmRun::streamPush( const char *data, long length )
 	}
 }
 
+/* Keep the position up to date after consuming text. */
+void update_position( FsmRun *fsmRun, const char *data, long length )
+{
+	for ( int i = 0; i < length; i++ ) {
+		if ( data[i] == '\n' )
+			fsmRun->line += 1;
+	}
+
+	fsmRun->position += length;
+}
+
+/* Keep the position up to date after sending back text. */
+void undo_position( FsmRun *fsmRun, const char *data, long length )
+{
+	for ( int i = 0; i < length; i++ ) {
+		if ( data[i] == '\n' )
+			fsmRun->line -= 1;
+	}
+
+	fsmRun->position -= length;
+}
+
 /* Should only be sending back whole tokens/ignores, therefore the send back
  * should never cross a buffer boundary. Either we slide back p, or we move to
  * a previous buffer and slide back p. */
@@ -160,7 +181,7 @@ void FsmRun::sendBackText( const char *data, long length )
 
 	assert( memcmp( data, p, length ) == 0 );
 		
-	position -= length;
+	undo_position( this, data, length );
 
 	/* We are adjusting p so this must be reset. */
 	tokstart = 0;
@@ -301,6 +322,23 @@ void FsmRun::sendBack( Kid *input )
 	prg->kidPool.free( input );
 }
 
+/* Sets the AF_GROUP_MEM so the backtracker can tell which tokens were sent
+ * generated from a single action. */
+void set_AF_GROUP_MEM( PdaRun *parser )
+{
+	/* Set AF_GROUP_MEM now. */
+	long sendCount = 0;
+	Kid *queued = parser->queue;
+	while ( queued != 0 ) {
+		if ( !(queued->tree->alg->flags & AF_IGNORE) ) {
+			if ( sendCount > 0 )
+				queued->tree->alg->flags |= AF_GROUP_MEM;
+			sendCount += 1;
+		}
+		queued = queued->next;
+	}
+}
+
 void FsmRun::sendEOF( )
 {
 	#ifdef COLM_LOG_PARSE
@@ -329,7 +367,7 @@ void FsmRun::sendEOF( )
 		execution.execute( parser->root );
 
 		/* Mark generated tokens as belonging to a group. */
-		set_AF_GROUP_MEM();
+		set_AF_GROUP_MEM( parser );
 
 		/* Send the generated tokens. */
 		send_queued_tokens( this, parser );
@@ -388,6 +426,7 @@ void FsmRun::sendToken( long id )
 	/* Make the token data. */
 	long length = p-tokstart;
 	Head *tokdata = string_alloc_const( prg, tokstart, length );
+	update_position( this, tokstart, length );
 
 	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
 		/* We don't want the generation actions to automatically consume text
@@ -433,23 +472,6 @@ void FsmRun::sendNamedLangEl()
 	send_handle_error( this, parser, input );
 }
 
-/* Sets the AF_GROUP_MEM so the backtracker can tell which tokens were sent
- * generated from a single action. */
-void FsmRun::set_AF_GROUP_MEM()
-{
-	/* Set AF_GROUP_MEM now. */
-	long sendCount = 0;
-	Kid *queued = parser->queue;
-	while ( queued != 0 ) {
-		if ( !(queued->tree->alg->flags & AF_IGNORE) ) {
-			if ( sendCount > 0 )
-				queued->tree->alg->flags |= AF_GROUP_MEM;
-			sendCount += 1;
-		}
-		queued = queued->next;
-	}
-}
-
 /* 
  * Not supported:
  *  -invoke failure (the backtracker)
@@ -475,7 +497,7 @@ void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bind
 	string_free( prg, tokdata );
 
 	/* Mark generated tokens as belonging to a group. */
-	set_AF_GROUP_MEM();
+	set_AF_GROUP_MEM( parser );
 
 	/* Send the queued tokens. */
 	send_queued_tokens( this, parser );
@@ -543,10 +565,6 @@ Kid *PdaRun::extractIgnore()
 
 void PdaRun::send( Kid *input )
 {
-	long length = string_length( input->tree->tokdata );
-	//input->tree->pos = fsmRun->position;
-	fsmRun->position += length;
-
 	/* Pull the ignore tokens out and store in the token. */
 	Kid *ignore = extractIgnore();
 	if ( ignore != 0 ) {
@@ -625,6 +643,7 @@ void FsmRun::sendIgnore( long id )
 	/* Make the ignore string. */
 	int length = p - tokstart;
 	Head *ignoreStr = string_alloc_const( prg, tokstart, length );
+	update_position( this, tokstart, length );
 	tokstart = 0;
 	
 	Tree *tree = prg->treePool.allocate();
@@ -676,6 +695,7 @@ Head *FsmRun::extractToken( long length )
 		cerr << "NOT ENOUGH DATA TO FETCH TOKEN" << endp;
 
 	Head *tokdata = string_alloc_const( prg, p, length );
+	update_position( this, p, length );
 	p += length;
 
 	return tokdata;
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 2ba936fe..af1edc10 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -86,8 +86,6 @@ struct FsmRun
 	FsmRun( Program *prg );
 	~FsmRun();
 
-	void set_AF_GROUP_MEM();
-
 	Kid *makeToken( int id, Head *tokdata, bool namedLangEl, int bindId );
 	void generationAction( int id, Head *tokdata, bool namedLangEl, int bindId );
 	void sendNamedLangEl();
@@ -123,7 +121,7 @@ struct FsmRun
 	bool eofSent;
 	RunBuf *runBuf;
 	bool gotoResume;
-	long line, col;
+	long line;
 	long position;
 	char *mark_enter[32];
 	char *mark_leave[32];
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 66c9312d..8ba1b98c 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -628,12 +628,7 @@ _out:
 
 ostream &PdaRun::parse_error( int tokId, Tree *tree )
 {
-	/* Maintain the error count. */
-	// FIXME: what to put here?
-	// gblErrorCount += 1;
-
-	//cerr << token.loc.fileName << ":" << token.loc.line << ":" << token.loc.col << ": ";
-	cerr << "error: at token ";
+	cerr << "error:" << fsmRun->line << ": at token ";
 	if ( tokId < 128 )
 		cerr << "\"" << tables->gbl->lelInfo[tokId].name << "\"";
 	else 
-- 
cgit v1.2.1


From 65806528c347e6a4689065d82aa9b60b12801b9a Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 02:41:59 +0000
Subject: delete code vectors in the PARSE_BKT instruction

---
 colm/bytecode.cpp | 4 ++--
 colm/pdarun.cpp   | 2 +-
 colm/tree.cpp     | 4 ++--
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 41886e75..f6f7f797 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -335,7 +335,6 @@ void undo_parse( Tree **&sp, Program *prg, Stream *stream,
 	PdaTables *tables = prg->rtd->parsers[parserId];
 	PdaRun parser( sp, prg, tables, stream->scanner, 0 );
 	parser.undoParse( tree, rev );
-	delete rev;
 }
 
 Tree *stream_pull( Program *prg, Stream *stream, Tree *length )
@@ -1778,7 +1777,6 @@ void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *rev )
 		/* Backup over it. */
 		rev->tabLen -= len + 4;
 	}
-	delete rev;
 }
 
 void rcode_downref( Tree **stack_root, Program *prg, Code *instr )
@@ -1802,6 +1800,7 @@ again:
 			rcode_downref_all( stack_root, prg, (CodeVect*)wrev );
 			tree_downref( prg, stream );
 			tree_downref( prg, tree );
+			delete (CodeVect*)wrev;
 			break;
 		}
 		case IN_STREAM_PULL_BKT: {
@@ -3099,6 +3098,7 @@ again:
 
 			undo_parse( sp, prg, (Stream*)stream, parserId, tree, (CodeVect*)wrev );
 			tree_downref( prg, stream );
+			delete (CodeVect*)wrev;
 			break;
 		}
 		case IN_CONSTRUCT: {
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 8ba1b98c..03e3f3b6 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -265,7 +265,7 @@ void PdaRun::commit()
 	/* We cannot always clear all the rcode here. We may need to backup over
 	 * the parse statement. In the future we should compute when it is safe to
 	 * do so, but for now just leave everything until later. */
-	//rcode_downref_all( root, prg, &allReverseCode );
+//	rcode_downref_all( root, prg, allReverseCode );
 }
 
 
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 76c92ae3..242f4003 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -79,7 +79,7 @@ void tree_upref( Tree *tree )
 {
 	if ( tree != 0 )
 		tree->refs += 1;
-};
+}
 
 void tree_downref( Program *prg, Tree *tree )
 {
@@ -89,7 +89,7 @@ void tree_downref( Program *prg, Tree *tree )
 		if ( tree->refs == 0 )
 			tree_free( prg, tree );
 	}
-};
+}
 
 /* Find the first child of a tree. */
 Kid *tree_child( Program *prg, Tree *tree )
-- 
cgit v1.2.1


From 9a2d2bf5a68e3573dae8b8b4471367bd03335468 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 17:15:50 +0000
Subject: Tree downref needs a VM stack pointer. It can't be recursive.

---
 colm/bytecode.cpp   | 340 +++++++++++++++++++++++++++-------------------------
 colm/bytecode.h     |  13 +-
 colm/fsmcodegen.cpp |   2 -
 colm/fsmrun.cpp     |   6 +-
 colm/pdarun.cpp     |   8 +-
 colm/tree.cpp       |  16 +--
 6 files changed, 199 insertions(+), 186 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index f6f7f797..3a60faac 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -637,12 +637,12 @@ Tree *get_ptr_val_split( Program *prg, Pointer *ptr )
 	return split;
 }
 
-void list_free( Program *prg, List *list )
+void list_free( Program *prg, Tree **sp, List *list )
 {
 	ListEl *el = list->head;
 	while ( el != 0 ) {
 		ListEl *next = el->next;
-		tree_downref( prg, el->value );
+		tree_downref( prg, sp, el->value );
 		prg->listElPool.free( el );
 		el = next;
 	}
@@ -650,13 +650,13 @@ void list_free( Program *prg, List *list )
 }
 
 
-void map_free( Program *prg, Map *map )
+void map_free( Program *prg, Tree **sp, Map *map )
 {
 	MapEl *el = map->head;
 	while ( el != 0 ) {
 		MapEl *next = el->next;
-		tree_downref( prg, el->key );
-		tree_downref( prg, el->tree );
+		tree_downref( prg, sp, el->key );
+		tree_downref( prg, sp, el->tree );
 		prg->mapElPool.free( el );
 		el = next;
 	}
@@ -672,14 +672,14 @@ void stream_free( Program *prg, Stream *s )
 	prg->mapElPool.free( (MapEl*)s );
 }
 
-void downref_local_trees( Program *prg, Tree **frame, char *trees, long treesLen )
+void downref_local_trees( Program *prg, Tree **sp, Tree **frame, char *trees, long treesLen )
 {
 	for ( long i = 0; i < treesLen; i++ ) {
 		#ifdef COLM_LOG_BYTECODE
 		cerr << "local tree downref: " << (long)trees[i] << endl;
 		#endif
 
-		tree_downref( prg, local(trees[i]) );
+		tree_downref( prg, sp, local(trees[i]) );
 	}
 }
 
@@ -1627,12 +1627,12 @@ Program::Program( bool ctxDepParsing, RuntimeData *rtd )
 	falseVal = (Tree*)falseInt;
 }
 
-void Program::clearGlobal()
+void Program::clearGlobal( Tree **sp )
 {
 	/* Downref all the fields in the global object. */
 	for ( int g = 0; g < rtd->globalSize; g++ ) {
 		//assert( get_attr( global, g )->refs == 1 );
-		tree_downref( this, get_attr( global, g ) );
+		tree_downref( this, sp, get_attr( global, g ) );
 	}
 
 	/* Free the global object. */
@@ -1641,42 +1641,31 @@ void Program::clearGlobal()
 	treePool.free( global );
 }
 
-void Program::freshGlobal()
-{
-	if ( global != 0 )
-		clearGlobal();
-
-	Tree *tree = treePool.allocate();
-	tree->child = alloc_attrs( this, rtd->globalSize );
-	tree->refs = 1;
-	global = tree;
-}
-
-void Program::clear()
+void Program::clear( Tree **sp )
 {
 	#ifdef COLM_LOG_BYTECODE
 	cerr << "clearing the prg" << endl;
 	#endif
 
-	clearGlobal();
+	clearGlobal( sp );
 
 	/* Clear the heap. */
 	Kid *a = heap;
 	while ( a != 0 ) {
 		Kid *next = a->next;
-		tree_downref( this, a->tree );
+		tree_downref( this, sp, a->tree );
 		kidPool.free( a );
 		a = next;
 	}
 
 	//assert( trueVal->refs == 1 );
 	//assert( falseVal->refs == 1 );
-	tree_downref( this, trueVal );
-	tree_downref( this, falseVal );
+	tree_downref( this, sp, trueVal );
+	tree_downref( this, sp, falseVal );
 
-	tree_downref( this, (Tree*)stdinVal );
-	tree_downref( this, (Tree*)stdoutVal );
-	tree_downref( this, (Tree*)stderrVal );
+	tree_downref( this, sp, (Tree*)stdinVal );
+	tree_downref( this, sp, (Tree*)stdoutVal );
+	tree_downref( this, sp, (Tree*)stderrVal );
 
 	long kidLost = kidPool.numlost();
 	if ( kidLost )
@@ -1709,6 +1698,15 @@ void Program::clear()
 	memset( vm_stack, 0, sizeof(Tree*) * VM_STACK_SIZE);
 }
 
+void Program::allocGlobal()
+{
+	/* Alloc the global. */
+	Tree *tree = treePool.allocate();
+	tree->child = alloc_attrs( this, rtd->globalSize );
+	tree->refs = 1;
+	global = tree;
+}
+
 void Program::run()
 {
 	assert( sizeof(Int)      <= sizeof(Tree) );
@@ -1718,11 +1716,22 @@ void Program::run()
 	assert( sizeof(List)     <= sizeof(MapEl) );
 	assert( sizeof(Stream)   <= sizeof(MapEl) );
 
+	/* Allocate the global variable. */
+	allocGlobal();
+
+	/* 
+	 * Allocate the VM stack.
+	 */
+
 	//vm_stack = new Tree*[VM_STACK_SIZE];
 	vm_stack = (Tree**)mmap( 0, sizeof(Tree*)*VM_STACK_SIZE,
 		PROT_READ | PROT_WRITE, MAP_ANONYMOUS | MAP_PRIVATE, 0, 0 );
 	Tree **root = &vm_stack[VM_STACK_SIZE];
 
+	/*
+	 * Execute
+	 */
+
 	if ( rtd->rootCodeLen > 0 ) {
 		CodeVect reverseCode;
 		CodeVect *allReverseCode = new CodeVect;
@@ -1739,6 +1748,9 @@ void Program::run()
 			rcode_downref( root, this, allReverseCode->data );
 		delete allReverseCode;
 	}
+
+	/* Clear */
+	clear( root );
 }
 
 Execution::Execution( Program *prg, CodeVect &reverseCode,
@@ -1759,7 +1771,7 @@ Execution::Execution( Program *prg, CodeVect &reverseCode,
 	}
 }
 
-void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *rev )
+void rcode_downref_all( Tree **sp, Program *prg, CodeVect *rev )
 {
 	while ( rev->length() > 0 ) {
 		/* Read the length */
@@ -1772,14 +1784,14 @@ void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *rev )
 		prcode = rev->data + start;
 
 		/* Execute it. */
-		rcode_downref( stack_root, prg, prcode );
+		rcode_downref( sp, prg, prcode );
 
 		/* Backup over it. */
 		rev->tabLen -= len + 4;
 	}
 }
 
-void rcode_downref( Tree **stack_root, Program *prg, Code *instr )
+void rcode_downref( Tree **sp, Program *prg, Code *instr )
 {
 again:
 	switch ( *instr++ ) {
@@ -1796,10 +1808,10 @@ again:
 			cerr << "IN_PARSE_BKT " << parserId << endl;
 			#endif
 
-			parsed_downref( stack_root, prg, tree );
-			rcode_downref_all( stack_root, prg, (CodeVect*)wrev );
-			tree_downref( prg, stream );
-			tree_downref( prg, tree );
+			parsed_downref( sp, prg, tree );
+			rcode_downref_all( sp, prg, (CodeVect*)wrev );
+			tree_downref( prg, sp, stream );
+			tree_downref( prg, sp, tree );
 			delete (CodeVect*)wrev;
 			break;
 		}
@@ -1812,8 +1824,8 @@ again:
 			cerr << "IN_STREAM_PULL_BKT" << endl;
 			#endif
 
-			tree_downref( prg, stream );
-			tree_downref( prg, str );
+			tree_downref( prg, sp, stream );
+			tree_downref( prg, sp, str );
 			break;
 		}
 		case IN_STREAM_PUSH_BKT: {
@@ -1826,7 +1838,7 @@ again:
 			cerr << "IN_STREAM_PUSH_BKT" << endl;
 			#endif
 
-			tree_downref( prg, stream );
+			tree_downref( prg, sp, stream );
 			break;
 		}
 		case IN_LOAD_GLOBAL_BKT: {
@@ -1854,7 +1866,7 @@ again:
 			cerr << "IN_SET_FIELD_BKT " << field << endl;
 			#endif
 
-			tree_downref( prg, val );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_PTR_DEREF_BKT: {
@@ -1865,7 +1877,7 @@ again:
 			cerr << "IN_PTR_DEREF_BKT" << endl;
 			#endif
 
-			tree_downref( prg, ptr );
+			tree_downref( prg, sp, ptr );
 			break;
 		}
 		case IN_SET_TOKEN_DATA_BKT: {
@@ -1894,7 +1906,7 @@ again:
 			cerr << "IN_LIST_REMOVE_END_BKT" << endl;
 			#endif
 
-			tree_downref( prg, val );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_GET_LIST_MEM_BKT: {
@@ -1916,7 +1928,7 @@ again:
 			cerr << "IN_SET_LIST_MEM_BKT " << field << endl;
 			#endif
 
-			tree_downref( prg, val );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_MAP_INSERT_BKT: {
@@ -1929,7 +1941,7 @@ again:
 			cerr << "IN_MAP_INSERT_BKT" << endl;
 			#endif
 			
-			tree_downref( prg, key );
+			tree_downref( prg, sp, key );
 			break;
 		}
 		case IN_MAP_STORE_BKT: {
@@ -1941,8 +1953,8 @@ again:
 			cerr << "IN_MAP_STORE_BKT" << endl;
 			#endif
 
-			tree_downref( prg, key );
-			tree_downref( prg, val );
+			tree_downref( prg, sp, key );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_MAP_REMOVE_BKT: {
@@ -1954,8 +1966,8 @@ again:
 			cerr << "IN_MAP_REMOVE_BKT" << endl;
 			#endif
 
-			tree_downref( prg, key );
-			tree_downref( prg, val );
+			tree_downref( prg, sp, key );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_STOP: {
@@ -2105,7 +2117,7 @@ again:
 
 			Tree *tree = pop();
 			print_tree( sp, prg, tree );
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_PRINT_XML: {
@@ -2115,7 +2127,7 @@ again:
 
 			Tree *tree = pop();
 			xml_print_tree( sp, prg, tree );
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_LOAD_GLOBAL_R: {
@@ -2228,7 +2240,7 @@ again:
 			split_ref( sp, prg, &uiter->ref );
 			Tree *old = uiter->ref.kid->tree;
 			uiter->ref.kid->tree = t;
-			tree_downref( prg, old );
+			tree_downref( prg, sp, old );
 			break;
 		}
 		case IN_GET_LOCAL_R: {
@@ -2266,7 +2278,7 @@ again:
 			#endif
 
 			Tree *val = pop();
-			tree_downref( prg, local(field) );
+			tree_downref( prg, sp, local(field) );
 			set_local( frame, field, val );
 			break;
 		}
@@ -2331,7 +2343,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *val = get_field( obj, field );
 			tree_upref( val );
@@ -2347,7 +2359,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *split = get_field_split( prg, obj, field );
 			tree_upref( split );
@@ -2363,7 +2375,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *split = get_field_split( prg, obj, field );
 			tree_upref( split );
@@ -2384,7 +2396,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *split = get_field_split( prg, obj, field );
 			tree_upref( split );
@@ -2401,11 +2413,11 @@ again:
 
 			Tree *obj = pop();
 			Tree *val = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			/* Downref the old value. */
 			Tree *prev = get_field( obj, field );
-			tree_downref( prg, prev );
+			tree_downref( prg, sp, prev );
 
 			set_field( prg, obj, field, val );
 			break;
@@ -2420,7 +2432,7 @@ again:
 
 			Tree *obj = pop();
 			Tree *val = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			/* Save the old value, then set the field. */
 			Tree *prev = get_field( obj, field );
@@ -2446,11 +2458,11 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			/* Downref the old value. */
 			Tree *prev = get_field( obj, field );
-			tree_downref( prg, prev );
+			tree_downref( prg, sp, prev );
 
 			set_field( prg, obj, field, val );
 			break;
@@ -2470,7 +2482,7 @@ again:
 
 			/* Downref the old value. */
 			Tree *prev = get_field( obj, field );
-			tree_downref( prg, prev );
+			tree_downref( prg, sp, prev );
 
 			/* Set the field. */
 			set_field( prg, obj, field, val );
@@ -2485,7 +2497,7 @@ again:
 			#endif
 
 			Tree *val = pop();
-			tree_downref( prg, val );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_STR_ATOI: {
@@ -2498,7 +2510,7 @@ again:
 			Tree *integer = construct_integer( prg, res );
 			tree_upref( integer );
 			push( integer );
-			tree_downref( prg, (Tree*)str );
+			tree_downref( prg, sp, (Tree*)str );
 			break;
 		}
 		case IN_INT_TO_STR: {
@@ -2511,7 +2523,7 @@ again:
 			Tree *str = construct_string( prg, res );
 			tree_upref( str );
 			push( str );
-			tree_downref( prg, (Tree*) i );
+			tree_downref( prg, sp, (Tree*) i );
 			break;
 		}
 		case IN_CONCAT_STR: {
@@ -2524,8 +2536,8 @@ again:
 			Head *res = concat_str( s1->value, s2->value );
 			Tree *str = construct_string( prg, res );
 			tree_upref( str );
-			tree_downref( prg, (Tree*)s1 );
-			tree_downref( prg, (Tree*)s2 );
+			tree_downref( prg, sp, (Tree*)s1 );
+			tree_downref( prg, sp, (Tree*)s2 );
 			push( str );
 			break;
 		}
@@ -2539,7 +2551,7 @@ again:
 			Tree *tree = construct_integer( prg, res );
 			tree_upref( tree );
 			push( tree );
-			tree_downref( prg, (Tree*)str );
+			tree_downref( prg, sp, (Tree*)str );
 			break;
 		}
 		case IN_STR_UORD16: {
@@ -2552,7 +2564,7 @@ again:
 			Tree *tree = construct_integer( prg, res );
 			tree_upref( tree );
 			push( tree );
-			tree_downref( prg, (Tree*)str );
+			tree_downref( prg, sp, (Tree*)str );
 			break;
 		}
 
@@ -2566,7 +2578,7 @@ again:
 			Tree *res = construct_integer( prg, len );
 			tree_upref( res );
 			push( res );
-			tree_downref( prg, (Tree*)str );
+			tree_downref( prg, sp, (Tree*)str );
 			break;
 		}
 		case IN_JMP_FALSE: {
@@ -2580,7 +2592,7 @@ again:
 			Tree *tree = pop();
 			if ( test_false( prg, tree ) )
 				instr += dist;
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_JMP_TRUE: {
@@ -2594,7 +2606,7 @@ again:
 			Tree *tree = pop();
 			if ( !test_false( prg, tree ) )
 				instr += dist;
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_JMP: {
@@ -2630,8 +2642,8 @@ again:
 			Tree *val = r ? prg->falseVal : prg->trueVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 			break;
 		}
 		case IN_TST_NOT_EQL: {
@@ -2645,8 +2657,8 @@ again:
 			Tree *val = r ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 			break;
 		}
 		case IN_TST_LESS: {
@@ -2660,8 +2672,8 @@ again:
 			Tree *val = r < 0 ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 			break;
 		}
 		case IN_TST_LESS_EQL: {
@@ -2675,8 +2687,8 @@ again:
 			Tree *val = r <= 0 ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 		}
 		case IN_TST_GRTR: {
 			#ifdef COLM_LOG_BYTECODE
@@ -2689,8 +2701,8 @@ again:
 			Tree *val = r > 0 ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 			break;
 		}
 		case IN_TST_GRTR_EQL: {
@@ -2704,8 +2716,8 @@ again:
 			Tree *val = r >= 0 ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 			break;
 		}
 		case IN_TST_LOGICAL_AND: {
@@ -2721,8 +2733,8 @@ again:
 			Tree *val = r ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 			break;
 		}
 		case IN_TST_LOGICAL_OR: {
@@ -2738,8 +2750,8 @@ again:
 			Tree *val = r ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, o1 );
-			tree_downref( prg, o2 );
+			tree_downref( prg, sp, o1 );
+			tree_downref( prg, sp, o2 );
 			break;
 		}
 		case IN_NOT: {
@@ -2752,7 +2764,7 @@ again:
 			Tree *val = r ? prg->trueVal : prg->falseVal;
 			tree_upref( val );
 			push( val );
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 
@@ -2767,8 +2779,8 @@ again:
 			Tree *tree = construct_integer( prg, r );
 			tree_upref( tree );
 			push( tree );
-			tree_downref( prg, (Tree*)o1 );
-			tree_downref( prg, (Tree*)o2 );
+			tree_downref( prg, sp, (Tree*)o1 );
+			tree_downref( prg, sp, (Tree*)o2 );
 			break;
 		}
 		case IN_MULT_INT: {
@@ -2782,8 +2794,8 @@ again:
 			Tree *tree = construct_integer( prg, r );
 			tree_upref( tree );
 			push( tree );
-			tree_downref( prg, (Tree*)o1 );
-			tree_downref( prg, (Tree*)o2 );
+			tree_downref( prg, sp, (Tree*)o1 );
+			tree_downref( prg, sp, (Tree*)o2 );
 			break;
 		}
 		case IN_SUB_INT: {
@@ -2797,8 +2809,8 @@ again:
 			Tree *tree = construct_integer( prg, r );
 			tree_upref( tree );
 			push( tree );
-			tree_downref( prg, (Tree*)o1 );
-			tree_downref( prg, (Tree*)o2 );
+			tree_downref( prg, sp, (Tree*)o1 );
+			tree_downref( prg, sp, (Tree*)o2 );
 			break;
 		}
 		case IN_DUP_TOP: {
@@ -2852,7 +2864,7 @@ again:
 			Tree *res = tree_search( tree, id );
 			tree_upref( res );
 			push( res );
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_TRITER_ADVANCE: {
@@ -2939,7 +2951,7 @@ again:
 			split_iter_cur( sp, prg, iter );
 			Tree *old = tree_iter_deref_cur( iter );
 			set_triter_cur( iter, tree );
-			tree_downref( prg, old );
+			tree_downref( prg, sp, old );
 			break;
 		}
 		case IN_MATCH: {
@@ -2986,7 +2998,7 @@ again:
 				push( bindings[b] );
 			}
 
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_PARSE: {
@@ -3031,7 +3043,7 @@ again:
 			reverseCode.appendWord( (Word) string );
 			reverseCode.append( 9 );
 
-			tree_downref( prg, len );
+			tree_downref( prg, sp, len );
 			break;
 		}
 		case IN_STREAM_PULL_BKT: {
@@ -3044,8 +3056,8 @@ again:
 			#endif
 
 			undo_pull( prg, (Stream*)stream, string );
-			tree_downref( prg, stream );
-			tree_downref( prg, string );
+			tree_downref( prg, sp, stream );
+			tree_downref( prg, sp, string );
 			break;
 		}
 		case IN_STREAM_PUSH: {
@@ -3066,7 +3078,7 @@ again:
 			reverseCode.appendWord( len );
 			reverseCode.append( 9 );
 
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_STREAM_PUSH_BKT: {
@@ -3080,7 +3092,7 @@ again:
 			#endif
 
 			undo_stream_push( sp, prg, (Stream*)stream, len );
-			tree_downref( prg, stream );
+			tree_downref( prg, sp, stream );
 			break;
 		}
 		case IN_PARSE_BKT: {
@@ -3097,7 +3109,7 @@ again:
 			#endif
 
 			undo_parse( sp, prg, (Stream*)stream, parserId, tree, (CodeVect*)wrev );
-			tree_downref( prg, stream );
+			tree_downref( prg, sp, stream );
 			delete (CodeVect*)wrev;
 			break;
 		}
@@ -3161,7 +3173,7 @@ again:
 
 			Tree *result = make_token( sp, prg, parser, nargs );
 			for ( long i = 0; i < nargs; i++ )
-				tree_downref( prg, pop() );
+				tree_downref( prg, sp, pop() );
 			push( result );
 			break;
 		}
@@ -3175,7 +3187,7 @@ again:
 
 			Tree *result = make_tree( sp, prg, parser, nargs );
 			for ( long i = 0; i < nargs; i++ )
-				tree_downref( prg, pop() );
+				tree_downref( prg, sp, pop() );
 			push( result );
 			break;
 		}
@@ -3216,7 +3228,7 @@ again:
 			#endif
 
 			Pointer *ptr = (Pointer*)pop();
-			tree_downref( prg, (Tree*)ptr );
+			tree_downref( prg, sp, (Tree*)ptr );
 
 			Tree *dval = get_ptr_val( ptr );
 			tree_upref( dval );
@@ -3229,7 +3241,7 @@ again:
 			#endif
 
 			Pointer *ptr = (Pointer*)pop();
-			tree_downref( prg, (Tree*)ptr );
+			tree_downref( prg, sp, (Tree*)ptr );
 
 			Tree *dval = get_ptr_val_split( prg, ptr );
 			tree_upref( dval );
@@ -3269,7 +3281,7 @@ again:
 			tree_upref( dval );
 			push( dval );
 
-			tree_downref( prg, (Tree*)ptr );
+			tree_downref( prg, sp, (Tree*)ptr );
 			break;
 		}
 		case IN_REF_FROM_LOCAL: {
@@ -3337,7 +3349,7 @@ again:
 			Tree *str = construct_string( prg, data );
 			tree_upref( str );
 			push( str );
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_SET_TOKEN_DATA_WC: {
@@ -3351,8 +3363,8 @@ again:
 			string_free( prg, tree->tokdata );
 			tree->tokdata = head;
 
-			tree_downref( prg, tree );
-			tree_downref( prg, val );
+			tree_downref( prg, sp, tree );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_SET_TOKEN_DATA_WV: {
@@ -3373,8 +3385,8 @@ again:
 			rcodeUnitLen += 5;
 			reverseCode.append( rcodeUnitLen );
 
-			tree_downref( prg, tree );
-			tree_downref( prg, val );
+			tree_downref( prg, sp, tree );
+			tree_downref( prg, sp, val );
 			break;
 		}
 		case IN_SET_TOKEN_DATA_BKT: {
@@ -3389,7 +3401,7 @@ again:
 			Head *head = (Head*)oldval;
 			string_free( prg, tree->tokdata );
 			tree->tokdata = head;
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_GET_TOKEN_POS_R: {
@@ -3401,7 +3413,7 @@ again:
 			Tree *integer = construct_integer( prg, 0 );
 			tree_upref( integer );
 			push( integer );
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 
 			/* Requires a new implementation. */
 			assert( false );
@@ -3446,7 +3458,7 @@ again:
 			Tree *obj = pop();
 			Tree *val = pop();
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			list_append( prg, (List*)obj, val );
 			tree_upref( prg->trueVal );
@@ -3467,7 +3479,7 @@ again:
 			Tree *obj = pop();
 			Tree *val = pop();
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			list_append( prg, (List*)obj, val );
 			tree_upref( prg->trueVal );
@@ -3480,10 +3492,10 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *tree = list_remove_end( prg, (List*)obj );
-			tree_downref( prg, tree );
+			tree_downref( prg, sp, tree );
 			break;
 		}
 		case IN_LIST_REMOVE_END_WC: {
@@ -3492,7 +3504,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *end = list_remove_end( prg, (List*)obj );
 			push( end );
@@ -3504,7 +3516,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *end = list_remove_end( prg, (List*)obj );
 			push( end );
@@ -3528,7 +3540,7 @@ again:
 			read_tree( val );
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			list_append( prg, (List*)obj, val );
 			break;
@@ -3542,7 +3554,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *val = get_list_mem( list(obj), field );
 			tree_upref( val );
@@ -3558,7 +3570,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *val = get_list_mem_split( prg, list(obj), field );
 			tree_upref( val );
@@ -3574,7 +3586,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *val = get_list_mem_split( prg, list(obj), field );
 			tree_upref( val );
@@ -3595,7 +3607,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *res = get_list_mem_split( prg, list(obj), field );
 			tree_upref( res );
@@ -3611,11 +3623,11 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *val = pop();
 			Tree *existing = set_list_mem( list(obj), field, val );
-			tree_downref( prg, existing );
+			tree_downref( prg, sp, existing );
 			break;
 		}
 		case IN_SET_LIST_MEM_WV: {
@@ -3627,7 +3639,7 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *val = pop();
 			Tree *existing = set_list_mem( list(obj), field, val );
@@ -3652,10 +3664,10 @@ again:
 			#endif
 
 			Tree *obj = pop();
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			Tree *undid = set_list_mem( list(obj), field, val );
-			tree_downref( prg, undid );
+			tree_downref( prg, sp, undid );
 			break;
 		}
 		case IN_MAP_INSERT_WV: {
@@ -3667,7 +3679,7 @@ again:
 			Tree *val = pop();
 			Tree *key = pop();
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			bool inserted = map_insert( prg, (Map*)obj, key, val );
 			Tree *result = inserted ? prg->trueVal : prg->falseVal;
@@ -3687,8 +3699,8 @@ again:
 			reverseCode.append( rcodeUnitLen );
 
 			if ( ! inserted ) {
-				tree_downref( prg, key );
-				tree_downref( prg, val );
+				tree_downref( prg, sp, key );
+				tree_downref( prg, sp, val );
 			}
 			break;
 		}
@@ -3701,7 +3713,7 @@ again:
 			Tree *val = pop();
 			Tree *key = pop();
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 
 			bool inserted = map_insert( prg, (Map*)obj, key, val );
 			Tree *result = inserted ? prg->trueVal : prg->falseVal;
@@ -3709,8 +3721,8 @@ again:
 			push( result );
 
 			if ( ! inserted ) {
-				tree_downref( prg, key );
-				tree_downref( prg, val );
+				tree_downref( prg, sp, key );
+				tree_downref( prg, sp, val );
 			}
 			break;
 		}
@@ -3727,12 +3739,12 @@ again:
 			Tree *obj = pop();
 			if ( inserted ) {
 				Tree *val = map_uninsert( prg, (Map*)obj, key );
-				tree_downref( prg, key );
-				tree_downref( prg, val );
+				tree_downref( prg, sp, key );
+				tree_downref( prg, sp, val );
 			}
 
-			tree_downref( prg, obj );
-			tree_downref( prg, key );
+			tree_downref( prg, sp, obj );
+			tree_downref( prg, sp, key );
 			break;
 		}
 		case IN_MAP_STORE_WC: {
@@ -3749,10 +3761,10 @@ again:
 			tree_upref( result );
 			push( result );
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 			if ( existing != 0 ) {
-				tree_downref( prg, key );
-				tree_downref( prg, existing );
+				tree_downref( prg, sp, key );
+				tree_downref( prg, sp, existing );
 			}
 			break;
 		}
@@ -3780,10 +3792,10 @@ again:
 			reverseCode.append( rcodeUnitLen );
 			/* FLUSH */
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 			if ( existing != 0 ) {
-				tree_downref( prg, key );
-				tree_downref( prg, existing );
+				tree_downref( prg, sp, key );
+				tree_downref( prg, sp, existing );
 			}
 			break;
 		}
@@ -3799,12 +3811,12 @@ again:
 			Tree *obj = pop();
 			Tree *stored = map_unstore( prg, (Map*)obj, key, val );
 
-			tree_downref( prg, stored );
+			tree_downref( prg, sp, stored );
 			if ( val == 0 )
-				tree_downref( prg, key );
+				tree_downref( prg, sp, key );
 
-			tree_downref( prg, obj );
-			tree_downref( prg, key );
+			tree_downref( prg, sp, obj );
+			tree_downref( prg, sp, key );
 			break;
 		}
 		case IN_MAP_REMOVE_WC: {
@@ -3818,9 +3830,9 @@ again:
 
 			push( pair.val );
 
-			tree_downref( prg, obj );
-			tree_downref( prg, key );
-			tree_downref( prg, pair.key );
+			tree_downref( prg, sp, obj );
+			tree_downref( prg, sp, key );
+			tree_downref( prg, sp, pair.key );
 			break;
 		}
 		case IN_MAP_REMOVE_WV: {
@@ -3842,8 +3854,8 @@ again:
 			rcodeUnitLen += 9;
 			reverseCode.append( rcodeUnitLen );
 
-			tree_downref( prg, obj );
-			tree_downref( prg, key );
+			tree_downref( prg, sp, obj );
+			tree_downref( prg, sp, key );
 			break;
 		}
 		case IN_MAP_REMOVE_BKT: {
@@ -3862,7 +3874,7 @@ again:
 			if ( key != 0 )
 				map_unremove( prg, (Map*)obj, key, val );
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 			break;
 		}
 		case IN_MAP_LENGTH: {
@@ -3876,7 +3888,7 @@ again:
 			tree_upref( res );
 			push( res );
 
-			tree_downref( prg, obj );
+			tree_downref( prg, sp, obj );
 			break;
 		}
 		case IN_MAP_FIND: {
@@ -3890,8 +3902,8 @@ again:
 			tree_upref( result );
 			push( result );
 
-			tree_downref( prg, obj );
-			tree_downref( prg, key );
+			tree_downref( prg, sp, obj );
+			tree_downref( prg, sp, key );
 			break;
 		}
 		case IN_INIT_LOCALS: {
@@ -3917,7 +3929,7 @@ again:
 			#endif
 
 			FrameInfo *fi = &prg->rtd->frameInfo[frameId];
-			downref_local_trees( prg, frame, fi->trees, fi->treesLen );
+			downref_local_trees( prg, sp, frame, fi->trees, fi->treesLen );
 			popn( size );
 			break;
 		}
@@ -4028,7 +4040,7 @@ again:
 			#endif
 
 			FrameInfo *fi = &prg->rtd->frameInfo[fui->frameId];
-			downref_local_trees( prg, frame, fi->trees, fi->treesLen );
+			downref_local_trees( prg, sp, frame, fi->trees, fi->treesLen );
 
 			popn( fui->frameSize );
 			frame = (Tree**) pop();
@@ -4047,7 +4059,7 @@ again:
 			Tree *res = open_file( prg, name );
 			tree_upref( res );
 			push( res );
-			tree_downref( prg, name );
+			tree_downref( prg, sp, name );
 			break;
 		}
 		case IN_GET_STDIN: {
@@ -4056,7 +4068,7 @@ again:
 			#endif
 
 			/* Pop the root object. */
-			tree_downref( prg, pop() );
+			tree_downref( prg, sp, pop() );
 			if ( prg->stdinVal == 0 ) {
 				prg->stdinVal = open_stream_fd( prg, 0 );
 				tree_upref( (Tree*)prg->stdinVal );
diff --git a/colm/bytecode.h b/colm/bytecode.h
index d3ccd1d7..03010173 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -417,12 +417,12 @@ void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
 void parsed_downref( Tree **root, Program *prg, Tree *tree );
 Stream *open_stream( Program *prg, FILE *file );
 Tree *construct_string( Program *prg, Head *s );
-void list_free( Program *prg, List *list );
+void list_free( Program *prg, Tree **sp, List *list );
 void ignore_free( Program *prg, Tree *tree );
-void map_free( Program *prg, Map *map );
+void map_free( Program *prg, Tree **sp, Map *map );
 void stream_free( Program *prg, Stream *s );
 
-void tree_downref( Program *prg, Tree *tree );
+void tree_downref( Program *prg, Tree **sp, Tree *tree );
 void tree_upref( Tree *tree );
 Kid *tree_child( Program *prg, Tree *tree );
 Kid *tree_extract_child( Program *prg, Tree *tree );
@@ -575,9 +575,10 @@ struct Program
 	Tree *falseVal;
 
 	void run();
-	void clear();
-	void clearGlobal();
-	void freshGlobal();
+
+	void clear( Tree **sp );
+	void clearGlobal( Tree **sp );
+	void allocGlobal();
 
 	Kid *heap;
 
diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
index 027ac3b5..94a2307e 100644
--- a/colm/fsmcodegen.cpp
+++ b/colm/fsmcodegen.cpp
@@ -1062,9 +1062,7 @@ void FsmCodeGen::writeCode()
 		"int main( int argc, char **argv )\n"
 		"{\n"
 		"	Program program( true, &main_runtimeData );\n"
-		"	program.freshGlobal();\n"
 		"	program.run();\n"
-		"	program.clear();\n"
 		"	return 0;\n"
 		"}\n"
 		"\n";
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 23ec2242..9ab3b969 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -314,11 +314,11 @@ void FsmRun::sendBack( Kid *input )
 	Tree *lastBound = parser->bindings.top();
 	if ( lastBound == input->tree ) {
 		parser->bindings.pop();
-		tree_downref( prg, input->tree );
+		tree_downref( prg, parser->root, input->tree );
 	}
 
 	/* Downref the tree that was sent back and free the kid. */
-	tree_downref( prg, input->tree );
+	tree_downref( prg, parser->root, input->tree );
 	prg->kidPool.free( input );
 }
 
@@ -550,7 +550,7 @@ void PdaRun::sendBackIgnore()
 	fsmRun->sendBackIgnore( ignore );
 	while ( ignore != 0 ) {
 		Kid *next = ignore->next;
-		tree_downref( prg, ignore->tree );
+		tree_downref( prg, root, ignore->tree );
 		prg->kidPool.free( ignore );
 		ignore = next;
 	}
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 03e3f3b6..09197f67 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -51,7 +51,7 @@ void PdaRun::clean()
 	Kid *kid = stackTop;
 	while ( kid != 0 ) {
 		Kid *next = kid->next;
-		tree_downref( prg, kid->tree );
+		tree_downref( prg, root, kid->tree );
 		prg->kidPool.free( kid );
 		kid = next;
 	}
@@ -215,7 +215,7 @@ head:
 
 	alg->flags |= AF_REV_FREED;
 
-	tree_downref( prg, alg->parsed );
+	tree_downref( prg, sp, alg->parsed );
 	alg->parsed = 0;
 
 	if ( sp != root )
@@ -567,7 +567,7 @@ parseError:
 
 			if ( alg->parsed != 0 ) {
 				/* Get the lhs, it may have been reverted. */
-				tree_downref( prg, undoLel->tree );
+				tree_downref( prg, root, undoLel->tree );
 				undoLel->tree = alg->parsed;
 			}
 
@@ -613,7 +613,7 @@ parseError:
 			}
 
 			/* Free the reduced item. */
-			tree_downref( prg, undoLel->tree );
+			tree_downref( prg, root, undoLel->tree );
 			prg->kidPool.free( undoLel );
 			prg->algPool.free( alg );
 		}
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 242f4003..e3c23b59 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -25,16 +25,18 @@
 #include "fsmrun.h"
 #include "pdarun.h"
 
-void tree_free( Program *prg, Tree *tree )
+/* We can't make recursive calls here since the tree we are freeing may be
+ * very large. Need the VM stack. */
+void tree_free( Program *prg, Tree **sp, Tree *tree )
 {
 	LangElInfo *lelInfo = prg->rtd->lelInfo;
 	long genericId = lelInfo[tree->id].genericId;
 	if ( genericId > 0 ) {
 		GenericInfo *generic = &prg->rtd->genericInfo[genericId];
 		if ( generic->type == GEN_LIST )
-			list_free( prg, (List*)tree );
+			list_free( prg, sp, (List*)tree );
 		else if ( generic->type == GEN_MAP )
-			map_free( prg, (Map*)tree );
+			map_free( prg, sp, (Map*)tree );
 		else
 			assert(false);
 	}
@@ -57,7 +59,7 @@ void tree_free( Program *prg, Tree *tree )
 		else { 
 			if ( tree->alg != 0 ) {
 				//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
-				tree_downref( prg, tree->alg->parsed );
+				tree_downref( prg, sp, tree->alg->parsed );
 				prg->algPool.free( tree->alg );
 			}
 			string_free( prg, tree->tokdata );
@@ -65,7 +67,7 @@ void tree_free( Program *prg, Tree *tree )
 			Kid *child = tree->child;
 			while ( child != 0 ) {
 				Kid *next = child->next;
-				tree_downref( prg, child->tree );
+				tree_downref( prg, sp, child->tree );
 				prg->kidPool.free( child );
 				child = next;
 			}
@@ -81,13 +83,13 @@ void tree_upref( Tree *tree )
 		tree->refs += 1;
 }
 
-void tree_downref( Program *prg, Tree *tree )
+void tree_downref( Program *prg, Tree **sp, Tree *tree )
 {
 	if ( tree != 0 ) {
 		assert( tree->refs > 0 );
 		tree->refs -= 1;
 		if ( tree->refs == 0 )
-			tree_free( prg, tree );
+			tree_free( prg, sp, tree );
 	}
 }
 
-- 
cgit v1.2.1


From 49e328facffdfc383b7254fb01ac0740889b8275 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 20:12:59 +0000
Subject: The tree_free function is no longer recursive. Instead it uses the VM
 stack to store child trees that need to be freed.

---
 colm/bytecode.cpp | 35 ---------------------------------
 colm/bytecode.h   |  4 ----
 colm/tree.cpp     | 59 ++++++++++++++++++++++++++++++++++++++++++++++++-------
 3 files changed, 52 insertions(+), 46 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 3a60faac..14f8c4f2 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -637,41 +637,6 @@ Tree *get_ptr_val_split( Program *prg, Pointer *ptr )
 	return split;
 }
 
-void list_free( Program *prg, Tree **sp, List *list )
-{
-	ListEl *el = list->head;
-	while ( el != 0 ) {
-		ListEl *next = el->next;
-		tree_downref( prg, sp, el->value );
-		prg->listElPool.free( el );
-		el = next;
-	}
-	prg->mapElPool.free( (MapEl*)list );
-}
-
-
-void map_free( Program *prg, Tree **sp, Map *map )
-{
-	MapEl *el = map->head;
-	while ( el != 0 ) {
-		MapEl *next = el->next;
-		tree_downref( prg, sp, el->key );
-		tree_downref( prg, sp, el->tree );
-		prg->mapElPool.free( el );
-		el = next;
-	}
-	prg->mapElPool.free( (MapEl*)map );
-}
-
-void stream_free( Program *prg, Stream *s )
-{
-	delete s->scanner;
-	delete s->in;
-	if ( s->file != 0 )
-		fclose( s->file );
-	prg->mapElPool.free( (MapEl*)s );
-}
-
 void downref_local_trees( Program *prg, Tree **sp, Tree **frame, char *trees, long treesLen )
 {
 	for ( long i = 0; i < treesLen; i++ ) {
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 03010173..2f0ab499 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -417,10 +417,6 @@ void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
 void parsed_downref( Tree **root, Program *prg, Tree *tree );
 Stream *open_stream( Program *prg, FILE *file );
 Tree *construct_string( Program *prg, Head *s );
-void list_free( Program *prg, Tree **sp, List *list );
-void ignore_free( Program *prg, Tree *tree );
-void map_free( Program *prg, Tree **sp, Map *map );
-void stream_free( Program *prg, Stream *s );
 
 void tree_downref( Program *prg, Tree **sp, Tree *tree );
 void tree_upref( Tree *tree );
diff --git a/colm/tree.cpp b/colm/tree.cpp
index e3c23b59..3f3fc67b 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -25,18 +25,52 @@
 #include "fsmrun.h"
 #include "pdarun.h"
 
+#define push(i) (*(--sp) = (i))
+#define pop() (*sp++)
+
+void stream_free( Program *prg, Stream *s )
+{
+	delete s->scanner;
+	delete s->in;
+	if ( s->file != 0 )
+		fclose( s->file );
+	prg->mapElPool.free( (MapEl*)s );
+}
+
 /* We can't make recursive calls here since the tree we are freeing may be
  * very large. Need the VM stack. */
 void tree_free( Program *prg, Tree **sp, Tree *tree )
 {
+	Tree **top = sp;
+
+free_tree:
 	LangElInfo *lelInfo = prg->rtd->lelInfo;
 	long genericId = lelInfo[tree->id].genericId;
 	if ( genericId > 0 ) {
 		GenericInfo *generic = &prg->rtd->genericInfo[genericId];
-		if ( generic->type == GEN_LIST )
-			list_free( prg, sp, (List*)tree );
-		else if ( generic->type == GEN_MAP )
-			map_free( prg, sp, (Map*)tree );
+		if ( generic->type == GEN_LIST ) {
+			List *list = (List*) tree;
+			ListEl *el = list->head;
+			while ( el != 0 ) {
+				ListEl *next = el->next;
+				push( el->value );
+				prg->listElPool.free( el );
+				el = next;
+			}
+			prg->mapElPool.free( (MapEl*)list );
+		}
+		else if ( generic->type == GEN_MAP ) {
+			Map *map = (Map*)tree;
+			MapEl *el = map->head;
+			while ( el != 0 ) {
+				MapEl *next = el->next;
+				push( el->key );
+				push( el->tree );
+				prg->mapElPool.free( el );
+				el = next;
+			}
+			prg->mapElPool.free( (MapEl*)map );
+		}
 		else
 			assert(false);
 	}
@@ -50,7 +84,7 @@ void tree_free( Program *prg, Tree **sp, Tree *tree )
 			prg->treePool.free( tree );
 		else if ( tree->id == LEL_ID_PTR ) {
 			//Pointer *ptr = (Pointer*)tree;
-			//tree_downref( prg, ptr->value->tree );
+			//push( ptr->value->tree );
 			//prg->kidPool.free( ptr->value );
 			prg->treePool.free( tree );
 		}
@@ -59,7 +93,7 @@ void tree_free( Program *prg, Tree **sp, Tree *tree )
 		else { 
 			if ( tree->alg != 0 ) {
 				//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
-				tree_downref( prg, sp, tree->alg->parsed );
+				push( tree->alg->parsed );
 				prg->algPool.free( tree->alg );
 			}
 			string_free( prg, tree->tokdata );
@@ -67,7 +101,7 @@ void tree_free( Program *prg, Tree **sp, Tree *tree )
 			Kid *child = tree->child;
 			while ( child != 0 ) {
 				Kid *next = child->next;
-				tree_downref( prg, sp, child->tree );
+				push( child->tree );
 				prg->kidPool.free( child );
 				child = next;
 			}
@@ -75,6 +109,17 @@ void tree_free( Program *prg, Tree **sp, Tree *tree )
 			prg->treePool.free( tree );
 		}
 	}
+
+	/* Any trees to downref? */
+	while ( sp != top ) {
+		tree = pop();
+		if ( tree != 0 ) {
+			assert( tree->refs > 0 );
+			tree->refs -= 1;
+			if ( tree->refs == 0 )
+				goto free_tree;
+		}
+	}
 }
 
 void tree_upref( Tree *tree )
-- 
cgit v1.2.1


From 7a884f01ea1748c12850402f388f284f5695b056 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 21:44:48 +0000
Subject: The iter_find function needs to use tree_child() to find the first
 child.

---
 colm/bytecode.cpp | 28 ++++++++++++++++------------
 1 file changed, 16 insertions(+), 12 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 14f8c4f2..76a4366b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -676,23 +676,27 @@ void iter_find( Program *prg, Tree **&sp, TreeIter *iter, bool tryFirst )
 {
 	bool anyTree = iter->searchId == prg->rtd->anyId;
 	Tree **top = iter->stackRoot;
+	Kid *child;
 
 rec_call:
 	if ( tryFirst && ( iter->ref.kid->tree->id == iter->searchId || anyTree ) )
 		return;
-	else if ( iter->ref.kid->tree->child != 0 ) {
-		push( (SW) iter->ref.next );
-		push( (SW) iter->ref.kid );
-		iter->ref.kid = iter->ref.kid->tree->child;
-		iter->ref.next = (Ref*)ptop();
-		while ( iter->ref.kid != 0 ) {
-			tryFirst = true;
-			goto rec_call;
-			rec_return:
-			iter->ref.kid = iter->ref.kid->next;
+	else {
+		child = tree_child( prg, iter->ref.kid->tree );
+		if ( child != 0 ) {
+			push( (SW) iter->ref.next );
+			push( (SW) iter->ref.kid );
+			iter->ref.kid = child;
+			iter->ref.next = (Ref*)ptop();
+			while ( iter->ref.kid != 0 ) {
+				tryFirst = true;
+				goto rec_call;
+				rec_return:
+				iter->ref.kid = iter->ref.kid->next;
+			}
+			iter->ref.kid = (Kid*)pop();
+			iter->ref.next = (Ref*)pop();
 		}
-		iter->ref.kid = (Kid*)pop();
-		iter->ref.next = (Ref*)pop();
 	}
 
 	if ( top != ptop() )
-- 
cgit v1.2.1


From cd346f2b361b327ad68f3efb21a8bb32a214a219 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 21:55:59 +0000
Subject: Add unknown_id to the destructor declarator_id forms.

In preproc we need to supply __builtin_va_list.
---
 test/cxx/cxx.lm  | 11 +++++++++++
 test/cxx/preproc |  1 +
 2 files changed, 12 insertions(+)

diff --git a/test/cxx/cxx.lm b/test/cxx/cxx.lm
index 560bfde2..cf0d452b 100644
--- a/test/cxx/cxx.lm
+++ b/test/cxx/cxx.lm
@@ -1330,6 +1330,10 @@ def declarator_id_forms
 	{
 		lhs.lookupId = lookup_id in r4
 	}
+|	[root_qual_opt nested_name_specifier_opt '~' unknown_id]
+	{
+		lhs.lookupId = lookup_id in r4
+	}
 
 def type_id
 	lookup_id lookupId
@@ -2161,3 +2165,10 @@ start S = parse start( stdin )
 #printNamespace()
 #print( '***** SUCCESS *****\n' )
 #print_xml( S )
+#for DI: declarator_id in S {
+#	if match DI 
+#		[root_qual_opt nested_name_specifier_opt '~' UID:unknown_id]
+#	{
+#		print( UID, '\n' )
+#	}
+#}
diff --git a/test/cxx/preproc b/test/cxx/preproc
index ed708599..2661a197 100755
--- a/test/cxx/preproc
+++ b/test/cxx/preproc
@@ -1,4 +1,5 @@
 #!/bin/bash
 #
 
+echo 'struct __builtin_va_list {};'
 g++ -E -undef -D'__attribute__(xyz)=' "$@" | sed 's/#.*$//' | grep -v '^[ \t]*$'
-- 
cgit v1.2.1


From c6fa8907625eaa47cd57a04e595f1f9efa295248 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 23:19:48 +0000
Subject: Moved a lot of code from bytecode.cpp to tree.cpp.

---
 colm/bytecode.cpp | 1372 +----------------------------------------------------
 colm/bytecode.h   |   73 ++-
 colm/pdarun.cpp   |   15 +-
 colm/tree.cpp     | 1317 +++++++++++++++++++++++++++++++++++++++++++++++++-
 4 files changed, 1398 insertions(+), 1379 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 76a4366b..d5c24ecd 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -49,6 +49,13 @@ using std::endl;
 	i = ((uchar) *instr++); \
 } while(0)
 
+#define read_word_p( i, p ) do { \
+	i = ((Word)  p[0]); \
+	i |= ((Word) p[1]) << 8; \
+	i |= ((Word) p[2]) << 16; \
+	i |= ((Word) p[3]) << 24; \
+} while(0)
+
 #define read_word( i ) do { \
 	i = ((Word) *instr++); \
 	i |= ((Word) *instr++) << 8; \
@@ -70,134 +77,7 @@ using std::endl;
 	i |= ((Word) *instr++) << 8; \
 } while(0)
 
-static Tree **vm_stack;
-
-Kid *alloc_attrs( Program *prg, long length )
-{
-	Kid *cur = 0;
-	for ( long i = 0; i < length; i++ ) {
-		Kid *next = cur;
-		cur = prg->kidPool.allocate();
-		cur->next = next;
-	}
-	return cur;
-}
-
-void free_attrs( Program *prg, Kid *attrs )
-{
-	Kid *cur = attrs;
-	while ( cur != 0 ) {
-		Kid *next = cur->next;
-		prg->kidPool.free( cur );
-		cur = next;
-	}
-}
-
-void set_attr( Tree *tree, long pos, Tree *val )
-{
-	Kid *cur = tree->child;
-	for ( long i = 0; i < pos; i++ )
-		cur = cur->next;
-	cur->tree = val;
-}
-
-Tree *get_attr( Tree *tree, long pos )
-{
-	Kid *cur = tree->child;
-	for ( long i = 0; i < pos; i++ )
-		cur = cur->next;
-	return cur->tree;
-}
-
-Kid *copy_obj_data( Program *prg, long length, Kid *src )
-{
-	Kid *cur = 0;
-	for ( long i = 0; i < length; i++ ) {
-		Kid *next = cur;
-		cur = prg->kidPool.allocate();
-		cur->next = next;
-	}
-
-	Kid *dest = cur;
-	for ( long i = 0; i < length; i++ ) {
-		dest->tree = src->tree;
-		dest = dest->next;
-		src = src->next;
-	}
-	return cur;
-}
-
-Kid *kid_list_concat( Kid *list1, Kid *list2 )
-{
-	if ( list1 == 0 )
-		return list2;
-	else if ( list2 == 0 )
-		return list1;
-
-	Kid *dest = list1;
-	while ( dest->next != 0 )
-		dest = dest->next;
-	dest->next = list2;
-	return list1;
-}
-
 /* Type conversions. */
-List *list( Tree *tree ) { return (List*) tree; }
-Map *map( Tree *tree )  { return (Map*) tree; }
-Str *str( Tree *tree )  { return (Str*) tree; }
-
-void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter );
-Tree *split_tree( Program *prg, Tree *t );
-Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
-
-Stream *open_stream_file( Program *prg, FILE *file )
-{
-	Stream *res = (Stream*)prg->mapElPool.allocate();
-	res->id = LEL_ID_STREAM;
-	res->file = file;
-	res->in = new InputStreamFile( file );
-	res->scanner = new FsmRun( prg );
-	res->scanner->attachInputStream( res->in );
-	return res;
-}
-
-Stream *open_stream_fd( Program *prg, long fd )
-{
-	Stream *res = (Stream*)prg->mapElPool.allocate();
-	res->id = LEL_ID_STREAM;
-	res->in = new InputStreamFD( fd );
-	res->scanner = new FsmRun( prg );
-	res->scanner->attachInputStream( res->in );
-	return res;
-}
-
-Tree *open_file( Program *prg, Tree *name )
-{
-	Head *head = ((Str*)name)->value;
-	FILE *file = fopen( string_data(head), "rb" );
-	Tree *res = 0;
-
-	if ( file != 0 ) {
-		res = (Tree*) open_stream_file( prg, file );
-		res = prg->treePool.allocate();
-		res->id = LEL_ID_STREAM;
-		((Stream *)res)->file = file;
-	}
-
-	return res;
-}
-
-void check_parse_tree( Tree *tree )
-{
-	if ( tree->refs != 1 )
-		cerr << "tree->refs: " << tree->refs << endl;
-	
-	Kid *child = tree->child;
-	while ( child != 0 ) {
-		check_parse_tree( child->tree );
-		child = child->next;
-	}
-}
 
 void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 {
@@ -237,82 +117,6 @@ void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 	}
 }
 
-Tree *make_token( Tree **root, Program *prg, PdaRun *parser, long nargs )
-{
-	Tree **const sp = root;
-	Tree **base = ptop() + nargs;
-
-	Int *idInt = (Int*)base[-1];
-	Str *textStr = (Str*)base[-2];
-
-	long id = idInt->value;
-	Head *tokdata = string_copy( prg, textStr->value );
-
-	LangElInfo *lelInfo = prg->rtd->lelInfo;
-	Tree *tree;
-
-	if ( lelInfo[id].ignore ) {
-		tree = prg->treePool.allocate();
-		tree->refs = 1;
-		tree->id = id;
-		tree->tokdata = tokdata;
-	}
-	else {
-		long objectLength = lelInfo[id].objectLength;
-		Kid *attrs = alloc_attrs( prg, objectLength );
-
-		tree = prg->treePool.allocate();
-		tree->id = id;
-		tree->refs = 1;
-		tree->tokdata = tokdata;
-
-		tree->child = attrs;
-
-		assert( nargs-2 <= objectLength );
-		for ( long id = 0; id < nargs-2; id++ ) {
-			set_attr( tree, id, base[-3-id] );
-			tree_upref( get_attr( tree, id) );
-		}
-	}
-	return tree;
-}
-
-Tree *make_tree( Tree **root, Program *prg, PdaRun *parser, int nargs )
-{
-	Tree **const sp = root;
-	Tree **base = ptop() + nargs;
-
-	Int *idInt = (Int*)base[-1];
-
-	long id = idInt->value;
-	LangElInfo *lelInfo = prg->rtd->lelInfo;
-
-	Tree *tree = prg->treePool.allocate();
-	tree->id = id;
-	tree->refs = 1;
-
-	long objectLength = lelInfo[id].objectLength;
-	Kid *attrs = alloc_attrs( prg, objectLength );
-
-	Kid *last = 0, *child = 0;
-	for ( long id = 0; id < nargs-1; id++ ) {
-		Kid *kid = prg->kidPool.allocate();
-		kid->tree = base[-2-id];
-		tree_upref( kid->tree );
-
-		if ( last == 0 )
-			child = kid;
-		else
-			last->next = kid;
-
-		last = kid;
-	}
-
-	tree->child = kid_list_concat( attrs, child );
-
-	return tree;
-}
-
 Tree *parse( Tree **&sp, Program *prg, Stream *stream, 
 		long parserId, long stopId, CodeVect *&cv )
 {
@@ -341,12 +145,7 @@ Tree *stream_pull( Program *prg, Stream *stream, Tree *length )
 {
 	long len = ((Int*)length)->value;
 	Head *tokdata = stream->scanner->extractToken( len );
-
-	Str *str = (Str*) prg->treePool.allocate();
-	str->id = LEL_ID_STR;
-	str->value = tokdata;
-
-	return (Tree*)str;
+	return construct_string( prg, tokdata );
 }
 
 void undo_pull( Program *prg, Stream *stream, Tree *str )
@@ -369,246 +168,6 @@ void undo_stream_push( Tree **&sp, Program *prg, Stream *stream, Word len )
 	stream->scanner->undoStreamPush( len );
 }
 
-
-void print_str( Head *str )
-{
-	cout.write( (char*)(str->data), str->length );
-}
-
-void print_ignore_list( Tree **&sp, Program *prg, Tree *tree )
-{
-	Kid *ignore = tree_ignore( prg, tree );
-
-	/* Record the root of the stack and push everything. */
-	Tree **root = ptop();
-	while ( tree_is_ignore( prg, ignore ) ) {
-		push( (SW)ignore );
-		ignore = ignore->next;
-	}
-
-	/* Pop them off and print. */
-	while ( ptop() != root ) {
-		ignore = (Kid*) pop();
-		print_tree( sp, prg, ignore->tree );
-	}
-}
-
-void print_kid( ostream &out, Tree **&sp, Program *prg, Kid *kid, bool printIgnore )
-{
-	Tree **root = ptop();
-	Kid *child;
-
-rec_call:
-	/* If not currently skipping ignore data, then print it. Ignore data can
-	 * be associated with terminals and nonterminals. */
-	if ( printIgnore && tree_ignore( prg, kid->tree ) != 0 ) {
-		/* Ignorelists are reversed. */
-		print_ignore_list( sp, prg, kid->tree );
-		printIgnore = false;
-	}
-
-	if ( kid->tree->id < prg->rtd->firstNonTermId ) {
-		/* Always turn on ignore printing when we get to a token. */
-		printIgnore = true;
-
-		if ( kid->tree->id == LEL_ID_INT )
-			out << ((Int*)kid->tree)->value;
-		else if ( kid->tree->id == LEL_ID_BOOL ) {
-			if ( ((Int*)kid->tree)->value )
-				out << "true";
-			else
-				out << "false";
-		}
-		else if ( kid->tree->id == LEL_ID_PTR )
-			out << '#' << (void*) ((Pointer*)kid->tree)->value;
-		else if ( kid->tree->id == LEL_ID_STR )
-			print_str( ((Str*)kid->tree)->value );
-		else if ( kid->tree->id == LEL_ID_STREAM )
-			out << '#' << (void*) ((Stream*)kid->tree)->file;
-		else if ( kid->tree->tokdata != 0 && 
-				string_length( kid->tree->tokdata ) > 0 )
-		{
-			out.write( string_data( kid->tree->tokdata ), 
-					string_length( kid->tree->tokdata ) );
-		}
-	}
-	else {
-		/* Non-terminal. */
-		child = tree_child( prg, kid->tree );
-		if ( child != 0 ) {
-			push( (SW)kid );
-			kid = child;
-			while ( kid != 0 ) {
-				goto rec_call;
-				rec_return:
-				kid = kid->next;
-			}
-			kid = (Kid*)pop();
-		}
-	}
-
-	if ( ptop() != root )
-		goto rec_return;
-}
-
-void print_tree( Tree **&sp, Program *prg, Tree *tree )
-{
-	if ( tree == 0 )
-		cout << "NIL";
-	else {
-		Kid kid;
-		kid.tree = tree;
-		kid.next = 0;
-		print_kid( cout, sp, prg, &kid, false );
-	}
-}
-
-void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree )
-{
-	if ( tree == 0 )
-		cout << "NIL";
-	else {
-		Kid kid;
-		kid.tree = tree;
-		kid.next = 0;
-		print_kid( out, sp, prg, &kid, false );
-	}
-}
-
-void xml_escape_data( const char *data, long len )
-{
-	for ( int i = 0; i < len; i++ ) {
-		if ( 32 <= data[i] && data[i] <= 126 )
-			cout << data[i];
-		else
-			cout << "&#" << ((unsigned)data[i]) << ';';
-	}
-}
-
-void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth )
-{
-	Tree **root = ptop();
-	int i = 0;
-
-rec_call:
-	for ( i = 0; i < depth; i++ )
-		cout << "  ";
-
-	if ( kid->tree == 0 )
-		cout << "NIL" << endl;
-	else {
-		cout << '<' << prg->rtd->lelInfo[kid->tree->id].name;
-		if ( kid->tree->child != 0 ) {
-			cout << '>' << endl;
-			push( (SW) kid );
-			kid = kid->tree->child;
-			while ( kid != 0 ) {
-				depth++;
-				goto rec_call;
-				rec_return:
-				depth--;
-				kid = kid->next;
-
-				/* If the parent kid is a repeat then skip this node and go
-				 * right to the first child (repeated item). */
-				if ( prg->rtd->lelInfo[((Kid*)top())->tree->id].repeat )
-					kid = kid->tree->child;
-			}
-			kid = (Kid*) pop();
-
-			for ( i = 0; i < depth; i++ )
-				cout << "  ";
-			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
-		}
-		else if ( kid->tree->id == LEL_ID_PTR ) {
-			cout << '>' << (void*)((Pointer*)kid->tree)->value << 
-					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
-		}
-		else if ( kid->tree->id == LEL_ID_BOOL ) {
-			if ( ((Int*)kid->tree)->value )
-				cout << ">true</";
-			else
-				cout << ">false</";
-			cout << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
-		}
-		else if ( kid->tree->id == LEL_ID_INT ) {
-			cout << '>' << ((Int*)kid->tree)->value << 
-					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
-		}
-		else if ( kid->tree->id == LEL_ID_STR ) {
-			Head *head = (Head*) ((Str*)kid->tree)->value;
-
-			cout << '>';
-			xml_escape_data( (char*)(head->data), head->length );
-			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
-		}
-		else if ( 0 < kid->tree->id && kid->tree->id < prg->rtd->firstNonTermId &&
-				kid->tree->tokdata != 0 && 
-				string_length( kid->tree->tokdata ) > 0 && 
-				!prg->rtd->lelInfo[kid->tree->id].literal )
-		{
-			cout << '>';
-			xml_escape_data( string_data( kid->tree->tokdata ), 
-					string_length( kid->tree->tokdata ) );
-			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
-		}
-		else
-			cout << "/>" << endl;
-	}
-
-	if ( ptop() != root )
-		goto rec_return;
-}
-
-void xml_print_tree( Tree **&sp, Program *prg, Tree *tree )
-{
-	Kid kid;
-	kid.tree = tree;
-	kid.next = 0;
-	xml_print_kid( sp, prg, &kid, 0 );
-}
-
-Tree *get_rhs_el( Program *prg, Tree *lhs, long position )
-{
-	Kid *pos = tree_child( prg, lhs );
-	while ( position > 0 ) {
-		pos = pos->next;
-		position -= 1;
-	}
-	return pos->tree;
-}
-
-Tree **alloc_obj_data( long length )
-{
-	Tree **attrs = 0;
-	if ( length > 0 ) {
-		attrs = new Tree*[length];
-		memset( attrs, 0, sizeof(Tree*)*length );
-	}
-	return attrs;
-}
-
-void set_field( Program *prg, Tree *tree, long field, Tree *value )
-{
-	assert( tree->refs == 1 );
-	if ( value != 0 )
-		assert( value->refs >= 1 );
-	set_attr( tree, field, value );
-}
-
-Tree *get_field( Tree *tree, Word field )
-{
-	return get_attr( tree, field );
-}
-
-Tree *get_field_split( Program *prg, Tree *tree, Word field )
-{
-	Tree *val = get_attr( tree, field );
-	Tree *split = split_tree( prg, val );
-	set_attr( tree, field, split );
-	return split;
-}
-
 void set_local( Tree **frame, long field, Tree *tree )
 {
 	if ( tree != 0 )
@@ -624,19 +183,6 @@ Tree *get_local_split( Program *prg, Tree **frame, long field )
 	return split;
 }
 
-Tree *get_ptr_val( Pointer *ptr )
-{
-	return ptr->value->tree;
-}
-
-Tree *get_ptr_val_split( Program *prg, Pointer *ptr )
-{
-	Tree *val = ptr->value->tree;
-	Tree *split = split_tree( prg, val );
-	ptr->value->tree = split;
-	return split;
-}
-
 void downref_local_trees( Program *prg, Tree **sp, Tree **frame, char *trees, long treesLen )
 {
 	for ( long i = 0; i < treesLen; i++ ) {
@@ -658,11 +204,6 @@ void upref_uiter_args( Tree **frame, long nargs )
 	}
 }
 
-void set_triter_cur( TreeIter *iter, Tree *tree )
-{
-	iter->ref.kid->tree = tree;
-}
-
 UserIter *uiter_create( Tree **&sp, Program *prg, FunctionInfo *fi, long searchId )
 {
 	pushn( sizeof(UserIter) / sizeof(Word) );
@@ -672,141 +213,6 @@ UserIter *uiter_create( Tree **&sp, Program *prg, FunctionInfo *fi, long searchI
 	return uiter;
 }
 
-void iter_find( Program *prg, Tree **&sp, TreeIter *iter, bool tryFirst )
-{
-	bool anyTree = iter->searchId == prg->rtd->anyId;
-	Tree **top = iter->stackRoot;
-	Kid *child;
-
-rec_call:
-	if ( tryFirst && ( iter->ref.kid->tree->id == iter->searchId || anyTree ) )
-		return;
-	else {
-		child = tree_child( prg, iter->ref.kid->tree );
-		if ( child != 0 ) {
-			push( (SW) iter->ref.next );
-			push( (SW) iter->ref.kid );
-			iter->ref.kid = child;
-			iter->ref.next = (Ref*)ptop();
-			while ( iter->ref.kid != 0 ) {
-				tryFirst = true;
-				goto rec_call;
-				rec_return:
-				iter->ref.kid = iter->ref.kid->next;
-			}
-			iter->ref.kid = (Kid*)pop();
-			iter->ref.next = (Ref*)pop();
-		}
-	}
-
-	if ( top != ptop() )
-		goto rec_return;
-	
-	iter->ref.kid = 0;
-}
-
-Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter )
-{
-	assert( iter->stackSize == iter->stackRoot - ptop() );
-
-	if ( iter->ref.kid == 0 ) {
-		/* Kid is zero, start from the root. */
-		iter->ref = iter->rootRef;
-		iter_find( prg, sp, iter, true );
-	}
-	else {
-		/* Have a previous item, continue searching from there. */
-		iter_find( prg, sp, iter, false );
-	}
-
-	iter->stackSize = iter->stackRoot - ptop();
-
-	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
-}
-
-Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter )
-{
-	assert( iter->stackSize == iter->stackRoot - ptop() );
-
-	if ( iter->ref.kid == 0 ) {
-		/* Kid is zero, start from the first child. */
-		if ( iter->rootRef.kid->tree->child == 0 ) {
-			iter->ref.kid = 0;
-			iter->ref.next = 0;
-		}
-		else {
-			push( (SW) iter->rootRef.next );
-			push( (SW) iter->rootRef.kid );
-			iter->ref.kid = iter->rootRef.kid->tree->child;
-			iter->ref.next = (Ref*)ptop();
-		}
-	}
-	else {
-		iter->ref.kid = iter->ref.kid->next;
-	}
-
-	bool anyTree = iter->searchId == prg->rtd->anyId;
-	if ( ! anyTree ) {
-		/* Have a previous item, go to the next sibling. */
-		while ( iter->ref.kid != 0 && iter->ref.kid->tree->id != iter->searchId ) {
-			iter->ref.kid = iter->ref.kid->next;
-		}
-	}
-
-	iter->stackSize = iter->stackRoot - ptop();
-
-	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
-}
-
-Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter )
-{
-	assert( iter->stackSize == iter->stackRoot - ptop() );
-
-	if ( iter->ref.kid == 0 ) {
-		/* Kid is zero, start from the first child. */
-		if ( iter->rootRef.kid->tree->child == 0 ) {
-			iter->ref.kid = 0;
-			iter->ref.next = 0;
-		}
-		else {
-			push( (SW) iter->rootRef.next );
-			push( (SW) iter->rootRef.kid );
-
-			Kid *last = iter->rootRef.kid->tree->child;
-			while ( last->next != 0 )
-				last = last->next;
-
-			iter->ref.kid = last;
-			iter->ref.next = (Ref*)ptop();
-		}
-	}
-	else {
-		/* Have a previous item, go to the prev sibling. */
-		Kid *wasAt = iter->ref.kid;
-		Kid *parent = (Kid*) top();
-		Kid *cur = 0, *next = parent->tree->child;
-
-		while ( next != wasAt ) {
-			cur = next;
-			next = next->next;
-		}
-
-		iter->ref.kid = cur;
-	}
-
-	bool anyTree = iter->searchId == prg->rtd->anyId;
-	if ( ! anyTree ) {
-		/* Have a previous item, go to the next sibling. */
-		while ( iter->ref.kid != 0 && iter->ref.kid->tree->id != iter->searchId ) {
-			iter->ref.kid = iter->ref.kid->next;
-		}
-	}
-
-	iter->stackSize = iter->stackRoot - ptop();
-
-	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
-}
-
 void tree_iter_destroy( Tree **&sp, TreeIter *iter )
 {
 	long curStackSize = iter->stackRoot - ptop();
@@ -828,746 +234,6 @@ void user_iter_destroy( Tree **&sp, UserIter *uiter )
 	popn( argSize );
 }
 
-Tree *tree_iter_deref_cur( TreeIter *iter )
-{
-	return iter->ref.kid == 0 ? 0 : iter->ref.kid->tree;
-}
-
-Tree *tree_search( Kid *kid, long id )
-{
-	if ( kid->tree->id == id )
-		return kid->tree;
-
-	Tree *res = 0;
-	if ( kid->tree->child != 0 )
-		res = tree_search( kid->tree->child, id );
-	
-	if ( res == 0 && kid->next != 0 )
-		res = tree_search( kid->next, id );
-
-	return res;	
-}
-
-Tree *tree_search( Tree *tree, long id )
-{
-	Tree *res = 0;
-	if ( tree->id == id )
-		res = tree;
-	else if ( tree->child != 0 )
-		res = tree_search( tree->child, id );
-	return res;
-}
-
-Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
-{
-	assert( tree->refs >= 2 );
-
-	/* Need to keep a lookout for next down. If 
-	 * copying it, return the copy. */
-	Tree *newTree = prg->treePool.allocate();
-
-	newTree->id = tree->id;
-	newTree->tokdata = string_copy( prg, tree->tokdata );
-//	newTree->pos = tree->pos;
-
-	tree->refs -= 1;
-
-	/* Copy the child list, will handle attributes, ignores 
-	 * and the children. */
-	Kid *child = tree->child, *last = 0;
-	while ( child != 0 ) {
-		Kid *newChild = prg->kidPool.allocate();
-
-		/* Store the first child. */
-		if ( newTree->child == 0 )
-			newTree->child = newChild;
-
-		/* Watch out for next down. */
-		if ( child == oldNextDown )
-			newNextDown = newChild;
-
-		newChild->tree = child->tree;
-		newChild->next = 0;
-
-		/* May be an attribute. */
-		if ( newChild->tree != 0 )
-			newChild->tree->refs += 1;
-
-		if ( last != 0 )
-			last->next = newChild;
-
-		child = child->next;
-		last = newChild;
-	}
-	
-	return newTree;
-}
-
-List *copy_list( Program *prg, List *list, Kid *oldNextDown, Kid *&newNextDown )
-{
-	if ( list->refs > 1 ) {
-		#ifdef COLM_LOG_BYTECODE
-		cerr << "splitting list: " << list << " refs: " << 
-				list->refs << endl;
-		#endif
-
-		/* Not a need copy. */
-		List *newList = (List*)prg->mapElPool.allocate();
-		newList->id = list->genericInfo->langElId;
-		newList->genericInfo = list->genericInfo;
-
-		list->refs -= 1;
-
-		ListEl *src = list->head;
-		while( src != 0 ) {
-			ListEl *newEl = prg->listElPool.allocate();
-			newEl->value = src->value;
-			tree_upref( newEl->value );
-
-			newList->append( newEl );
-
-			/* Watch out for next down. */
-			if ( (Kid*)src == oldNextDown )
-				newNextDown = (Kid*)newEl;
-
-			src = src->next;
-		}
-
-		list = newList;
-	}
-	return list;
-}
-
-	
-Map *copy_map( Program *prg, Map *map, Kid *oldNextDown, Kid *&newNextDown )
-{
-	if ( map->refs > 1 ) {
-		#ifdef COLM_LOG_BYTECODE
-		cerr << "splitting map: " << map << " refs: " << 
-				map->refs << endl;
-		#endif
-
-		Map *newMap = (Map*)prg->mapElPool.allocate();
-		newMap->id = map->genericInfo->langElId;
-		newMap->genericInfo = map->genericInfo;
-		newMap->treeSize = map->treeSize;
-		newMap->root = 0;
-
-		/* If there is a root, copy the tree. */
-		if ( map->root != 0 ) {
-			newMap->root = newMap->copyBranch( prg, map->root, 
-					oldNextDown, newNextDown );
-		}
-
-		map->refs -= 1;
-
-		for ( MapEl *el = newMap->head; el != 0; el = el->next ) {
-			assert( map->genericInfo->typeArg == TYPE_TREE );
-			tree_upref( el->tree );
-		}
-
-		map = newMap;
-	}
-	return map;
-}
-
-Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
-{
-	LangElInfo *lelInfo = prg->rtd->lelInfo;
-	long genericId = lelInfo[tree->id].genericId;
-	if ( genericId > 0 ) {
-		GenericInfo *generic = &prg->rtd->genericInfo[genericId];
-		if ( generic->type == GEN_LIST )
-			tree = (Tree*) copy_list( prg, (List*) tree, oldNextDown, newNextDown );
-		else if ( generic->type == GEN_MAP )
-			tree = (Tree*) copy_map( prg, (Map*) tree, oldNextDown, newNextDown );
-		else
-			assert(false);
-	}
-	else if ( tree->id == LEL_ID_PTR )
-		assert(false);
-	else if ( tree->id == LEL_ID_BOOL )
-		assert(false);
-	else if ( tree->id == LEL_ID_INT )
-		assert(false);
-	else if ( tree->id == LEL_ID_STR )
-		assert(false);
-	else
-		tree = copy_real_tree( prg, tree, oldNextDown, newNextDown );
-
-	assert( tree->refs == 0 );
-	return tree;
-}
-
-Tree *split_tree( Program *prg, Tree *tree )
-{
-	if ( tree != 0 ) {
-		assert( tree->refs >= 1 );
-
-		if ( tree->refs > 1 ) {
-			#ifdef COLM_LOG_BYTECODE
-			cerr << "splitting tree: " << tree << " refs: " << 
-					tree->refs << endl;
-			#endif
-
-			Kid *oldNextDown = 0, *newNextDown = 0;
-			tree = copy_tree( prg, tree, oldNextDown, newNextDown );
-			tree_upref( tree );
-		}
-
-		assert( tree->refs == 1 );
-	}
-	return tree;
-}
-
-Tree *create_generic( Program *prg, Word genericId )
-{
-	GenericInfo *genericInfo = &prg->rtd->genericInfo[genericId];
-	Tree *newGeneric = 0;
-	switch ( genericInfo->type ) {
-		case GEN_MAP: {
-			Map *map = (Map*)prg->mapElPool.allocate();
-			map->id = genericInfo->langElId;
-			map->genericInfo = genericInfo;
-			newGeneric = (Tree*) map;
-			break;
-		}
-		case GEN_LIST: {
-			List *list = (List*)prg->mapElPool.allocate();
-			list->id = genericInfo->langElId;
-			list->genericInfo = genericInfo;
-			newGeneric = (Tree*) list;
-			break;
-		}
-		default:
-			assert(false);
-			return 0;
-	}
-
-	return newGeneric;
-}
-
-bool map_insert( Program *prg, Map *map, Tree *key, Tree *element )
-{
-	MapEl *mapEl = map->insert( prg, key );
-
-	if ( mapEl != 0 ) {
-		mapEl->tree = element;
-		return true;
-	}
-
-	return false;
-}
-
-void map_unremove( Program *prg, Map *map, Tree *key, Tree *element )
-{
-	MapEl *mapEl = map->insert( prg, key );
-	assert( mapEl != 0 );
-	mapEl->tree = element;
-}
-
-Tree *map_uninsert( Program *prg, Map *map, Tree *key )
-{
-	MapEl *el = map->detach( key );
-	Tree *val = el->tree;
-	prg->mapElPool.free( el );
-	return val;
-}
-
-Tree *map_store( Program *prg, Map *map, Tree *key, Tree *element )
-{
-	Tree *oldTree = 0;
-	MapEl *elInTree = 0;
-	MapEl *mapEl = map->insert( prg, key, &elInTree );
-
-	if ( mapEl != 0 )
-		mapEl->tree = element;
-	else {
-		/* Element with key exists. Overwriting the value. */
-		oldTree = elInTree->tree;
-		elInTree->tree = element;
-	}
-
-	return oldTree;
-}
-
-Tree *map_unstore( Program *prg, Map *map, Tree *key, Tree *existing )
-{
-	Tree *stored = 0;
-	if ( existing == 0 ) {
-		MapEl *mapEl = map->detach( key );
-		stored = mapEl->tree;
-		prg->mapElPool.free( mapEl );
-	}
-	else {
-		MapEl *mapEl = map->find( key );
-		stored = mapEl->tree;
-		mapEl->tree = existing;
-	}
-	return stored;
-}
-
-Tree *map_find( Map *map, Tree *key )
-{
-	MapEl *mapEl = map->find( key );
-	return mapEl == 0 ? 0 : mapEl->tree;
-}
-
-long map_length( Map *map )
-{
-	return map->length();
-}
-
-long list_length( List *list )
-{
-	return list->length();
-}
-
-void list_append( Program *prg, List *list, Tree *val )
-{
-	assert( list->refs == 1 );
-	if ( val != 0 )
-		assert( val->refs >= 1 );
-	ListEl *listEl = prg->listElPool.allocate();
-	listEl->value = val;
-	list->append( listEl );
-}
-
-Tree *list_remove_end( Program *prg, List *list )
-{
-	Tree *tree = list->tail->value;
-	prg->listElPool.free( list->detachLast() );
-	return tree;
-}
-
-Tree *get_list_mem( List *list, Word field )
-{
-	Tree *result = 0;
-	switch ( field ) {
-		case 0: 
-			result = list->head->value;
-			break;
-		case 1: 
-			result = list->tail->value;
-			break;
-		default:
-			assert( false );
-			break;
-	}
-	return result;
-}
-
-Tree *get_list_mem_split( Program *prg, List *list, Word field )
-{
-	Tree *sv = 0;
-	switch ( field ) {
-		case 0: 
-			sv = split_tree( prg, list->head->value );
-			list->head->value = sv; 
-			break;
-		case 1: 
-			sv = split_tree( prg, list->tail->value );
-			list->tail->value = sv; 
-			break;
-		default:
-			assert( false );
-			break;
-	}
-	return sv;
-}
-
-Tree *set_list_mem( List *list, Half field, Tree *value )
-{
-	assert( list->refs == 1 );
-	if ( value != 0 )
-		assert( value->refs >= 1 );
-
-	Tree *existing = 0;
-	switch ( field ) {
-		case 0:
-			existing = list->head->value;
-			list->head->value = value;
-			break;
-		case 1:
-			existing = list->tail->value;
-			list->tail->value = value;
-			break;
-		default:
-			assert( false );
-			break;
-	}
-	return existing;
-}
-
-struct TreePair
-{
-	TreePair() : key(0), val(0) {}
-
-	Tree *key;
-	Tree *val;
-};
-
-TreePair map_remove( Program *prg, Map *map, Tree *key )
-{
-	MapEl *mapEl = map->find( key );
-	TreePair result;
-	if ( mapEl != 0 ) {
-		map->detach( mapEl );
-		result.key = mapEl->key;
-		result.val = mapEl->tree;
-		prg->mapElPool.free( mapEl );
-	}
-
-	return result;
-}
-
-void split_ref( Tree **&sp, Program *prg, Ref *fromRef )
-{
-	/* Go up the chain of kids, turing the pointers down. */
-	Ref *last = 0, *ref = fromRef, *next = 0;
-	while ( ref->next != 0 ) {
-		next = ref->next;
-		ref->next = last;
-		last = ref;
-		ref = next;
-	}
-	ref->next = last;
-
-	/* Now traverse the list, which goes down. */
-	while ( ref != 0 ) {
-		if ( ref->kid->tree->refs > 1 ) {
-			#ifdef COLM_LOG_BYTECODE
-			cerr << "splitting tree: " << ref->kid << " refs: " << 
-					ref->kid->tree->refs << endl;
-			#endif
-
-			Ref *nextDown = ref->next;
-			while ( nextDown != 0 && nextDown->kid == ref->kid )
-				nextDown = nextDown->next;
-
-			Kid *oldNextKidDown = nextDown != 0 ? nextDown->kid : 0;
-			Kid *newNextKidDown = 0;
-
-			Tree *newTree = copy_tree( prg, ref->kid->tree, 
-					oldNextKidDown, newNextKidDown );
-			tree_upref( newTree );
-
-			while ( ref != 0 && ref != nextDown ) {
-				next = ref->next;
-				ref->next = 0;
-
-				ref->kid->tree = newTree;
-				ref = next;
-			}
-
-			/* Correct kid pointers down from ref. */
-			while ( nextDown != 0 && nextDown->kid == oldNextKidDown ) {
-				nextDown->kid = newNextKidDown;
-				nextDown = nextDown->next;
-			}
-		}
-		else {
-			/* Reset the list as we go down. */
-			next = ref->next;
-			ref->next = 0;
-			ref = next;
-		}
-	}
-}
-
-void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter )
-{
-	if ( iter->ref.kid == 0 )
-		return;
-	
-	split_ref( sp, prg, &iter->ref );
-}
-
-void set_ref_value( Ref *ref, Tree *v )
-{
-	Kid *firstKid = ref->kid;
-	while ( ref != 0 && ref->kid == firstKid ) {
-		ref->kid->tree = v;
-		ref = ref->next;
-	}
-}
-
-long cmp_tree( const Tree *tree1, const Tree *tree2 )
-{
-	long cmpres = 0;
-	if ( tree1 == 0 ) {
-		if ( tree2 == 0 )
-			return 0;
-		else
-			return -1;
-	}
-	else if ( tree2 == 0 )
-		return 1;
-	else if ( tree1->id < tree2->id )
-		return -1;
-	else if ( tree1->id > tree2->id )
-		return 1;
-	else if ( tree1->id == LEL_ID_PTR ) {
-		if ( ((Pointer*)tree1)->value < ((Pointer*)tree2)->value )
-			return -1;
-		else if ( ((Pointer*)tree1)->value > ((Pointer*)tree2)->value )
-			return 1;
-	}
-	else if ( tree1->id == LEL_ID_INT ) {
-		if ( ((Int*)tree1)->value < ((Int*)tree2)->value )
-			return -1;
-		else if ( ((Int*)tree1)->value > ((Int*)tree2)->value )
-			return 1;
-	}
-	else if ( tree1->id == LEL_ID_STR ) {
-		cmpres = cmp_string( ((Str*)tree1)->value, ((Str*)tree2)->value );
-		if ( cmpres != 0 )
-			return cmpres;
-	}
-	else {
-		if ( tree1->tokdata == 0 && tree2->tokdata != 0 )
-			return -1;
-		else if ( tree1->tokdata != 0 && tree2->tokdata == 0 )
-			return 1;
-		else if ( tree1->tokdata != 0 && tree2->tokdata != 0 ) {
-			cmpres = cmp_string( tree1->tokdata, tree2->tokdata );
-			if ( cmpres != 0 )
-				return cmpres;
-		}
-	}
-
-	Kid *kid1 = tree1->child;
-	Kid *kid2 = tree2->child;
-
-	while ( true ) {
-		if ( kid1 == 0 && kid2 == 0 )
-			return 0;
-		else if ( kid1 == 0 && kid2 != 0 )
-			return -1;
-		else if ( kid1 != 0 && kid2 == 0 )
-			return 1;
-		else {
-			cmpres = cmp_tree( kid1->tree, kid2->tree );
-			if ( cmpres != 0 )
-				return cmpres;
-		}
-		kid1 = kid1->next;
-		kid2 = kid2->next;
-	}
-}
-
-/* This must traverse in the same order that the bindId assignments are done
- * in. */
-bool match_pattern( Tree **bindings, Program *prg, int pat, Kid *kid, bool checkNext )
-{
-	PatReplNode *nodes = prg->rtd->patReplNodes;
-
-	#ifdef COLM_LOG_MATCH
-	LangElInfo *lelInfo = prg->rtd->lelInfo;
-	cerr << "match_pattern " << ( pat == -1 ? "NULL" : lelInfo[nodes[pat].id].name ) <<
-			" vs " << ( kid == 0 ? "NULL" : lelInfo[kid->tree->id].name ) << endl;
-	#endif
-
-	/* match node, recurse on children. */
-	if ( pat != -1 && kid != 0 ) {
-		if ( nodes[pat].id == kid->tree->id ) {
-			/* If the pattern node has data, then this means we need to match
-			 * the data against the token data. */
-			if ( nodes[pat].data != 0 ) {
-				/* Check the length of token text. */
-				if ( nodes[pat].length != string_length( kid->tree->tokdata ) )
-					return false;
-
-				/* Check the token text data. */
-				if ( nodes[pat].length > 0 && memcmp( nodes[pat].data, 
-						string_data( kid->tree->tokdata ), nodes[pat].length ) != 0 )
-					return false;
-			}
-
-			/* No failure, all okay. */
-			if ( nodes[pat].bindId > 0 ) {
-				#ifdef COLM_LOG_MATCH
-				cerr << "bindId: " << nodes[pat].bindId << endl;
-				#endif
-				bindings[nodes[pat].bindId] = kid->tree;
-			}
-
-			/* If we didn't match a terminal duplicate of a nonterm then check
-			 * down the children. */
-			if ( !nodes[pat].stop ) {
-				/* Check for failure down child branch. */
-				bool childCheck = match_pattern( bindings, prg, 
-						nodes[pat].child, tree_child( prg, kid->tree ), true );
-				if ( ! childCheck )
-					return false;
-			}
-
-			/* If checking next, then look for failure there. */
-			if ( checkNext ) {
-				bool nextCheck = match_pattern( bindings, prg, 
-						nodes[pat].next, kid->next, true );
-				if ( ! nextCheck )
-					return false;
-			}
-
-			return true;
-		}
-	}
-	else if ( pat == -1 && kid == 0 ) {
-		/* Both null is a match. */
-		return 1;
-	}
-
-	return false;
-}
-
-Tree *construct_integer( Program *prg, long i )
-{
-	Int *integer = (Int*) prg->treePool.allocate();
-	integer->id = LEL_ID_INT;
-	integer->value = i;
-
-	return (Tree*)integer;
-}
-
-Tree *construct_string( Program *prg, Head *s )
-{
-	Str *str = (Str*) prg->treePool.allocate();
-	str->id = LEL_ID_STR;
-	str->value = s;
-
-	return (Tree*)str;
-}
-
-Tree *construct_pointer( Program *prg, Tree *tree )
-{
-	Kid *kid = prg->kidPool.allocate();
-	kid->tree = tree;
-	kid->next = prg->heap;
-	prg->heap = kid;
-
-	Pointer *pointer = (Pointer*) prg->treePool.allocate();
-	pointer->id = LEL_ID_PTR;
-	pointer->value = kid;
-	
-	return (Tree*)pointer;
-}
-
-Tree *construct_term( Program *prg, Word id, Head *tokdata )
-{
-	LangElInfo *lelInfo = prg->rtd->lelInfo;
-
-	Tree *tree = prg->treePool.allocate();
-	tree->id = id;
-	tree->refs = 0;
-	tree->tokdata = tokdata;
-
-	int objectLength = lelInfo[tree->id].objectLength;
-	tree->child = alloc_attrs( prg, objectLength );
-
-	return tree;
-}
-
-Kid *construct_replacement_kid( Tree **bindings, Program *prg, Kid *prev, int pat );
-
-Kid *construct_ignore_list( Program *prg, long pat )
-{
-	PatReplNode *nodes = prg->rtd->patReplNodes;
-	long ignore = nodes[pat].ignore;
-
-	Kid *first = 0, *last = 0;
-	while ( ignore >= 0 ) {
-		Head *ignoreData = string_alloc_const( prg, nodes[ignore].data, nodes[ignore].length );
-
-		Tree *ignTree = prg->treePool.allocate();
-		ignTree->refs = 1;
-		ignTree->id = nodes[ignore].id;
-		ignTree->tokdata = ignoreData;
-
-		Kid *ignKid = prg->kidPool.allocate();
-		ignKid->tree = ignTree;
-		ignKid->next = 0;
-
-		if ( last == 0 )
-			first = ignKid;
-		else
-			last->next = ignKid;
-
-		ignore = nodes[ignore].next;
-		last = ignKid;
-	}
-
-	return first;
-}
-
-/* Returns an uprefed tree. Saves us having to downref and bindings to zero to
- * return a zero-ref tree. */
-Tree *construct_replacement_tree( Tree **bindings, Program *prg, int pat )
-{
-	PatReplNode *nodes = prg->rtd->patReplNodes;
-	LangElInfo *lelInfo = prg->rtd->lelInfo;
-	Tree *tree = 0;
-
-	if ( nodes[pat].bindId > 0 ) {
-		/* All bindings have been uprefed. */
-		tree = bindings[nodes[pat].bindId];
-
-		long ignore = nodes[pat].ignore;
-		if ( ignore >= 0 ) {
-			tree = split_tree( prg, tree );
-			tree->child = construct_ignore_list( prg, pat );
-		}
-	}
-	else {
-		tree = prg->treePool.allocate();
-		tree->id = nodes[pat].id;
-		tree->refs = 1;
-		tree->tokdata = nodes[pat].length == 0 ? 0 :
-				string_alloc_const( prg, 
-				nodes[pat].data, nodes[pat].length );
-
-		int objectLength = lelInfo[tree->id].objectLength;
-
-		Kid *attrs = alloc_attrs( prg, objectLength );
-		Kid *ignore = construct_ignore_list( prg, pat );
-		Kid *child = construct_replacement_kid( bindings, prg, 
-				0, nodes[pat].child );
-
-		tree->child = kid_list_concat( attrs, 
-				kid_list_concat( ignore, child ) );
-	}
-
-	return tree;
-}
-
-Kid *construct_replacement_kid( Tree **bindings, Program *prg, Kid *prev, int pat )
-{
-	PatReplNode *nodes = prg->rtd->patReplNodes;
-	Kid *kid = 0;
-
-	if ( pat != -1 ) {
-		kid = prg->kidPool.allocate();
-		kid->tree = construct_replacement_tree( bindings, prg, pat );
-
-		/* Recurse down next. */
-		Kid *next = construct_replacement_kid( bindings, prg, 
-				kid, nodes[pat].next );
-
-		kid->next = next;
-	}
-
-	return kid;
-}
-
-bool test_false( Program *prg, Tree *tree )
-{
-	bool flse = ( 
-		tree == 0 ||
-		tree == prg->falseVal ||
-		tree->id == LEL_ID_INT && ((Int*)tree)->value == 0 );
-	return flse;
-}
-
 /*
  * Execution environment
  */
@@ -1610,7 +276,7 @@ void Program::clearGlobal( Tree **sp )
 	treePool.free( global );
 }
 
-void Program::clear( Tree **sp )
+void Program::clear( Tree **vm_stack, Tree **sp )
 {
 	#ifdef COLM_LOG_BYTECODE
 	cerr << "clearing the prg" << endl;
@@ -1693,7 +359,7 @@ void Program::run()
 	 */
 
 	//vm_stack = new Tree*[VM_STACK_SIZE];
-	vm_stack = (Tree**)mmap( 0, sizeof(Tree*)*VM_STACK_SIZE,
+	Tree **vm_stack = (Tree**)mmap( 0, sizeof(Tree*)*VM_STACK_SIZE,
 		PROT_READ | PROT_WRITE, MAP_ANONYMOUS | MAP_PRIVATE, 0, 0 );
 	Tree **root = &vm_stack[VM_STACK_SIZE];
 
@@ -1719,7 +385,7 @@ void Program::run()
 	}
 
 	/* Clear */
-	clear( root );
+	clear( vm_stack, root );
 }
 
 Execution::Execution( Program *prg, CodeVect &reverseCode,
@@ -2300,7 +966,7 @@ again:
 			Tree *val = pop();
 			Ref *ref = (Ref*) plocal(field);
 			split_ref( sp, prg, ref );
-			set_ref_value( ref, val );
+			ref_set_value( ref, val );
 			break;
 		}
 		case IN_GET_FIELD_R: {
@@ -3525,7 +2191,7 @@ again:
 			Tree *obj = pop();
 			tree_downref( prg, sp, obj );
 
-			Tree *val = get_list_mem( list(obj), field );
+			Tree *val = get_list_mem( (List*)obj, field );
 			tree_upref( val );
 			push( val );
 			break;
@@ -3541,7 +2207,7 @@ again:
 			Tree *obj = pop();
 			tree_downref( prg, sp, obj );
 
-			Tree *val = get_list_mem_split( prg, list(obj), field );
+			Tree *val = get_list_mem_split( prg, (List*)obj, field );
 			tree_upref( val );
 			push( val );
 			break;
@@ -3557,7 +2223,7 @@ again:
 			Tree *obj = pop();
 			tree_downref( prg, sp, obj );
 
-			Tree *val = get_list_mem_split( prg, list(obj), field );
+			Tree *val = get_list_mem_split( prg, (List*)obj, field );
 			tree_upref( val );
 			push( val );
 
@@ -3578,7 +2244,7 @@ again:
 			Tree *obj = pop();
 			tree_downref( prg, sp, obj );
 
-			Tree *res = get_list_mem_split( prg, list(obj), field );
+			Tree *res = get_list_mem_split( prg, (List*)obj, field );
 			tree_upref( res );
 			push( res );
 			break;
@@ -3595,7 +2261,7 @@ again:
 			tree_downref( prg, sp, obj );
 
 			Tree *val = pop();
-			Tree *existing = set_list_mem( list(obj), field, val );
+			Tree *existing = set_list_mem( (List*)obj, field, val );
 			tree_downref( prg, sp, existing );
 			break;
 		}
@@ -3611,7 +2277,7 @@ again:
 			tree_downref( prg, sp, obj );
 
 			Tree *val = pop();
-			Tree *existing = set_list_mem( list(obj), field, val );
+			Tree *existing = set_list_mem( (List*)obj, field, val );
 
 			/* Set up the reverse instruction. */
 			reverseCode.append( IN_SET_LIST_MEM_BKT );
@@ -3635,7 +2301,7 @@ again:
 			Tree *obj = pop();
 			tree_downref( prg, sp, obj );
 
-			Tree *undid = set_list_mem( list(obj), field, val );
+			Tree *undid = set_list_mem( (List*)obj, field, val );
 			tree_downref( prg, sp, undid );
 			break;
 		}
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 2f0ab499..89d0df03 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -37,13 +37,6 @@ using std::ostream;
 typedef unsigned long ulong;
 typedef unsigned char uchar;
 
-#define read_word_p( i, p ) do { \
-	i = ((Word)  p[0]); \
-	i |= ((Word) p[1]) << 8; \
-	i |= ((Word) p[2]) << 16; \
-	i |= ((Word) p[3]) << 24; \
-} while(0)
-
 #define IN_LOAD_INT              0x01
 #define IN_LOAD_STR              0x02
 #define IN_LOAD_NIL              0x03
@@ -291,6 +284,10 @@ typedef unsigned char uchar;
 #define IFR_RIF 1    /* return iframe pointer */
 #define IFR_RFR 0    /* return frame pointer */
 
+#define vm_push(i) (*(--sp) = (i))
+#define vm_pop() (*sp++)
+#define vm_top() (*sp)
+#define vm_ptop() (sp)
 
 struct Kid;
 struct Tree;
@@ -305,6 +302,9 @@ struct Program;
 struct List;
 struct Map;
 struct Stream;
+struct Ref;
+struct TreeIter;
+struct Pointer;
 
 typedef unsigned char Code;
 typedef unsigned long Word;
@@ -387,6 +387,14 @@ struct Head
 	long length;
 };
 
+struct TreePair
+{
+	TreePair() : key(0), val(0) {}
+
+	Tree *key;
+	Tree *val;
+};
+
 struct Program;
 struct Stream;
 
@@ -427,6 +435,55 @@ void print_tree( Tree **&sp, Program *prg, Tree *tree );
 void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
 bool tree_is_ignore( Program *prg, Kid *kid );
 Kid *kid_list_concat( Kid *list1, Kid *list2 );
+Tree *open_file( Program *prg, Tree *name );
+Stream *open_stream_fd( Program *prg, long fd );
+Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
+Tree *create_generic( Program *prg, long genericId );
+void split_ref( Tree **&sp, Program *prg, Ref *fromRef );
+Tree *tree_search( Kid *kid, long id );
+Tree *map_find( Map *map, Tree *key );
+long map_length( Map *map );
+long list_length( List *list );
+void list_append( Program *prg, List *list, Tree *val );
+Tree *list_remove_end( Program *prg, List *list );
+Tree *get_list_mem( List *list, Word field );
+Tree *get_list_mem_split( Program *prg, List *list, Word field );
+Tree *set_list_mem( List *list, Half field, Tree *value );
+Tree *tree_search( Kid *kid, long id );
+Tree *tree_search( Tree *tree, long id );
+bool map_insert( Program *prg, Map *map, Tree *key, Tree *element );
+void map_unremove( Program *prg, Map *map, Tree *key, Tree *element );
+Tree *map_uninsert( Program *prg, Map *map, Tree *key );
+Tree *map_store( Program *prg, Map *map, Tree *key, Tree *element );
+Tree *map_unstore( Program *prg, Map *map, Tree *key, Tree *existing );
+Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter );
+Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter );
+Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter );
+bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool checkNext );
+TreePair map_remove( Program *prg, Map *map, Tree *key );
+
+Tree *construct_integer( Program *prg, long i );
+Tree *construct_string( Program *prg, Head *s );
+Tree *construct_pointer( Program *prg, Tree *tree );
+Tree *construct_term( Program *prg, Word id, Head *tokdata );
+bool test_false( Program *prg, Tree *tree );
+Tree *construct_replacement_tree( Tree **bindings, Program *prg, long pat );
+
+void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter );
+Tree *split_tree( Program *prg, Tree *t );
+Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
+Tree *make_tree( Tree **root, Program *prg, PdaRun *parser, long nargs );
+Tree *make_token( Tree **root, Program *prg, PdaRun *parser, long nargs );
+Tree *tree_iter_deref_cur( TreeIter *iter );
+void ref_set_value( Ref *ref, Tree *v );
+
+Tree *get_ptr_val( Pointer *ptr );
+Tree *get_ptr_val_split( Program *prg, Pointer *ptr );
+Tree *get_field( Tree *tree, Word field );
+Tree *get_field_split( Program *prg, Tree *tree, Word field );
+Tree *get_rhs_el( Program *prg, Tree *lhs, long position );
+void set_field( Program *prg, Tree *tree, long field, Tree *value );
+void set_triter_cur( TreeIter *iter, Tree *tree );
 
 /*
  * Maps
@@ -572,7 +629,7 @@ struct Program
 
 	void run();
 
-	void clear( Tree **sp );
+	void clear( Tree **vm_stack, Tree **sp );
 	void clearGlobal( Tree **sp );
 	void allocGlobal();
 
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 09197f67..828596a9 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -102,9 +102,6 @@ long PdaRun::stackTopTarget()
 	return state;
 }
 
-#define push(i) (*(--sp) = (i))
-#define pop() (*sp++)
-
 bool beenCommitted( Kid *kid )
 {
 	return kid->tree->alg->flags & AF_COMMITTED;
@@ -133,7 +130,7 @@ head:
 
 	/* Recurse only on non-generated trees. */
 	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
-		push( (Tree*)lel );
+		vm_push( (Tree*)lel );
 		lel = tree_child( prg, tree );
 
 		while ( lel != 0 ) {
@@ -144,7 +141,7 @@ head:
 			lel = lel->next;
 		}
 
-		lel = (Kid*)pop();
+		lel = (Kid*)vm_pop();
 	}
 
 	/* Commit */
@@ -191,7 +188,7 @@ head:
 
 	/* Recurse. */
 	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
-		push( (Tree*)lel );
+		vm_push( (Tree*)lel );
 		lel = tree_child( prg, tree );
 
 		while ( lel != 0 ) {
@@ -202,7 +199,7 @@ head:
 			lel = lel->next;
 		}
 
-		lel = (Kid*)pop();
+		lel = (Kid*)vm_pop();
 	}
 
 	/* Commit */
@@ -246,13 +243,13 @@ void PdaRun::commit()
 	Kid *kid = stackTop;
 	long topLevel = 0;
 	while ( kid != 0 && !beenCommitted( kid ) ) {
-		push( (Tree*)kid );
+		vm_push( (Tree*)kid );
 		kid = kid->next;
 		topLevel += 1;
 	}
 
 	while ( topLevel > 0 ) {
-		kid = (Kid*)pop();
+		kid = (Kid*)vm_pop();
 		commitKid( sp, kid );
 		parsed_downref_kid( sp, prg, kid );
 		topLevel -= 1;
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 3f3fc67b..a47c233c 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -24,9 +24,539 @@
 #include "dlistval.h"
 #include "fsmrun.h"
 #include "pdarun.h"
+#include <iostream>
 
-#define push(i) (*(--sp) = (i))
-#define pop() (*sp++)
+using std::cout;
+using std::cerr;
+using std::endl;
+using std::ostream;
+
+Kid *alloc_attrs( Program *prg, long length )
+{
+	/* Grow the chain from the front: each new kid points at the old head. */
+	Kid *head = 0, *fresh = 0;
+	for ( long made = 0; made < length; made++, head = fresh ) {
+		fresh = prg->kidPool.allocate();
+		fresh->next = head;
+	}
+	return head;
+}
+
+/* Return every kid in the attrs chain to the kid pool. */
+void free_attrs( Program *prg, Kid *attrs )
+{
+	for ( Kid *following = 0; attrs != 0; attrs = following ) {
+		/* Save the link first; the node is handed back right after. */
+		following = attrs->next;
+		prg->kidPool.free( attrs );
+	}
+}
+
+void set_attr( Tree *tree, long pos, Tree *val )
+{
+	Kid *cur = tree->child;
+	for ( long i = 0; i < pos; i++ )
+		cur = cur->next;
+	cur->tree = val;
+}
+
+Tree *get_attr( Tree *tree, long pos )
+{
+	Kid *cur = tree->child;
+	for ( long i = 0; i < pos; i++ )
+		cur = cur->next;
+	return cur->tree;
+}
+
+Kid *copy_obj_data( Program *prg, long length, Kid *src )
+{
+	Kid *cur = 0;
+	for ( long i = 0; i < length; i++ ) {
+		Kid *next = cur;
+		cur = prg->kidPool.allocate();
+		cur->next = next;
+	}
+
+	Kid *dest = cur;
+	for ( long i = 0; i < length; i++ ) {
+		dest->tree = src->tree;
+		dest = dest->next;
+		src = src->next;
+	}
+	return cur;
+}
+
+/* Append list2 to the end of list1 in place and return the joined head. */
+Kid *kid_list_concat( Kid *list1, Kid *list2 )
+{
+	/* With either side empty the other side is already the answer. */
+	if ( list1 == 0 || list2 == 0 )
+		return list1 == 0 ? list2 : list1;
+
+	Kid *tail = list1;
+	for ( ; tail->next != 0; tail = tail->next )
+		;
+	tail->next = list2;
+	return list1;
+}
+
+Stream *open_stream_file( Program *prg, FILE *file )
+{
+	Stream *res = (Stream*)prg->mapElPool.allocate();
+	res->id = LEL_ID_STREAM;
+	res->file = file;
+	res->in = new InputStreamFile( file );
+	res->scanner = new FsmRun( prg );
+	res->scanner->attachInputStream( res->in );
+	return res;
+}
+
+Stream *open_stream_fd( Program *prg, long fd )
+{
+	Stream *res = (Stream*)prg->mapElPool.allocate();
+	res->id = LEL_ID_STREAM;
+	res->in = new InputStreamFD( fd );
+	res->scanner = new FsmRun( prg );
+	res->scanner->attachInputStream( res->in );
+	return res;
+}
+
+/* Open the file named by the Str tree for reading; 0 if fopen fails. */
+Tree *open_file( Program *prg, Tree *name )
+{
+	Head *head = ((Str*)name)->value;
+	FILE *file = fopen( string_data(head), "rb" );
+
+	/* open_stream_file already sets the id and file and attaches the input
+	 * and scanner. Return that object as is: replacing it with a bare
+	 * treePool node would drop the only pointer to the stream and hand back
+	 * an object that has no input or scanner. */
+	Tree *res = 0;
+	if ( file != 0 )
+		res = (Tree*) open_stream_file( prg, file );
+	return res;
+}
+
+Tree *construct_integer( Program *prg, long i )
+{
+	Int *integer = (Int*) prg->treePool.allocate();
+	integer->id = LEL_ID_INT;
+	integer->value = i;
+
+	return (Tree*)integer;
+}
+
+Tree *construct_string( Program *prg, Head *s )
+{
+	Str *str = (Str*) prg->treePool.allocate();
+	str->id = LEL_ID_STR;
+	str->value = s;
+
+	return (Tree*)str;
+}
+
+Tree *construct_pointer( Program *prg, Tree *tree )
+{
+	Kid *kid = prg->kidPool.allocate();
+	kid->tree = tree;
+	kid->next = prg->heap;
+	prg->heap = kid;
+
+	Pointer *pointer = (Pointer*) prg->treePool.allocate();
+	pointer->id = LEL_ID_PTR;
+	pointer->value = kid;
+	
+	return (Tree*)pointer;
+}
+
+Tree *construct_term( Program *prg, Word id, Head *tokdata )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+
+	Tree *tree = prg->treePool.allocate();
+	tree->id = id;
+	tree->refs = 0;
+	tree->tokdata = tokdata;
+
+	int objectLength = lelInfo[tree->id].objectLength;
+	tree->child = alloc_attrs( prg, objectLength );
+
+	return tree;
+}
+
+Kid *construct_replacement_kid( Tree **bindings, Program *prg, Kid *prev, long pat );
+
+Kid *construct_ignore_list( Program *prg, long pat )
+{
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+	long ignore = nodes[pat].ignore;
+
+	Kid *first = 0, *last = 0;
+	while ( ignore >= 0 ) {
+		Head *ignoreData = string_alloc_const( prg, nodes[ignore].data, nodes[ignore].length );
+
+		Tree *ignTree = prg->treePool.allocate();
+		ignTree->refs = 1;
+		ignTree->id = nodes[ignore].id;
+		ignTree->tokdata = ignoreData;
+
+		Kid *ignKid = prg->kidPool.allocate();
+		ignKid->tree = ignTree;
+		ignKid->next = 0;
+
+		if ( last == 0 )
+			first = ignKid;
+		else
+			last->next = ignKid;
+
+		ignore = nodes[ignore].next;
+		last = ignKid;
+	}
+
+	return first;
+}
+
+/* Returns an uprefed tree. This saves us from having to downref the bindings
+ * to zero in order to return a zero-ref tree. */
+Tree *construct_replacement_tree( Tree **bindings, Program *prg, long pat )
+{
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	Tree *tree = 0;
+
+	if ( nodes[pat].bindId > 0 ) {
+		/* All bindings have been uprefed. */
+		tree = bindings[nodes[pat].bindId];
+
+		long ignore = nodes[pat].ignore;
+		if ( ignore >= 0 ) {
+			tree = split_tree( prg, tree );
+			tree->child = construct_ignore_list( prg, pat );
+		}
+	}
+	else {
+		tree = prg->treePool.allocate();
+		tree->id = nodes[pat].id;
+		tree->refs = 1;
+		tree->tokdata = nodes[pat].length == 0 ? 0 :
+				string_alloc_const( prg, 
+				nodes[pat].data, nodes[pat].length );
+
+		int objectLength = lelInfo[tree->id].objectLength;
+
+		Kid *attrs = alloc_attrs( prg, objectLength );
+		Kid *ignore = construct_ignore_list( prg, pat );
+		Kid *child = construct_replacement_kid( bindings, prg, 
+				0, nodes[pat].child );
+
+		tree->child = kid_list_concat( attrs, 
+				kid_list_concat( ignore, child ) );
+	}
+
+	return tree;
+}
+
+Kid *construct_replacement_kid( Tree **bindings, Program *prg, Kid *prev, long pat )
+{
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+	Kid *kid = 0;
+
+	if ( pat != -1 ) {
+		kid = prg->kidPool.allocate();
+		kid->tree = construct_replacement_tree( bindings, prg, pat );
+
+		/* Recurse down next. */
+		Kid *next = construct_replacement_kid( bindings, prg, 
+				kid, nodes[pat].next );
+
+		kid->next = next;
+	}
+
+	return kid;
+}
+
+Tree *make_token( Tree **root, Program *prg, PdaRun *parser, long nargs )
+{
+	Tree **const sp = root;
+	Tree **base = vm_ptop() + nargs;
+
+	Int *idInt = (Int*)base[-1];
+	Str *textStr = (Str*)base[-2];
+
+	long id = idInt->value;
+	Head *tokdata = string_copy( prg, textStr->value );
+
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	Tree *tree;
+
+	if ( lelInfo[id].ignore ) {
+		tree = prg->treePool.allocate();
+		tree->refs = 1;
+		tree->id = id;
+		tree->tokdata = tokdata;
+	}
+	else {
+		long objectLength = lelInfo[id].objectLength;
+		Kid *attrs = alloc_attrs( prg, objectLength );
+
+		tree = prg->treePool.allocate();
+		tree->id = id;
+		tree->refs = 1;
+		tree->tokdata = tokdata;
+
+		tree->child = attrs;
+
+		assert( nargs-2 <= objectLength );
+		for ( long id = 0; id < nargs-2; id++ ) {
+			set_attr( tree, id, base[-3-id] );
+			tree_upref( get_attr( tree, id) );
+		}
+	}
+	return tree;
+}
+
+Tree *make_tree( Tree **root, Program *prg, PdaRun *parser, long nargs )
+{
+	Tree **const sp = root;
+	Tree **base = vm_ptop() + nargs;
+
+	Int *idInt = (Int*)base[-1];
+
+	long id = idInt->value;
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+
+	Tree *tree = prg->treePool.allocate();
+	tree->id = id;
+	tree->refs = 1;
+
+	long objectLength = lelInfo[id].objectLength;
+	Kid *attrs = alloc_attrs( prg, objectLength );
+
+	Kid *last = 0, *child = 0;
+	for ( long id = 0; id < nargs-1; id++ ) {
+		Kid *kid = prg->kidPool.allocate();
+		kid->tree = base[-2-id];
+		tree_upref( kid->tree );
+
+		if ( last == 0 )
+			child = kid;
+		else
+			last->next = kid;
+
+		last = kid;
+	}
+
+	tree->child = kid_list_concat( attrs, child );
+
+	return tree;
+}
+
+/* True for a null tree, the program's false value, or an integer zero. */
+bool test_false( Program *prg, Tree *tree )
+{
+	if ( tree == 0 || tree == prg->falseVal )
+		return true;
+	/* Otherwise only an integer holding zero counts as false. */
+	return tree->id == LEL_ID_INT && ((Int*)tree)->value == 0;
+}
+
+void print_str( Head *str )
+{
+	cout.write( (char*)(str->data), str->length );
+}
+
+void print_ignore_list( Tree **&sp, Program *prg, Tree *tree )
+{
+	Kid *ignore = tree_ignore( prg, tree );
+
+	/* Record the root of the stack and push everything. */
+	Tree **root = vm_ptop();
+	while ( tree_is_ignore( prg, ignore ) ) {
+		vm_push( (SW)ignore );
+		ignore = ignore->next;
+	}
+
+	/* Pop them off and print. */
+	while ( vm_ptop() != root ) {
+		ignore = (Kid*) vm_pop();
+		print_tree( sp, prg, ignore->tree );
+	}
+}
+
+void print_kid( ostream &out, Tree **&sp, Program *prg, Kid *kid, bool printIgnore )
+{
+	Tree **root = vm_ptop();
+	Kid *child;
+
+rec_call:
+	/* If not currently skipping ignore data, then print it. Ignore data can
+	 * be associated with terminals and nonterminals. */
+	if ( printIgnore && tree_ignore( prg, kid->tree ) != 0 ) {
+		/* Ignorelists are reversed. */
+		print_ignore_list( sp, prg, kid->tree );
+		printIgnore = false;
+	}
+
+	if ( kid->tree->id < prg->rtd->firstNonTermId ) {
+		/* Always turn on ignore printing when we get to a token. */
+		printIgnore = true;
+
+		if ( kid->tree->id == LEL_ID_INT )
+			out << ((Int*)kid->tree)->value;
+		else if ( kid->tree->id == LEL_ID_BOOL ) {
+			if ( ((Int*)kid->tree)->value )
+				out << "true";
+			else
+				out << "false";
+		}
+		else if ( kid->tree->id == LEL_ID_PTR )
+			out << '#' << (void*) ((Pointer*)kid->tree)->value;
+		else if ( kid->tree->id == LEL_ID_STR )
+			print_str( ((Str*)kid->tree)->value );
+		else if ( kid->tree->id == LEL_ID_STREAM )
+			out << '#' << (void*) ((Stream*)kid->tree)->file;
+		else if ( kid->tree->tokdata != 0 && 
+				string_length( kid->tree->tokdata ) > 0 )
+		{
+			out.write( string_data( kid->tree->tokdata ), 
+					string_length( kid->tree->tokdata ) );
+		}
+	}
+	else {
+		/* Non-terminal. */
+		child = tree_child( prg, kid->tree );
+		if ( child != 0 ) {
+			vm_push( (SW)kid );
+			kid = child;
+			while ( kid != 0 ) {
+				goto rec_call;
+				rec_return:
+				kid = kid->next;
+			}
+			kid = (Kid*)vm_pop();
+		}
+	}
+
+	if ( vm_ptop() != root )
+		goto rec_return;
+}
+
+void print_tree( Tree **&sp, Program *prg, Tree *tree )
+{
+	if ( tree == 0 )
+		cout << "NIL";
+	else {
+		Kid kid;
+		kid.tree = tree;
+		kid.next = 0;
+		print_kid( cout, sp, prg, &kid, false );
+	}
+}
+
+/* Print tree to out; a null tree is written to out as "NIL". */
+void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree )
+{
+	Kid kid;	/* print_kid works on kids: wrap the tree in one. */
+	kid.tree = tree;
+	kid.next = 0;
+	if ( tree == 0 )
+		out << "NIL";
+	else
+		print_kid( out, sp, prg, &kid, false );
+}
+
+/* Write data to cout, replacing bytes outside 32..126 with &#N; references. */
+void xml_escape_data( const char *data, long len )
+{
+	for ( long i = 0; i < len; i++ )
+		if ( 32 <= data[i] && data[i] <= 126 )
+			cout << data[i];
+		else	/* Via unsigned char: no sign extension for bytes >= 0x80. */
+			cout << "&#" << (unsigned)(unsigned char)data[i] << ';';
+}
+
+void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth )
+{
+	Tree **root = vm_ptop();
+	int i = 0;
+
+rec_call:
+	for ( i = 0; i < depth; i++ )
+		cout << "  ";
+
+	if ( kid->tree == 0 )
+		cout << "NIL" << endl;
+	else {
+		cout << '<' << prg->rtd->lelInfo[kid->tree->id].name;
+		if ( kid->tree->child != 0 ) {
+			cout << '>' << endl;
+			vm_push( (SW) kid );
+			kid = kid->tree->child;
+			while ( kid != 0 ) {
+				depth++;
+				goto rec_call;
+				rec_return:
+				depth--;
+				kid = kid->next;
+
+				/* If the parent kid is a repeat then skip this node and go
+				 * right to the first child (repeated item). */
+				if ( prg->rtd->lelInfo[((Kid*)vm_top())->tree->id].repeat )
+					kid = kid->tree->child;
+			}
+			kid = (Kid*) vm_pop();
+
+			for ( i = 0; i < depth; i++ )
+				cout << "  ";
+			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_PTR ) {
+			cout << '>' << (void*)((Pointer*)kid->tree)->value << 
+					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_BOOL ) {
+			if ( ((Int*)kid->tree)->value )
+				cout << ">true</";
+			else
+				cout << ">false</";
+			cout << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_INT ) {
+			cout << '>' << ((Int*)kid->tree)->value << 
+					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( kid->tree->id == LEL_ID_STR ) {
+			Head *head = (Head*) ((Str*)kid->tree)->value;
+
+			cout << '>';
+			xml_escape_data( (char*)(head->data), head->length );
+			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else if ( 0 < kid->tree->id && kid->tree->id < prg->rtd->firstNonTermId &&
+				kid->tree->tokdata != 0 && 
+				string_length( kid->tree->tokdata ) > 0 && 
+				!prg->rtd->lelInfo[kid->tree->id].literal )
+		{
+			cout << '>';
+			xml_escape_data( string_data( kid->tree->tokdata ), 
+					string_length( kid->tree->tokdata ) );
+			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+		}
+		else
+			cout << "/>" << endl;
+	}
+
+	if ( vm_ptop() != root )
+		goto rec_return;
+}
+
+void xml_print_tree( Tree **&sp, Program *prg, Tree *tree )
+{
+	Kid kid;
+	kid.tree = tree;
+	kid.next = 0;
+	xml_print_kid( sp, prg, &kid, 0 );
+}
 
 void stream_free( Program *prg, Stream *s )
 {
@@ -37,6 +567,195 @@ void stream_free( Program *prg, Stream *s )
 	prg->mapElPool.free( (MapEl*)s );
 }
 
+Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
+{
+	assert( tree->refs >= 2 );
+
+	/* While copying, watch for the kid oldNextDown: when it is duplicated
+	 * the duplicate is handed back through newNextDown. */
+	Tree *newTree = prg->treePool.allocate();
+
+	newTree->id = tree->id;
+	newTree->tokdata = string_copy( prg, tree->tokdata );
+
+	tree->refs -= 1;
+
+	/* Copy the whole child list: this covers the attributes, the ignores
+	 * and the children. The child trees are shared, not duplicated. */
+	Kid *child = tree->child, *last = 0;
+	while ( child != 0 ) {
+		Kid *newChild = prg->kidPool.allocate();
+
+		/* The first new kid becomes the head of the new child list. */
+		if ( newTree->child == 0 )
+			newTree->child = newChild;
+
+		/* Report the copy of the kid the caller is tracking. */
+		if ( child == oldNextDown )
+			newNextDown = newChild;
+
+		newChild->tree = child->tree;
+		newChild->next = 0;
+
+		/* Slot can be null (may be an attribute); only count real trees. */
+		if ( newChild->tree != 0 )
+			newChild->tree->refs += 1;
+
+		if ( last != 0 )
+			last->next = newChild;
+
+		child = child->next;
+		last = newChild;
+	}
+	
+	return newTree;
+}
+
+List *copy_list( Program *prg, List *list, Kid *oldNextDown, Kid *&newNextDown )
+{
+	if ( list->refs > 1 ) {
+		#ifdef COLM_LOG_BYTECODE
+		cerr << "splitting list: " << list << " refs: " << 
+				list->refs << endl;
+		#endif
+
+		/* Shared list: build a new one whose elements reuse the values. */
+		List *newList = (List*)prg->mapElPool.allocate();
+		newList->id = list->genericInfo->langElId;
+		newList->genericInfo = list->genericInfo;
+
+		list->refs -= 1;
+
+		ListEl *src = list->head;
+		while( src != 0 ) {
+			ListEl *newEl = prg->listElPool.allocate();
+			newEl->value = src->value;
+			tree_upref( newEl->value );
+
+			newList->append( newEl );
+
+			/* If the caller is tracking this element, report its copy. */
+			if ( (Kid*)src == oldNextDown )
+				newNextDown = (Kid*)newEl;
+
+			src = src->next;
+		}
+
+		list = newList;
+	}
+	return list;
+}
+
+	
+Map *copy_map( Program *prg, Map *map, Kid *oldNextDown, Kid *&newNextDown )
+{
+	if ( map->refs > 1 ) {
+		#ifdef COLM_LOG_BYTECODE
+		cerr << "splitting map: " << map << " refs: " << 
+				map->refs << endl;
+		#endif
+
+		Map *newMap = (Map*)prg->mapElPool.allocate();
+		newMap->id = map->genericInfo->langElId;
+		newMap->genericInfo = map->genericInfo;
+		newMap->treeSize = map->treeSize;
+		newMap->root = 0;
+
+		/* If there is a root, copy the tree. */
+		if ( map->root != 0 ) {
+			newMap->root = newMap->copyBranch( prg, map->root, 
+					oldNextDown, newNextDown );
+		}
+
+		map->refs -= 1;
+
+		for ( MapEl *el = newMap->head; el != 0; el = el->next ) {
+			assert( map->genericInfo->typeArg == TYPE_TREE );
+			tree_upref( el->tree );
+		}
+
+		map = newMap;
+	}
+	return map;
+}
+
+Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
+{
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	long genericId = lelInfo[tree->id].genericId;
+	if ( genericId > 0 ) {
+		GenericInfo *generic = &prg->rtd->genericInfo[genericId];
+		if ( generic->type == GEN_LIST )
+			tree = (Tree*) copy_list( prg, (List*) tree, oldNextDown, newNextDown );
+		else if ( generic->type == GEN_MAP )
+			tree = (Tree*) copy_map( prg, (Map*) tree, oldNextDown, newNextDown );
+		else
+			assert(false);
+	}
+	else if ( tree->id == LEL_ID_PTR )
+		assert(false);
+	else if ( tree->id == LEL_ID_BOOL )
+		assert(false);
+	else if ( tree->id == LEL_ID_INT )
+		assert(false);
+	else if ( tree->id == LEL_ID_STR )
+		assert(false);
+	else
+		tree = copy_real_tree( prg, tree, oldNextDown, newNextDown );
+
+	assert( tree->refs == 0 );
+	return tree;
+}
+
+Tree *split_tree( Program *prg, Tree *tree )
+{
+	if ( tree != 0 ) {
+		assert( tree->refs >= 1 );
+
+		if ( tree->refs > 1 ) {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "splitting tree: " << tree << " refs: " << 
+					tree->refs << endl;
+			#endif
+
+			Kid *oldNextDown = 0, *newNextDown = 0;
+			tree = copy_tree( prg, tree, oldNextDown, newNextDown );
+			tree_upref( tree );
+		}
+
+		assert( tree->refs == 1 );
+	}
+	return tree;
+}
+
+Tree *create_generic( Program *prg, long genericId )
+{
+	GenericInfo *genericInfo = &prg->rtd->genericInfo[genericId];
+	Tree *newGeneric = 0;
+	switch ( genericInfo->type ) {
+		case GEN_MAP: {
+			Map *map = (Map*)prg->mapElPool.allocate();
+			map->id = genericInfo->langElId;
+			map->genericInfo = genericInfo;
+			newGeneric = (Tree*) map;
+			break;
+		}
+		case GEN_LIST: {
+			List *list = (List*)prg->mapElPool.allocate();
+			list->id = genericInfo->langElId;
+			list->genericInfo = genericInfo;
+			newGeneric = (Tree*) list;
+			break;
+		}
+		default:
+			assert(false);
+			return 0;
+	}
+
+	return newGeneric;
+}
+
+
 /* We can't make recursive calls here since the tree we are freeing may be
  * very large. Need the VM stack. */
 void tree_free( Program *prg, Tree **sp, Tree *tree )
@@ -53,7 +772,7 @@ free_tree:
 			ListEl *el = list->head;
 			while ( el != 0 ) {
 				ListEl *next = el->next;
-				push( el->value );
+				vm_push( el->value );
 				prg->listElPool.free( el );
 				el = next;
 			}
@@ -64,8 +783,8 @@ free_tree:
 			MapEl *el = map->head;
 			while ( el != 0 ) {
 				MapEl *next = el->next;
-				push( el->key );
-				push( el->tree );
+				vm_push( el->key );
+				vm_push( el->tree );
 				prg->mapElPool.free( el );
 				el = next;
 			}
@@ -84,7 +803,7 @@ free_tree:
 			prg->treePool.free( tree );
 		else if ( tree->id == LEL_ID_PTR ) {
 			//Pointer *ptr = (Pointer*)tree;
-			//push( ptr->value->tree );
+			//vm_push( ptr->value->tree );
 			//prg->kidPool.free( ptr->value );
 			prg->treePool.free( tree );
 		}
@@ -93,7 +812,7 @@ free_tree:
 		else { 
 			if ( tree->alg != 0 ) {
 				//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
-				push( tree->alg->parsed );
+				vm_push( tree->alg->parsed );
 				prg->algPool.free( tree->alg );
 			}
 			string_free( prg, tree->tokdata );
@@ -101,7 +820,7 @@ free_tree:
 			Kid *child = tree->child;
 			while ( child != 0 ) {
 				Kid *next = child->next;
-				push( child->tree );
+				vm_push( child->tree );
 				prg->kidPool.free( child );
 				child = next;
 			}
@@ -112,7 +831,7 @@ free_tree:
 
 	/* Any trees to downref? */
 	while ( sp != top ) {
-		tree = pop();
+		tree = vm_pop();
 		if ( tree != 0 ) {
 			assert( tree->refs > 0 );
 			tree->refs -= 1;
@@ -205,3 +924,583 @@ bool tree_is_ignore( Program *prg, Kid *kid )
 	return kid != 0 && lelInfo[kid->tree->id].ignore;
 }
 
+/* Fetch the tree the iterator currently refers to, or 0 when the iterator
+ * has no current kid. */
+Tree *tree_iter_deref_cur( TreeIter *iter )
+{
+	Kid *cur = iter->ref.kid;
+	if ( cur == 0 )
+		return 0;
+	return cur->tree;
+}
+
+/* Store v as the tree of the kid that ref points at. The store is repeated
+ * for each consecutive ref along the next chain that points at that same
+ * kid; the walk stops at the first ref with a different kid or at the end
+ * of the chain. */
+void ref_set_value( Ref *ref, Tree *v )
+{
+	Kid *const target = ref->kid;
+	for ( Ref *cur = ref; cur != 0 && cur->kid == target; cur = cur->next )
+		target->tree = v;
+}
+
+/* Return the tree at the given zero-based position in the child list of lhs,
+ * as produced by tree_child(). If the list has no kid at that position the
+ * result is 0 instead of a walk past the end of the list. */
+Tree *get_rhs_el( Program *prg, Tree *lhs, long position )
+{
+	Kid *pos = tree_child( prg, lhs );
+	while ( pos != 0 && position > 0 ) {
+		pos = pos->next;
+		position -= 1;
+	}
+	return pos != 0 ? pos->tree : 0;
+}
+
+/* Store value in attribute slot `field` of tree by way of set_attr(). The
+ * tree is asserted to be singly referenced and a non-nil value is asserted
+ * to hold at least one reference. */
+void set_field( Program *prg, Tree *tree, long field, Tree *value )
+{
+	assert( tree->refs == 1 );
+	assert( value == 0 || value->refs >= 1 );
+	set_attr( tree, field, value );
+}
+
+/* Read the attribute of tree selected by field, via get_attr(). */
+Tree *get_field( Tree *tree, Word field )
+{
+	Tree *attr = get_attr( tree, field );
+	return attr;
+}
+
+/* Read attribute `field` of tree, run it through split_tree(), write the
+ * result back into the same attribute and return it. */
+Tree *get_field_split( Program *prg, Tree *tree, Word field )
+{
+	Tree *owned = split_tree( prg, get_attr( tree, field ) );
+	set_attr( tree, field, owned );
+	return owned;
+}
+
+/* Replace the tree held by the iterator's current kid. The current kid is
+ * dereferenced without a check. */
+void set_triter_cur( TreeIter *iter, Tree *tree )
+{
+	Kid *cur = iter->ref.kid;
+	cur->tree = tree;
+}
+
+/* Return the tree found behind the pointer's value. */
+Tree *get_ptr_val( Pointer *ptr )
+{
+	Tree *pointee = ptr->value->tree;
+	return pointee;
+}
+
+/* Run the tree behind the pointer's value through split_tree(), store the
+ * result back behind the pointer and return it. */
+Tree *get_ptr_val_split( Program *prg, Pointer *ptr )
+{
+	Tree *owned = split_tree( prg, ptr->value->tree );
+	ptr->value->tree = owned;
+	return owned;
+}
+
+/* Search depth-first from the iterator's current position for the next tree
+ * whose id equals iter->searchId; every tree qualifies when searchId equals
+ * prg->rtd->anyId. On return iter->ref.kid is the kid that matched, or 0 if
+ * the search ran out.
+ *
+ * Recursion is simulated with gotos (rec_call / rec_return). Descending into
+ * a child list pushes the current ref (next, then kid) on the VM stack and
+ * points iter->ref.next at the pushed pair; the pair is popped again once
+ * the child list is exhausted.
+ *
+ * tryFirst: when true the current kid itself is tested before descending;
+ * when false the search goes straight to its children. */
+void iter_find( Program *prg, Tree **&sp, TreeIter *iter, bool tryFirst )
+{
+	bool anyTree = iter->searchId == prg->rtd->anyId;
+	Tree **top = iter->stackRoot;
+	Kid *child;
+
+rec_call:
+	/* Entry point of one simulated call. */
+	if ( tryFirst && ( iter->ref.kid->tree->id == iter->searchId || anyTree ) )
+		return;
+	else {
+		child = tree_child( prg, iter->ref.kid->tree );
+		if ( child != 0 ) {
+			/* Save the current ref on the stack and step down. */
+			vm_push( (SW) iter->ref.next );
+			vm_push( (SW) iter->ref.kid );
+			iter->ref.kid = child;
+			iter->ref.next = (Ref*)vm_ptop();
+			while ( iter->ref.kid != 0 ) {
+				tryFirst = true;
+				goto rec_call;
+				/* A simulated call that found nothing resumes here and
+				 * moves on to the next sibling. */
+				rec_return:
+				iter->ref.kid = iter->ref.kid->next;
+			}
+			/* Child list exhausted, restore the saved ref. */
+			iter->ref.kid = (Kid*)vm_pop();
+			iter->ref.next = (Ref*)vm_pop();
+		}
+	}
+
+	/* Saved refs still on the stack mean we are inside a simulated call:
+	 * return into the sibling loop of the level above. */
+	if ( top != vm_ptop() )
+		goto rec_return;
+	
+	/* Stack is back at the iterator's root: nothing more to find. */
+	iter->ref.kid = 0;
+}
+
+/* Move the iterator to its next match using iter_find() and report whether
+ * there is one: prg->trueVal when the iterator ends up with a current kid,
+ * prg->falseVal otherwise. The VM stack depth used by the iterator is
+ * checked on entry and recorded again on exit. */
+Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter )
+{
+	assert( iter->stackSize == iter->stackRoot - vm_ptop() );
+
+	/* With no current kid the search starts at the root, which is itself a
+	 * candidate. Otherwise it continues past the previous item. */
+	bool fromRoot = iter->ref.kid == 0;
+	if ( fromRoot )
+		iter->ref = iter->rootRef;
+	iter_find( prg, sp, iter, fromRoot );
+
+	iter->stackSize = iter->stackRoot - vm_ptop();
+
+	if ( iter->ref.kid != 0 )
+		return prg->trueVal;
+	return prg->falseVal;
+}
+
+/* Step the iterator to the next child of the root tree whose id equals
+ * iter->searchId; any child qualifies when searchId equals prg->rtd->anyId.
+ * With no current kid, a reference to the root (rootRef.next, rootRef.kid) is
+ * pushed on the VM stack and the walk starts at the root tree's first child,
+ * unless the root has no children. With a current kid, the walk continues at
+ * its next sibling. The stack depth is recorded in iter->stackSize before
+ * returning prg->trueVal (a kid was found) or prg->falseVal. */
+Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter )
+{
+	assert( iter->stackSize == iter->stackRoot - vm_ptop() );
+
+	if ( iter->ref.kid == 0 ) {
+		/* Kid is zero, start from the first child. */
+		if ( iter->rootRef.kid->tree->child == 0 ) {
+			iter->ref.kid = 0;
+			iter->ref.next = 0;
+		}
+		else {
+			vm_push( (SW) iter->rootRef.next );
+			vm_push( (SW) iter->rootRef.kid );
+			iter->ref.kid = iter->rootRef.kid->tree->child;
+			iter->ref.next = (Ref*)vm_ptop();
+		}
+	}
+	else {
+		iter->ref.kid = iter->ref.kid->next;
+	}
+
+	bool anyTree = iter->searchId == prg->rtd->anyId;
+	if ( ! anyTree ) {
+		/* Have a previous item, go to the next sibling. */
+		while ( iter->ref.kid != 0 && iter->ref.kid->tree->id != iter->searchId ) {
+			iter->ref.kid = iter->ref.kid->next;
+		}
+	}
+
+	iter->stackSize = iter->stackRoot - vm_ptop();
+
+	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
+}
+
+/* Step the iterator backward through the children of the root tree. With no
+ * current kid, a reference to the root (rootRef.next, rootRef.kid) is pushed
+ * on the VM stack and the iterator is placed on the last child, unless the
+ * root has no children. With a current kid, the child list of the kid on top
+ * of the VM stack is scanned from its head to find the kid just before the
+ * current one. The stack depth is recorded in iter->stackSize before
+ * returning prg->trueVal (a kid was found) or prg->falseVal.
+ *
+ * NOTE(review): when searchId is not anyId, the filtering loop near the end
+ * skips non-matching kids by following ->next, i.e. forward, although this
+ * iterator otherwise moves backward -- confirm this is intended. */
+Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter )
+{
+	assert( iter->stackSize == iter->stackRoot - vm_ptop() );
+
+	if ( iter->ref.kid == 0 ) {
+		/* Kid is zero, start from the first child. */
+		if ( iter->rootRef.kid->tree->child == 0 ) {
+			iter->ref.kid = 0;
+			iter->ref.next = 0;
+		}
+		else {
+			vm_push( (SW) iter->rootRef.next );
+			vm_push( (SW) iter->rootRef.kid );
+
+			Kid *last = iter->rootRef.kid->tree->child;
+			while ( last->next != 0 )
+				last = last->next;
+
+			iter->ref.kid = last;
+			iter->ref.next = (Ref*)vm_ptop();
+		}
+	}
+	else {
+		/* Have a previous item, go to the prev sibling. */
+		Kid *wasAt = iter->ref.kid;
+		Kid *parent = (Kid*) vm_top();
+		Kid *cur = 0, *next = parent->tree->child;
+
+		while ( next != wasAt ) {
+			cur = next;
+			next = next->next;
+		}
+
+		iter->ref.kid = cur;
+	}
+
+	bool anyTree = iter->searchId == prg->rtd->anyId;
+	if ( ! anyTree ) {
+		/* Have a previous item, go to the next sibling. */
+		while ( iter->ref.kid != 0 && iter->ref.kid->tree->id != iter->searchId ) {
+			iter->ref.kid = iter->ref.kid->next;
+		}
+	}
+
+	iter->stackSize = iter->stackRoot - vm_ptop();
+
+	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
+}
+
+/* Pre-order search of a kid list for the first tree with the given id. For
+ * each kid its own tree is tested first, then the trees below it, then the
+ * following siblings. Returns the matching tree, or 0 when nothing matches.
+ *
+ * Siblings are walked with a loop and only the descent into children
+ * recurses, so stack depth follows the nesting depth of the tree rather than
+ * the length of a sibling list. */
+Tree *tree_search( Kid *kid, long id )
+{
+	for ( ; kid != 0; kid = kid->next ) {
+		if ( kid->tree->id == id )
+			return kid->tree;
+
+		if ( kid->tree->child != 0 ) {
+			Tree *res = tree_search( kid->tree->child, id );
+			if ( res != 0 )
+				return res;
+		}
+	}
+
+	return 0;
+}
+
+/* Search tree and everything below it for the first tree with the given id.
+ * The tree itself is tested first; otherwise the search continues in its
+ * child list. Returns 0 when nothing matches. */
+Tree *tree_search( Tree *tree, long id )
+{
+	if ( tree->id == id )
+		return tree;
+
+	if ( tree->child == 0 )
+		return 0;
+
+	return tree_search( tree->child, id );
+}
+
+/* Insert key into map and attach element as its value. Returns true when
+ * map->insert() hands back an element. Returns false, leaving the map's
+ * values alone, when it hands back 0 (presumably because the key is already
+ * present -- see Map::insert). */
+bool map_insert( Program *prg, Map *map, Tree *key, Tree *element )
+{
+	MapEl *inserted = map->insert( prg, key );
+	if ( inserted == 0 )
+		return false;
+
+	inserted->tree = element;
+	return true;
+}
+
+/* Put key back into map with element as its value. The insertion is
+ * asserted to succeed. */
+void map_unremove( Program *prg, Map *map, Tree *key, Tree *element )
+{
+	MapEl *restored = map->insert( prg, key );
+	assert( restored != 0 );
+	restored->tree = element;
+}
+
+/* Detach the element stored under key, return its value and give the
+ * element back to mapElPool. The key is asserted to be present, in the same
+ * way map_unremove() asserts its insertion. */
+Tree *map_uninsert( Program *prg, Map *map, Tree *key )
+{
+	MapEl *el = map->detach( key );
+	/* Guard the dereference below against a key that is not in the map. */
+	assert( el != 0 );
+	Tree *val = el->tree;
+	prg->mapElPool.free( el );
+	return val;
+}
+
+/* Store element under key, overwriting any value already there. Returns the
+ * value that was displaced, or 0 when a new element was inserted. */
+Tree *map_store( Program *prg, Map *map, Tree *key, Tree *element )
+{
+	MapEl *existingEl = 0;
+	MapEl *newEl = map->insert( prg, key, &existingEl );
+
+	if ( newEl != 0 ) {
+		/* Fresh element, nothing was displaced. */
+		newEl->tree = element;
+		return 0;
+	}
+
+	/* Element with key exists. Overwriting the value. */
+	Tree *displaced = existingEl->tree;
+	existingEl->tree = element;
+	return displaced;
+}
+
+/* Take back a value stored under key (this looks like the inverse of
+ * map_store() -- confirm against the callers). When existing is 0 the
+ * element is detached and returned to mapElPool; otherwise the element is
+ * kept and existing is put back as its value. Either way the value that was
+ * stored under key is returned. The key is asserted to be present. */
+Tree *map_unstore( Program *prg, Map *map, Tree *key, Tree *existing )
+{
+	Tree *stored = 0;
+	if ( existing == 0 ) {
+		MapEl *mapEl = map->detach( key );
+		/* Guard the dereference below against a missing key. */
+		assert( mapEl != 0 );
+		stored = mapEl->tree;
+		prg->mapElPool.free( mapEl );
+	}
+	else {
+		MapEl *mapEl = map->find( key );
+		/* find() yields 0 for a missing key, see map_find(). */
+		assert( mapEl != 0 );
+		stored = mapEl->tree;
+		mapEl->tree = existing;
+	}
+	return stored;
+}
+
+/* Look key up in map. Returns the value of the element found, or 0 when
+ * map->find() finds nothing. */
+Tree *map_find( Map *map, Tree *key )
+{
+	MapEl *found = map->find( key );
+	if ( found != 0 )
+		return found->tree;
+	return 0;
+}
+
+/* Report map->length(). */
+long map_length( Map *map )
+{
+	long count = map->length();
+	return count;
+}
+
+/* Report list->length(). */
+long list_length( List *list )
+{
+	long count = list->length();
+	return count;
+}
+
+/* Append val to list in a new element taken from listElPool. The list is
+ * asserted to be singly referenced and a non-nil val is asserted to hold at
+ * least one reference. */
+void list_append( Program *prg, List *list, Tree *val )
+{
+	assert( list->refs == 1 );
+	assert( val == 0 || val->refs >= 1 );
+
+	ListEl *newEl = prg->listElPool.allocate();
+	newEl->value = val;
+	list->append( newEl );
+}
+
+/* Detach the last element of list, give it back to listElPool and return
+ * the value it held. The tail is dereferenced without a check. */
+Tree *list_remove_end( Program *prg, List *list )
+{
+	/* Read the value first, the element is freed right after. */
+	Tree *removed = list->tail->value;
+	prg->listElPool.free( list->detachLast() );
+	return removed;
+}
+
+/* Read a list member: field 0 is the value at the head, field 1 the value
+ * at the tail. Any other field trips an assertion and yields 0. */
+Tree *get_list_mem( List *list, Word field )
+{
+	if ( field == 0 )
+		return list->head->value;
+
+	if ( field == 1 )
+		return list->tail->value;
+
+	assert( false );
+	return 0;
+}
+
+/* Like get_list_mem(), but the selected value (field 0: head, field 1: tail)
+ * is run through split_tree() and the result is written back into the list
+ * before it is returned. Any other field trips an assertion and yields 0. */
+Tree *get_list_mem_split( Program *prg, List *list, Word field )
+{
+	/* Pick the element the field stands for. */
+	ListEl *el = 0;
+	if ( field == 0 )
+		el = list->head;
+	else if ( field == 1 )
+		el = list->tail;
+	else {
+		assert( false );
+		return 0;
+	}
+
+	Tree *sv = split_tree( prg, el->value );
+	el->value = sv;
+	return sv;
+}
+
+/* Overwrite a list member (field 0: value at the head, field 1: value at the
+ * tail) and return the value that was there before. The list is asserted to
+ * be singly referenced and a non-nil value is asserted to hold at least one
+ * reference. Any other field trips an assertion and yields 0. */
+Tree *set_list_mem( List *list, Half field, Tree *value )
+{
+	assert( list->refs == 1 );
+	assert( value == 0 || value->refs >= 1 );
+
+	/* Pick the element the field stands for. */
+	ListEl *el = 0;
+	if ( field == 0 )
+		el = list->head;
+	else if ( field == 1 )
+		el = list->tail;
+	else {
+		assert( false );
+		return 0;
+	}
+
+	Tree *previous = el->value;
+	el->value = value;
+	return previous;
+}
+
+/* Remove the element stored under key. Returns the key/value pair held by
+ * the removed element; the element itself goes back to mapElPool. When the
+ * key is not in the map, nothing is removed and both members of the result
+ * are 0. */
+TreePair map_remove( Program *prg, Map *map, Tree *key )
+{
+	/* Start from a nil pair so the not-found result is always defined. */
+	TreePair result;
+	result.key = 0;
+	result.val = 0;
+
+	MapEl *mapEl = map->find( key );
+	if ( mapEl != 0 ) {
+		map->detach( mapEl );
+		result.key = mapEl->key;
+		result.val = mapEl->tree;
+		prg->mapElPool.free( mapEl );
+	}
+
+	return result;
+}
+
+/* Walk the chain of refs that starts at fromRef and give a private copy to
+ * every tree on it that has more than one reference.
+ *
+ * The chain is first reversed in place by following the next pointers to
+ * the far end, then it is traversed in the opposite direction. For a tree
+ * with refs > 1, copy_tree() makes a copy, the copy is upref'd, and it is
+ * assigned to kid->tree for the run of refs that share that kid. The kid
+ * that the following refs point at is handed to copy_tree() as
+ * oldNextKidDown; those refs are then re-pointed at newNextKidDown, which
+ * copy_tree() receives by reference. Each ref's next pointer is set to 0 as
+ * the traversal passes it. */
+void split_ref( Tree **&sp, Program *prg, Ref *fromRef )
+{
+	/* Go up the chain of kids, turning the pointers down. */
+	Ref *last = 0, *ref = fromRef, *next = 0;
+	while ( ref->next != 0 ) {
+		next = ref->next;
+		ref->next = last;
+		last = ref;
+		ref = next;
+	}
+	ref->next = last;
+
+	/* Now traverse the list, which goes down. */
+	while ( ref != 0 ) {
+		if ( ref->kid->tree->refs > 1 ) {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "splitting tree: " << ref->kid << " refs: " << 
+					ref->kid->tree->refs << endl;
+			#endif
+
+			/* Find the first ref further down that uses a different kid. */
+			Ref *nextDown = ref->next;
+			while ( nextDown != 0 && nextDown->kid == ref->kid )
+				nextDown = nextDown->next;
+
+			Kid *oldNextKidDown = nextDown != 0 ? nextDown->kid : 0;
+			Kid *newNextKidDown = 0;
+
+			Tree *newTree = copy_tree( prg, ref->kid->tree, 
+					oldNextKidDown, newNextKidDown );
+			tree_upref( newTree );
+
+			/* Install the copy for every ref up to nextDown, clearing the
+			 * next pointers on the way. */
+			while ( ref != 0 && ref != nextDown ) {
+				next = ref->next;
+				ref->next = 0;
+
+				ref->kid->tree = newTree;
+				ref = next;
+			}
+
+			/* Correct kid pointers down from ref. */
+			while ( nextDown != 0 && nextDown->kid == oldNextKidDown ) {
+				nextDown->kid = newNextKidDown;
+				nextDown = nextDown->next;
+			}
+		}
+		else {
+			/* Reset the list as we go down. */
+			next = ref->next;
+			ref->next = 0;
+			ref = next;
+		}
+	}
+}
+
+/* Run split_ref() on the iterator's current ref. Does nothing when the
+ * iterator has no current kid. */
+void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter )
+{
+	if ( iter->ref.kid != 0 )
+		split_ref( sp, prg, &iter->ref );
+}
+
+/* Three-way comparison of two trees. The result is negative, zero or
+ * positive. Order of comparison:
+ *  1. nil comes before any non-nil tree, two nils are equal;
+ *  2. the ids;
+ *  3. the payload: the value for LEL_ID_PTR and LEL_ID_INT, cmp_string() on
+ *     the value for LEL_ID_STR, and for every other id the token data, where
+ *     absent token data comes before present token data;
+ *  4. the child lists, pairwise and recursively, where the shorter list
+ *     comes first if one is a prefix of the other. */
+long cmp_tree( const Tree *tree1, const Tree *tree2 )
+{
+	/* Nil handling. */
+	if ( tree1 == 0 || tree2 == 0 ) {
+		if ( tree1 == 0 && tree2 == 0 )
+			return 0;
+		return tree1 == 0 ? -1 : 1;
+	}
+
+	if ( tree1->id != tree2->id )
+		return tree1->id < tree2->id ? -1 : 1;
+
+	long cmpres = 0;
+	if ( tree1->id == LEL_ID_PTR ) {
+		if ( ((Pointer*)tree1)->value != ((Pointer*)tree2)->value )
+			return ((Pointer*)tree1)->value < ((Pointer*)tree2)->value ? -1 : 1;
+	}
+	else if ( tree1->id == LEL_ID_INT ) {
+		if ( ((Int*)tree1)->value != ((Int*)tree2)->value )
+			return ((Int*)tree1)->value < ((Int*)tree2)->value ? -1 : 1;
+	}
+	else if ( tree1->id == LEL_ID_STR ) {
+		cmpres = cmp_string( ((Str*)tree1)->value, ((Str*)tree2)->value );
+		if ( cmpres != 0 )
+			return cmpres;
+	}
+	else if ( tree1->tokdata == 0 || tree2->tokdata == 0 ) {
+		/* At most one side has token data; the side without comes first. */
+		if ( tree1->tokdata != 0 )
+			return 1;
+		if ( tree2->tokdata != 0 )
+			return -1;
+	}
+	else {
+		cmpres = cmp_string( tree1->tokdata, tree2->tokdata );
+		if ( cmpres != 0 )
+			return cmpres;
+	}
+
+	/* Payloads are equal, the children decide. */
+	Kid *kid1 = tree1->child;
+	Kid *kid2 = tree2->child;
+	for ( ; kid1 != 0 && kid2 != 0; kid1 = kid1->next, kid2 = kid2->next ) {
+		cmpres = cmp_tree( kid1->tree, kid2->tree );
+		if ( cmpres != 0 )
+			return cmpres;
+	}
+
+	if ( kid1 == 0 && kid2 == 0 )
+		return 0;
+	return kid1 == 0 ? -1 : 1;
+}
+
+/* This must traverse in the same order that the bindId assignments are done
+ * in.
+ *
+ * Match the pattern node with index pat (-1 stands for no node) against kid.
+ * The ids must agree and, when the pattern node carries data, the token text
+ * of the tree must equal it. A node with bindId > 0 records the tree in
+ * bindings[bindId]. Unless the node is marked stop, the children are matched
+ * as well, and when checkNext is set so are the siblings that follow.
+ * Bindings stored before a later mismatch are left in place. */
+bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool checkNext )
+{
+	PatReplNode *nodes = prg->rtd->patReplNodes;
+
+	#ifdef COLM_LOG_MATCH
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+	cerr << "match_pattern " << ( pat == -1 ? "NULL" : lelInfo[nodes[pat].id].name ) <<
+			" vs " << ( kid == 0 ? "NULL" : lelInfo[kid->tree->id].name ) << endl;
+	#endif
+
+	/* If either side has run out it is a match only when both have. */
+	if ( pat == -1 || kid == 0 )
+		return pat == -1 && kid == 0;
+
+	PatReplNode &node = nodes[pat];
+
+	/* The node types must agree. */
+	if ( node.id != kid->tree->id )
+		return false;
+
+	/* A pattern node with data requires identical token text: same length
+	 * and same bytes. */
+	if ( node.data != 0 ) {
+		if ( node.length != string_length( kid->tree->tokdata ) )
+			return false;
+
+		if ( node.length > 0 && memcmp( node.data,
+				string_data( kid->tree->tokdata ), node.length ) != 0 )
+			return false;
+	}
+
+	/* This node is fine, record the binding if it asks for one. */
+	if ( node.bindId > 0 ) {
+		#ifdef COLM_LOG_MATCH
+		cerr << "bindId: " << nodes[pat].bindId << endl;
+		#endif
+		bindings[node.bindId] = kid->tree;
+	}
+
+	/* If we didn't match a terminal duplicate of a nonterm then check down
+	 * the children. */
+	if ( !node.stop && !match_pattern( bindings, prg,
+			node.child, tree_child( prg, kid->tree ), true ) )
+		return false;
+
+	/* If checking next, then look for failure there. */
+	if ( checkNext && !match_pattern( bindings, prg,
+			node.next, kid->next, true ) )
+		return false;
+
+	return true;
+}
+
-- 
cgit v1.2.1


From f951f02349a96192e4d8230a835997c8cc9bb5d6 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 4 Nov 2008 23:31:32 +0000
Subject: Some organization.

---
 colm/bytecode.cpp |  4 +--
 colm/bytecode.h   | 87 ++++++++++++++++++++++++++++---------------------------
 colm/tree.cpp     |  4 +--
 3 files changed, 49 insertions(+), 46 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index d5c24ecd..be4722a4 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -1806,7 +1806,7 @@ again:
 			cerr << "IN_MAKE_TOKEN " << (ulong) nargs << endl;
 			#endif
 
-			Tree *result = make_token( sp, prg, parser, nargs );
+			Tree *result = make_token( sp, prg, nargs );
 			for ( long i = 0; i < nargs; i++ )
 				tree_downref( prg, sp, pop() );
 			push( result );
@@ -1820,7 +1820,7 @@ again:
 			cerr << "IN_MAKE_TREE " << (ulong) nargs << endl;
 			#endif
 
-			Tree *result = make_tree( sp, prg, parser, nargs );
+			Tree *result = make_tree( sp, prg, nargs );
 			for ( long i = 0; i < nargs; i++ )
 				tree_downref( prg, sp, pop() );
 			push( result );
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 89d0df03..bfee598e 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -398,92 +398,95 @@ struct TreePair
 struct Program;
 struct Stream;
 
+bool test_false( Program *prg, Tree *tree );
+
 Head *string_alloc_new( Program *prg, const char *data, long length );
 Head *string_alloc_const( Program *prg, const char *data, long length );
 Head *string_copy( Program *prg, Head *head );
 void string_free( Program *prg, Head *head );
-
-void print_str( Head *str );
-
 long string_length( Head *str );
 const char *string_data( Head *str );
 void string_shorten( Head *tokdata, long newlen );
-void ignore_data( Tree *tree, char *dest );
-long ignore_length( Tree *tree );
-void free_obj_data( Program *prg, Kid *attrs );
 Head *concat_str( Head *s1, Head *s2 );
-Word cmp_string( Head *s1, Head *s2 );
 Word str_atoi( Head *str );
-Head *int_to_str( Program *prg, Word i );
 Word str_uord16( Head *head );
 Word str_uord8( Head *head );
-Head *make_literal( Program *prg, long litoffset );
+Word cmp_string( Head *s1, Head *s2 );
+
+Head *int_to_str( Program *prg, Word i );
+
 void rcode_downref( Tree **stack_root, Program *prg, Code *instr );
 void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *cv );
-void xml_print_tree( Tree **&sp, Program *prg, Tree *tree );
-void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
 void parsed_downref( Tree **root, Program *prg, Tree *tree );
-Stream *open_stream( Program *prg, FILE *file );
+
+bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool checkNext );
+Head *make_literal( Program *prg, long litoffset );
 Tree *construct_string( Program *prg, Head *s );
+Tree *construct_integer( Program *prg, long i );
+Tree *construct_string( Program *prg, Head *s );
+Tree *construct_pointer( Program *prg, Tree *tree );
+Tree *construct_term( Program *prg, Word id, Head *tokdata );
+Tree *construct_replacement_tree( Tree **bindings, Program *prg, long pat );
+Tree *create_generic( Program *prg, long genericId );
+
+Tree *open_file( Program *prg, Tree *name );
+Stream *open_stream_fd( Program *prg, long fd );
+Stream *open_stream( Program *prg, FILE *file );
 
 void tree_downref( Program *prg, Tree **sp, Tree *tree );
 void tree_upref( Tree *tree );
 Kid *tree_child( Program *prg, Tree *tree );
 Kid *tree_extract_child( Program *prg, Tree *tree );
 Kid *tree_ignore( Program *prg, Tree *tree );
-void print_tree( Tree **&sp, Program *prg, Tree *tree );
-void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
 bool tree_is_ignore( Program *prg, Kid *kid );
 Kid *kid_list_concat( Kid *list1, Kid *list2 );
-Tree *open_file( Program *prg, Tree *name );
-Stream *open_stream_fd( Program *prg, long fd );
+void ignore_data( Tree *tree, char *dest );
+long ignore_length( Tree *tree );
+Tree *split_tree( Program *prg, Tree *t );
 Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
-Tree *create_generic( Program *prg, long genericId );
-void split_ref( Tree **&sp, Program *prg, Ref *fromRef );
-Tree *tree_search( Kid *kid, long id );
-Tree *map_find( Map *map, Tree *key );
-long map_length( Map *map );
+Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
+Tree *make_tree( Tree **root, Program *prg, long nargs );
+Tree *make_token( Tree **root, Program *prg, long nargs );
+
+void print_tree( Tree **&sp, Program *prg, Tree *tree );
+void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
+void print_str( Head *str );
+void xml_print_tree( Tree **&sp, Program *prg, Tree *tree );
+void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
+
 long list_length( List *list );
 void list_append( Program *prg, List *list, Tree *val );
 Tree *list_remove_end( Program *prg, List *list );
 Tree *get_list_mem( List *list, Word field );
 Tree *get_list_mem_split( Program *prg, List *list, Word field );
 Tree *set_list_mem( List *list, Half field, Tree *value );
-Tree *tree_search( Kid *kid, long id );
-Tree *tree_search( Tree *tree, long id );
+
+Tree *map_find( Map *map, Tree *key );
+long map_length( Map *map );
 bool map_insert( Program *prg, Map *map, Tree *key, Tree *element );
 void map_unremove( Program *prg, Map *map, Tree *key, Tree *element );
 Tree *map_uninsert( Program *prg, Map *map, Tree *key );
 Tree *map_store( Program *prg, Map *map, Tree *key, Tree *element );
 Tree *map_unstore( Program *prg, Map *map, Tree *key, Tree *existing );
-Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter );
-Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter );
-Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter );
-bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool checkNext );
 TreePair map_remove( Program *prg, Map *map, Tree *key );
 
-Tree *construct_integer( Program *prg, long i );
-Tree *construct_string( Program *prg, Head *s );
-Tree *construct_pointer( Program *prg, Tree *tree );
-Tree *construct_term( Program *prg, Word id, Head *tokdata );
-bool test_false( Program *prg, Tree *tree );
-Tree *construct_replacement_tree( Tree **bindings, Program *prg, long pat );
-
-void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter );
-Tree *split_tree( Program *prg, Tree *t );
-Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
-Tree *make_tree( Tree **root, Program *prg, PdaRun *parser, long nargs );
-Tree *make_token( Tree **root, Program *prg, PdaRun *parser, long nargs );
-Tree *tree_iter_deref_cur( TreeIter *iter );
-void ref_set_value( Ref *ref, Tree *v );
-
 Tree *get_ptr_val( Pointer *ptr );
 Tree *get_ptr_val_split( Program *prg, Pointer *ptr );
 Tree *get_field( Tree *tree, Word field );
 Tree *get_field_split( Program *prg, Tree *tree, Word field );
 Tree *get_rhs_el( Program *prg, Tree *lhs, long position );
 void set_field( Program *prg, Tree *tree, long field, Tree *value );
+
+Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter );
+Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter );
+Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter );
+Tree *tree_iter_deref_cur( TreeIter *iter );
 void set_triter_cur( TreeIter *iter, Tree *tree );
+void split_iter_cur( Tree **&sp, Program *prg, TreeIter *iter );
+void ref_set_value( Ref *ref, Tree *v );
+Tree *tree_search( Kid *kid, long id );
+Tree *tree_search( Tree *tree, long id );
+void split_ref( Tree **&sp, Program *prg, Ref *fromRef );
 
 /*
  * Maps
diff --git a/colm/tree.cpp b/colm/tree.cpp
index a47c233c..b021785a 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -275,7 +275,7 @@ Kid *construct_replacement_kid( Tree **bindings, Program *prg, Kid *prev, long p
 	return kid;
 }
 
-Tree *make_token( Tree **root, Program *prg, PdaRun *parser, long nargs )
+Tree *make_token( Tree **root, Program *prg, long nargs )
 {
 	Tree **const sp = root;
 	Tree **base = vm_ptop() + nargs;
@@ -315,7 +315,7 @@ Tree *make_token( Tree **root, Program *prg, PdaRun *parser, long nargs )
 	return tree;
 }
 
-Tree *make_tree( Tree **root, Program *prg, PdaRun *parser, long nargs )
+Tree *make_tree( Tree **root, Program *prg, long nargs )
 {
 	Tree **const sp = root;
 	Tree **base = vm_ptop() + nargs;
-- 
cgit v1.2.1


From c1641755c4820f37931f0c1931c43e66b3fea45b Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 5 Nov 2008 03:29:58 +0000
Subject: Updated child() and rev_child() iterators for the merge of attribute,
 ignore and child list. Other fixes for rev_child().

---
 colm/tree.cpp | 65 ++++++++++++++++++++++++++++-------------------------------
 1 file changed, 31 insertions(+), 34 deletions(-)

diff --git a/colm/tree.cpp b/colm/tree.cpp
index b021785a..1206bf91 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -1042,81 +1042,78 @@ Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter )
 Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter )
 {
 	assert( iter->stackSize == iter->stackRoot - vm_ptop() );
+	Kid *kid = 0;
 
 	if ( iter->ref.kid == 0 ) {
 		/* Kid is zero, start from the first child. */
-		if ( iter->rootRef.kid->tree->child == 0 ) {
-			iter->ref.kid = 0;
+		Kid *child = tree_child( prg, iter->rootRef.kid->tree );
+
+		if ( child == 0 )
 			iter->ref.next = 0;
-		}
 		else {
+			/* Make a reference to the root. */
 			vm_push( (SW) iter->rootRef.next );
 			vm_push( (SW) iter->rootRef.kid );
-			iter->ref.kid = iter->rootRef.kid->tree->child;
 			iter->ref.next = (Ref*)vm_ptop();
+
+			kid = child;
 		}
 	}
 	else {
-		iter->ref.kid = iter->ref.kid->next;
+		/* Start at next. */
+		kid = iter->ref.kid->next;
 	}
 
-	bool anyTree = iter->searchId == prg->rtd->anyId;
-	if ( ! anyTree ) {
+	if ( iter->searchId != prg->rtd->anyId ) {
 		/* Have a previous item, go to the next sibling. */
-		while ( iter->ref.kid != 0 && iter->ref.kid->tree->id != iter->searchId ) {
-			iter->ref.kid = iter->ref.kid->next;
-		}
+		while ( kid != 0 && kid->tree->id != iter->searchId )
+			kid = kid->next;
 	}
 
+	iter->ref.kid = kid;
 	iter->stackSize = iter->stackRoot - vm_ptop();
 
-	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
+	return ( iter->ref.kid ? prg->trueVal : prg->falseVal );
 }
 
 Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter )
 {
 	assert( iter->stackSize == iter->stackRoot - vm_ptop() );
+	Kid *startAt = 0, *stopAt = 0, *kid = 0;
 
 	if ( iter->ref.kid == 0 ) {
 		/* Kid is zero, start from the first child. */
-		if ( iter->rootRef.kid->tree->child == 0 ) {
-			iter->ref.kid = 0;
+		Kid *child = tree_child( prg, iter->rootRef.kid->tree );
+
+		if ( child == 0 )
 			iter->ref.next = 0;
-		}
 		else {
 			vm_push( (SW) iter->rootRef.next );
 			vm_push( (SW) iter->rootRef.kid );
-
-			Kid *last = iter->rootRef.kid->tree->child;
-			while ( last->next != 0 )
-				last = last->next;
-
-			iter->ref.kid = last;
 			iter->ref.next = (Ref*)vm_ptop();
+
+			startAt = child;
+			stopAt = 0;
 		}
 	}
 	else {
 		/* Have a previous item, go to the prev sibling. */
-		Kid *wasAt = iter->ref.kid;
 		Kid *parent = (Kid*) vm_top();
-		Kid *cur = 0, *next = parent->tree->child;
 
-		while ( next != wasAt ) {
-			cur = next;
-			next = next->next;
-		}
-
-		iter->ref.kid = cur;
+		startAt = tree_child( prg, parent->tree );
+		stopAt = iter->ref.kid;
 	}
 
-	bool anyTree = iter->searchId == prg->rtd->anyId;
-	if ( ! anyTree ) {
-		/* Have a previous item, go to the next sibling. */
-		while ( iter->ref.kid != 0 && iter->ref.kid->tree->id != iter->searchId ) {
-			iter->ref.kid = iter->ref.kid->next;
-		}
+	while ( startAt != stopAt ) {
+		/* If looking for any, or if last the search type then
+		 * store the match. */
+		if ( iter->searchId == prg->rtd->anyId || 
+				startAt->tree->id == iter->searchId )
+			kid = startAt;
+		startAt = startAt->next;
 	}
 
+	iter->ref.kid = kid;
 	iter->stackSize = iter->stackRoot - vm_ptop();
 
 	return (iter->ref.kid ? prg->trueVal : prg->falseVal );
-- 
cgit v1.2.1


From 1a734b27fc5fef6c848cbf141bf547fcd1f14840 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 5 Nov 2008 19:57:46 +0000
Subject: Need to control the generation of revert instructions at the block
 level. Use a flag pd->revertOn for this.

---
 colm/compile.cpp   | 64 +++++++++++++++++++++++++++++++++++-------------------
 colm/fsmrun.cpp    |  2 +-
 colm/parsedata.cpp |  3 ++-
 colm/parsedata.h   |  5 +++++
 colm/parsetree.h   |  4 +++-
 5 files changed, 53 insertions(+), 25 deletions(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index c0c31721..4f656660 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -311,7 +311,7 @@ UniqueType *LangVarRef::loadFieldInstr( ParseData *pd, CodeVect &code,
 		/* The instruction, depends on whether or not we are reverting. */
 		if ( elUT->typeId == TYPE_ITER )
 			code.append( elUT->iterDef->inGetCurWC );
-		else if ( revert )
+		else if ( pd->revertOn && revert )
 			code.append( el->inGetWV );
 		else
 			code.append( el->inGetWC );
@@ -399,7 +399,7 @@ void LangVarRef::loadQualification( ParseData *pd, CodeVect &code,
 				/* Always dereference references when used for qualification. If
 				 * this is the last one then we must start with the reverse
 				 * execution business. */
-				if ( qi.pos() == lastPtrInQual && forWriting ) {
+				if ( pd->revertOn && qi.pos() == lastPtrInQual && forWriting ) {
 					/* This is like a global load. */
 					code.append( IN_PTR_DEREF_WV );
 				}
@@ -426,7 +426,7 @@ void LangVarRef::loadGlobalObj( ParseData *pd, CodeVect &code,
 	/* Start the search in the global object. */
 	ObjectDef *rootObj = pd->globalObjectDef;
 
-	if ( forWriting && lastPtrInQual < 0 ) {
+	if ( pd->revertOn && forWriting && lastPtrInQual < 0 ) {
 		/* If we are writing an no reference was found in the qualification
 		 * then load the gloabl with a revert. */
 		code.append( IN_LOAD_GLOBAL_WV );
@@ -571,7 +571,7 @@ void LangVarRef::setFieldInstr( ParseData *pd, CodeVect &code,
 	/* Ensure that the field is referenced. */
 	inObject->referenceField( pd, el );
 
-	if ( revert )
+	if ( pd->revertOn && revert )
 		code.append( el->inSetWV );
 	else
 		code.append( el->inSetWC );
@@ -767,7 +767,7 @@ void LangVarRef::callOperation( ParseData *pd, CodeVect &code, VarRefLookup &loo
 	bool revert = lookup.lastPtrInQual >= 0 || !isLocalRef(pd);
 	
 	/* The call instruction. */
-	if ( revert ) 
+	if ( pd->revertOn && revert ) 
 		code.append( lookup.objMethod->opcodeWV );
 	else
 		code.append( lookup.objMethod->opcodeWC );
@@ -1933,6 +1933,7 @@ void ParseData::compileReductionCode( Definition *prod )
 	/* Init the compilation context. */
 	compileContext = CompileReduction;
 	curLocalFrame = block->localFrame;
+	revertOn = true;
 	block->frameId = nextFrameId++;
 
 	/* Add the alloc frame opcode. We don't have the right 
@@ -1968,6 +1969,7 @@ void ParseData::compileTranslateBlock( KlangEl *langEl )
 	/* Set up compilation context. */
 	compileContext = CompileTranslation;
 	curLocalFrame = block->localFrame;
+	revertOn = true;
 	block->frameId = nextFrameId++;
 
 	/* References to the reduce item. */
@@ -2013,6 +2015,7 @@ void ParseData::compilePreEof( TokenRegion *region )
 	/* Set up compilation context. */
 	compileContext = CompileTranslation;
 	curLocalFrame = region->preEofBlock->localFrame;
+	revertOn = true;
 	block->frameId = nextFrameId++;
 
 	/* References to the reduce item. */
@@ -2053,10 +2056,15 @@ void ParseData::compileRootBlock( )
 {
 	CodeBlock *block = rootCodeBlock;
 
+	/* The root block never needs to be reverted. */
+
 	/* Set up the compile context. No locals are needed for the root code
 	 * block, but we need an empty local frame for the compile. */
 	compileContext = CompileRoot;
 	curLocalFrame = rootLocalFrame;
+	revertOn = true;
+
+	/* The block needs a frame id. */
 	block->frameId = nextFrameId++;
 
 	/* Add the alloc frame opcode. We don't have the right 
@@ -2272,6 +2280,7 @@ void ParseData::compileUserIter( Function *func )
 
 	compileContext = CompileFunction;
 	curFunction = func;
+	revertOn = true;
 	block->frameId = nextFrameId++;
 
 	makeFuncVisible( func, true );
@@ -2304,41 +2313,36 @@ void ParseData::compileUserIter( Function *func )
 	/* FIXME: Need to deal with the freeing of local trees. */
 }
 
-void ParseData::compileFunction( Function *func )
+/* Called for each type of function compile: revert and commit. */
+void ParseData::compileFunction( Function *func, CodeVect &code )
 {
 	CodeBlock *block = func->codeBlock;
 
-	compileContext = CompileFunction;
-	curFunction = func;
-	block->frameId = nextFrameId++;
-
-	makeFuncVisible( func, false );
-
 	/* Add the alloc frame opcode. We don't have the right 
 	 * frame size yet. We will fill it in later. */
-	block->code.append( IN_INIT_LOCALS );
-	block->code.appendHalf( 0 );
+	code.append( IN_INIT_LOCALS );
+	code.appendHalf( 0 );
 
 	/* Compile the block. */
-	block->compile( this, block->code );
+	block->compile( this, code );
 
 	/* We have the frame size now. Set in the alloc frame instruction. */
 	int frameSize = func->localFrame->size();
-	block->code.setHalf( 1, frameSize );
+	code.setHalf( 1, frameSize );
 
 	/* Check for a return statement. */
 	if ( block->stmtList->length() == 0 ||
 			block->stmtList->tail->type != LangStmt::ReturnType )
 	{
 		/* Push the return value. */
-		block->code.append( IN_LOAD_NIL );
-		block->code.append( IN_SAVE_RET );
+		code.append( IN_LOAD_NIL );
+		code.append( IN_SAVE_RET );
 	}
 
 	/* Compute the jump distance for the return jumps. */
 	for ( LongVect::Iter rj = returnJumps; rj.lte(); rj++ ) {
-		long distance = block->code.length() - *rj - 3;
-		block->code.setHalf( *rj+1, distance );
+		long distance = code.length() - *rj - 3;
+		code.setHalf( *rj+1, distance );
 	}
 
 	/* Reset the vector of return jumps. */
@@ -2346,8 +2350,24 @@ void ParseData::compileFunction( Function *func )
 
 	/* Return cleans up the stack (including the args) and leaves the return
 	 * value on the top. */
-	block->code.append( IN_RET );
-	block->code.appendHalf( func->funcId );
+	code.append( IN_RET );
+	code.appendHalf( func->funcId );
+}
+
+void ParseData::compileFunction( Function *func )
+{
+	CodeBlock *block = func->codeBlock;
+
+	/* Set up the compilation context. */
+	compileContext = CompileFunction;
+	curFunction = func;
+	revertOn = true;
+
+	/* Assign a frame Id. */
+	block->frameId = nextFrameId++;
+
+	makeFuncVisible( func, false );
+	compileFunction( func, block->code );
 
 	/* Now that compilation is done variables are referenced. Make the local
 	 * trees descriptor. */
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 9ab3b969..6e89e888 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -611,7 +611,7 @@ void send_handle_error( FsmRun *fsmRun, PdaRun *parser, Kid *input )
 
 	#ifdef COLM_LOG_PARSE
 	cerr << "new token region: " << 
-			parser->tables->gbl->regionInfo[region].name << endl;
+			parser->tables->gbl->regionInfo[fsmRun->region].name << endl;
 	#endif
 }
 
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 348d5f85..c564b02f 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -427,7 +427,8 @@ ParseData::ParseData( const String &fileName, const String &sectionName,
 	nextObjectId(1),     /* 0 is  reserved for no object. */
 	nextFrameId(0),
 	nextParserId(0),
-	nextLabelId(0)
+	nextLabelId(0),
+	revertOn(true)
 {
 }
 
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 12a1e07d..12685b04 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -725,7 +725,10 @@ struct ParseData
 	void resolveMapElementOf( ObjectDef *container, ObjectDef *obj, ElementOf *elof );
 	void resolveElementOf( ObjectDef *obj );
 	void makeFuncVisible( Function *func, bool isUserIter );
+
+	void compileFunction( Function *func, CodeVect &code );
 	void compileFunction( Function *func );
+
 	void compileUserIter( Function *func );
 	void compilePreEof( TokenRegion *region );
 	void compileRootBlock();
@@ -877,6 +880,8 @@ struct ParseData
 
 	long nextLabelId;
 	ObjFieldMap *objFieldMap;
+
+	bool revertOn;
 };
 
 void afterOpMinimize( FsmGraph *fsm, bool lastInSeq = true );
diff --git a/colm/parsetree.h b/colm/parsetree.h
index c4c6c9e8..c7514cee 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1565,9 +1565,11 @@ struct CodeBlock
 
 	StmtList *stmtList;
 	ObjectDef *localFrame;
+	CharSet trees;
+
+	/* Write revert and write commit versions. */
 	CodeVect code;
 	long frameId;
-	CharSet trees;
 };
 
 struct Function
-- 
cgit v1.2.1


From 1de8ebcffa2d06c2ce404dc6305eaf6ca05860aa Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 5 Nov 2008 21:05:58 +0000
Subject: Added IN_LOAD_GLOBAL_WC for writes to globals in a commit context.
 Could just use _R version but this would be confusing in the log output.

Specialized IN_CALL into WV and WC versions. Now also compiling functions twice
for WV and WC versions. The call instructions access the right one.
---
 colm/bytecode.cpp   | 33 +++++++++++++++++++++++++++++++--
 colm/bytecode.h     |  4 +++-
 colm/compile.cpp    | 21 ++++++++++++++++-----
 colm/parsetree.h    |  6 +++++-
 colm/pdabuild.cpp   |  5 +++++
 colm/pdacodegen.cpp | 24 ++++++++++++++++++++++++
 colm/pdarun.h       |  2 ++
 7 files changed, 86 insertions(+), 9 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index be4722a4..d6106e48 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -787,6 +787,17 @@ again:
 			rcodeUnitLen = 1;
 			break;
 		}
+		case IN_LOAD_GLOBAL_WC: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_LOAD_GLOBAL_WC" << endl;
+			#endif
+
+			/* This is identical to the _R version, but using it for writing
+			 * would be confusing. */
+			tree_upref( prg->global );
+			push( prg->global );
+			break;
+		}
 		case IN_LOAD_GLOBAL_BKT: {
 			#ifdef COLM_LOG_BYTECODE
 			cerr << "IN_LOAD_GLOBAL_BKT" << endl;
@@ -2568,14 +2579,32 @@ again:
 			popn( size );
 			break;
 		}
-		case IN_CALL: {
+		case IN_CALL_WC: {
+			Half funcId;
+			read_half( funcId );
+
+			FunctionInfo *fi = &prg->rtd->functionInfo[funcId];
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_CALL_WC " << fi->name << endl;
+			#endif
+
+			push( 0 ); /* Return value. */
+			push( (SW)instr );
+			push( (SW)frame );
+
+			instr = prg->rtd->frameInfo[fi->frameId].codeWC;
+			frame = ptop();
+			break;
+		}
+		case IN_CALL_WV: {
 			Half funcId;
 			read_half( funcId );
 
 			FunctionInfo *fi = &prg->rtd->functionInfo[funcId];
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CALL " << fi->name << endl;
+			cerr << "IN_CALL_WV " << fi->name << endl;
 			#endif
 
 			push( 0 ); /* Return value. */
diff --git a/colm/bytecode.h b/colm/bytecode.h
index bfee598e..ad0a7faa 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -127,6 +127,7 @@ typedef unsigned char uchar;
 
 #define IN_LOAD_GLOBAL_R         0x59
 #define IN_LOAD_GLOBAL_WV        0x5a
+#define IN_LOAD_GLOBAL_WC        0x9d
 #define IN_LOAD_GLOBAL_BKT       0x5b
 
 #define IN_PTR_DEREF_R           0x5e
@@ -180,7 +181,8 @@ typedef unsigned char uchar;
 
 #define IN_HALT                  0x8a
 
-#define IN_CALL                  0x8b
+#define IN_CALL_WC               0x8b
+#define IN_CALL_WV               0x9c
 #define IN_RET                   0x8c
 #define IN_YIELD                 0x8d
 #define IN_STOP                  0x8e
diff --git a/colm/compile.cpp b/colm/compile.cpp
index 4f656660..fc76c050 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -426,13 +426,19 @@ void LangVarRef::loadGlobalObj( ParseData *pd, CodeVect &code,
 	/* Start the search in the global object. */
 	ObjectDef *rootObj = pd->globalObjectDef;
 
-	if ( pd->revertOn && forWriting && lastPtrInQual < 0 ) {
+	if ( forWriting && lastPtrInQual < 0 ) {
 		/* If we are writing an no reference was found in the qualification
 		 * then load the gloabl with a revert. */
-		code.append( IN_LOAD_GLOBAL_WV );
+		if ( pd->revertOn )
+			code.append( IN_LOAD_GLOBAL_WV );
+		else
+			code.append( IN_LOAD_GLOBAL_WC );
 	}
-	else
+	else {
+		/* Either we are reading or we are loading a pointer that will be
+		 * dereferenced. */
 		code.append( IN_LOAD_GLOBAL_R );
+	}
 
 	loadQualification( pd, code, rootObj, lastPtrInQual, forWriting, true );
 }
@@ -2259,7 +2265,7 @@ void ParseData::makeFuncVisible( Function *func, bool isUserIter )
 	UniqueType *returnUT = func->typeRef != 0 ? 
 			func->typeRef->lookupType(this) : uniqueTypeInt;
 	ObjMethod *objMethod = new ObjMethod( returnUT, func->name, 
-			IN_CALL, IN_CALL, 
+			IN_CALL_WC, IN_CALL_WV, 
 			func->paramList->length(), paramUTs, func->paramList, false );
 	objMethod->funcId = func->funcId;
 	objMethod->useFuncId = true;
@@ -2361,12 +2367,17 @@ void ParseData::compileFunction( Function *func )
 	/* Set up the compilation context. */
 	compileContext = CompileFunction;
 	curFunction = func;
-	revertOn = true;
 
 	/* Assign a frame Id. */
 	block->frameId = nextFrameId++;
 
 	makeFuncVisible( func, false );
+
+	/* Compile once for revert and once for commit. */
+	revertOn = false;
+	compileFunction( func, block->codeWC );
+
+	revertOn = true;
 	compileFunction( func, block->code );
 
 	/* Now that compilation is done variables are referenced. Make the local
diff --git a/colm/parsetree.h b/colm/parsetree.h
index c7514cee..59fdd7f3 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1567,7 +1567,11 @@ struct CodeBlock
 	ObjectDef *localFrame;
 	CharSet trees;
 
-	/* Write revert and write commit versions. */
+	/* Write commit versions. */
+	CodeVect codeWC;
+	long frameIdWC;
+
+	/* Write revert version. */
 	CodeVect code;
 	long frameId;
 };
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 243d8fe1..aa135470 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1283,8 +1283,13 @@ void ParseData::makeRuntimeData()
 		CodeBlock *block = func->codeBlock;
 		if ( block != 0 ) {
 			runtimeData->functionInfo[func->funcId].frameId = block->frameId;
+
+			runtimeData->frameInfo[block->frameId].codeWC = block->codeWC.data;
+			runtimeData->frameInfo[block->frameId].codeLenWC = block->codeWC.length();
+
 			runtimeData->frameInfo[block->frameId].code = block->code.data;
 			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+
 			runtimeData->frameInfo[block->frameId].trees = block->trees.data;
 			runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
 		}
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 915cb6e5..3b04ef13 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -98,6 +98,23 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 	 * Blocks of code in frames.
 	 */
 	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
+		/* FIXME: horrible code cloning going on here. */
+		if ( runtimeData->frameInfo[i].codeLenWC > 0 ) {
+			out << "Code code_" << i << "_wc[] = {\n\t";
+
+			Code *block = runtimeData->frameInfo[i].codeWC;
+			for ( int j = 0; j < runtimeData->frameInfo[i].codeLenWC; j++ ) {
+				out << (unsigned long) block[j];
+
+				if ( j < runtimeData->frameInfo[i].codeLenWC-1 ) {
+					out << ", ";
+					if ( (j+1) % 8 == 0 )
+						out << "\n\t";
+				}
+			}
+			out << "\n};\n\n";
+		}
+
 		if ( runtimeData->frameInfo[i].codeLen > 0 ) {
 			out << "Code code_" << i << "[] = {\n\t";
 
@@ -189,6 +206,13 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
 		out << "\t{ ";
 
+		if ( runtimeData->frameInfo[i].codeLenWC > 0 )
+			out << "code_" << i << "_wc, ";
+		else
+			out << "0, ";
+
+		out << runtimeData->frameInfo[i].codeLenWC << ", ";
+
 		if ( runtimeData->frameInfo[i].codeLen > 0 )
 			out << "code_" << i << ", ";
 		else
diff --git a/colm/pdarun.h b/colm/pdarun.h
index afac5d77..01996fcb 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -349,6 +349,8 @@ struct ProdInfo
 
 struct FrameInfo
 {
+	Code *codeWC;
+	long codeLenWC;
 	Code *code;
 	long codeLen;
 	char *trees;
-- 
cgit v1.2.1


From d2cea786fe09cdc28252b4088e30154994776b2f Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 5 Nov 2008 22:44:53 +0000
Subject: Fixed some inconsistent ordering of _WV and _WC variables.

---
 colm/compile.cpp | 43 ++++++++++++++++++++++---------------------
 colm/parsetree.h | 14 +++++++-------
 colm/pdarun.h    |  4 ++--
 3 files changed, 31 insertions(+), 30 deletions(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index fc76c050..0cbd7125 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -105,31 +105,31 @@ IterDef::IterDef( Type type, Function *func ) :
 {}
 
 ObjMethod *initFunction( UniqueType *retType, ObjectDef *obj, 
-		const String &name, int methIdWC, int methIdWV, bool isConst )
+		const String &name, int methIdWV, int methIdWC, bool isConst )
 {
 	ObjMethod *objMethod = new ObjMethod( retType, name, 
-			methIdWC, methIdWV, 0, 0, 0, isConst );
+			methIdWV, methIdWC, 0, 0, 0, isConst );
 	obj->objMethodMap->insert( name, objMethod );
 	return objMethod;
 }
 
 ObjMethod *initFunction( UniqueType *retType, ObjectDef *obj, 
-		const String &name, int methIdWC, int methIdWV, UniqueType *arg1, bool isConst )
+		const String &name, int methIdWV, int methIdWC, UniqueType *arg1, bool isConst )
 {
 	UniqueType *args[] = { arg1 };
 	ObjMethod *objMethod = new ObjMethod( retType, name, 
-			methIdWC, methIdWV, 1, args, 0, isConst );
+			methIdWV, methIdWC, 1, args, 0, isConst );
 	obj->objMethodMap->insert( name, objMethod );
 	return objMethod;
 }
 
 ObjMethod *initFunction( UniqueType *retType, ObjectDef *obj, 
-		const String &name, int methIdWC, int methIdWV, 
+		const String &name, int methIdWV, int methIdWC, 
 		UniqueType *arg1, UniqueType *arg2, bool isConst )
 {
 	UniqueType *args[] = { arg1, arg2 };
 	ObjMethod *objMethod = new ObjMethod( retType, name, 
-			methIdWC, methIdWV, 2, args, 0, isConst );
+			methIdWV, methIdWC, 2, args, 0, isConst );
 	obj->objMethodMap->insert( name, objMethod );
 	return objMethod;
 }
@@ -2115,13 +2115,13 @@ void ParseData::initMapFunctions( GenericType *gen )
 {
 	addLengthField( gen->objDef, IN_MAP_LENGTH );
 	initFunction( gen->utArg, gen->objDef, "find", 
-			IN_MAP_FIND, IN_MAP_FIND, gen->keyUT, true );
+			IN_MAP_FIND,      IN_MAP_FIND, gen->keyUT, true );
 	initFunction( uniqueTypeInt, gen->objDef, "insert", 
-			IN_MAP_INSERT_WC, IN_MAP_INSERT_WV, gen->keyUT, gen->utArg, false );
+			IN_MAP_INSERT_WV, IN_MAP_INSERT_WC, gen->keyUT, gen->utArg, false );
 	initFunction( uniqueTypeInt, gen->objDef, "store", 
-			IN_MAP_STORE_WC, IN_MAP_STORE_WV, gen->keyUT, gen->utArg, false );
+			IN_MAP_STORE_WV,  IN_MAP_STORE_WC, gen->keyUT, gen->utArg, false );
 	initFunction( gen->utArg, gen->objDef, "remove", 
-			IN_MAP_REMOVE_WC, IN_MAP_REMOVE_WV, gen->keyUT, false );
+			IN_MAP_REMOVE_WV, IN_MAP_REMOVE_WC, gen->keyUT, false );
 }
 
 void ParseData::initListFunctions( GenericType *gen )
@@ -2129,14 +2129,14 @@ void ParseData::initListFunctions( GenericType *gen )
 	addLengthField( gen->objDef, IN_LIST_LENGTH );
 
 	initFunction( uniqueTypeInt, gen->objDef, "append", 
-			IN_LIST_APPEND_WC, IN_LIST_APPEND_WV, gen->utArg, false );
+			IN_LIST_APPEND_WV, IN_LIST_APPEND_WC, gen->utArg, false );
 	initFunction( uniqueTypeInt, gen->objDef, "push", 
-			IN_LIST_APPEND_WC, IN_LIST_APPEND_WV, gen->utArg, false );
+			IN_LIST_APPEND_WV, IN_LIST_APPEND_WC, gen->utArg, false );
 
 	initFunction( gen->utArg, gen->objDef, "remove_end", 
-			IN_LIST_REMOVE_END_WC, IN_LIST_REMOVE_END_WV, false );
+			IN_LIST_REMOVE_END_WV, IN_LIST_REMOVE_END_WC, false );
 	initFunction( gen->utArg, gen->objDef, "pop", 
-			IN_LIST_REMOVE_END_WC, IN_LIST_REMOVE_END_WV, false );
+			IN_LIST_REMOVE_END_WV, IN_LIST_REMOVE_END_WC, false );
 }
 
 void ParseData::initListField( GenericType *gen, const char *name, int offset )
@@ -2172,9 +2172,9 @@ void ParseData::initVectorFunctions( GenericType *gen )
 {
 	addLengthField( gen->objDef, IN_VECTOR_LENGTH );
 	initFunction( uniqueTypeInt, gen->objDef, "append", 
-			IN_VECTOR_APPEND_WC, IN_VECTOR_APPEND_WV, gen->utArg, false );
+			IN_VECTOR_APPEND_WV, IN_VECTOR_APPEND_WC, gen->utArg, false );
 	initFunction( uniqueTypeInt, gen->objDef, "insert", 
-			IN_VECTOR_INSERT_WC, IN_VECTOR_INSERT_WV, uniqueTypeInt, gen->utArg, false );
+			IN_VECTOR_INSERT_WV, IN_VECTOR_INSERT_WC, uniqueTypeInt, gen->utArg, false );
 }
 
 void ParseData::resolveGenericTypes()
@@ -2265,7 +2265,7 @@ void ParseData::makeFuncVisible( Function *func, bool isUserIter )
 	UniqueType *returnUT = func->typeRef != 0 ? 
 			func->typeRef->lookupType(this) : uniqueTypeInt;
 	ObjMethod *objMethod = new ObjMethod( returnUT, func->name, 
-			IN_CALL_WC, IN_CALL_WV, 
+			IN_CALL_WV, IN_CALL_WC, 
 			func->paramList->length(), paramUTs, func->paramList, false );
 	objMethod->funcId = func->funcId;
 	objMethod->useFuncId = true;
@@ -2373,13 +2373,14 @@ void ParseData::compileFunction( Function *func )
 
 	makeFuncVisible( func, false );
 
-	/* Compile once for revert and once for commit. */
-	revertOn = false;
-	compileFunction( func, block->codeWC );
-
+	/* Compile once for revert. */
 	revertOn = true;
 	compileFunction( func, block->code );
 
+	/* Compile once for commit. */
+	revertOn = false;
+	compileFunction( func, block->codeWC );
+
 	/* Now that compilation is done variables are referenced. Make the local
 	 * trees descriptor. */
 	findLocalTrees( block->trees );
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 59fdd7f3..67ac95b8 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1142,12 +1142,12 @@ typedef DList<ObjField> ParameterList;
 struct ObjMethod
 {
 	ObjMethod( UniqueType *returnUT, String name, 
-			int opcodeWC, int opcodeWV, int numParams, 
+			int opcodeWV, int opcodeWC, int numParams, 
 			UniqueType **types, ParameterList *paramList, bool isConst )
 		: 
 			returnUT(returnUT),
 			returnTypeId(0), name(name), 
-			opcodeWC(opcodeWC), opcodeWV(opcodeWV), 
+			opcodeWV(opcodeWV), opcodeWC(opcodeWC), 
 			numParams(numParams), paramList(paramList), 
 			isConst(isConst), funcId(0), 
 			useFuncId(false), useCallObj(true), func(0), 
@@ -1160,8 +1160,8 @@ struct ObjMethod
 	UniqueType *returnUT;
 	long returnTypeId;
 	String name;
-	long opcodeWC;
 	long opcodeWV;
+	long opcodeWC;
 	long numParams;
 	UniqueType **paramUTs;
 	ParameterList *paramList;
@@ -1567,13 +1567,13 @@ struct CodeBlock
 	ObjectDef *localFrame;
 	CharSet trees;
 
-	/* Write commit versions. */
-	CodeVect codeWC;
-	long frameIdWC;
-
 	/* Write revert version. */
 	CodeVect code;
 	long frameId;
+
+	/* Write commit versions. */
+	CodeVect codeWC;
+	long frameIdWC;
 };
 
 struct Function
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 01996fcb..5dfe230c 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -349,10 +349,10 @@ struct ProdInfo
 
 struct FrameInfo
 {
-	Code *codeWC;
-	long codeLenWC;
 	Code *code;
 	long codeLen;
+	Code *codeWC;
+	long codeLenWC;
 	char *trees;
 	long treesLen;
 };
-- 
cgit v1.2.1


From e88b5fa8de227c1c9d95fcc1d9e60f4f91390fb3 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 5 Nov 2008 23:05:16 +0000
Subject: Some fixes for _WV and _WC frames. Also some cleanup.

---
 colm/bytecode.cpp   | 12 ++++++------
 colm/compile.cpp    | 16 ++++++++--------
 colm/parsedata.h    |  2 +-
 colm/parsetree.h    | 13 +++++--------
 colm/pdabuild.cpp   |  6 +++---
 colm/pdacodegen.cpp | 28 ++++++++++++++--------------
 6 files changed, 37 insertions(+), 40 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index d6106e48..17c9390e 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -2579,39 +2579,39 @@ again:
 			popn( size );
 			break;
 		}
-		case IN_CALL_WC: {
+		case IN_CALL_WV: {
 			Half funcId;
 			read_half( funcId );
 
 			FunctionInfo *fi = &prg->rtd->functionInfo[funcId];
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CALL_WC " << fi->name << endl;
+			cerr << "IN_CALL_WV " << fi->name << endl;
 			#endif
 
 			push( 0 ); /* Return value. */
 			push( (SW)instr );
 			push( (SW)frame );
 
-			instr = prg->rtd->frameInfo[fi->frameId].codeWC;
+			instr = prg->rtd->frameInfo[fi->frameId].code;
 			frame = ptop();
 			break;
 		}
-		case IN_CALL_WV: {
+		case IN_CALL_WC: {
 			Half funcId;
 			read_half( funcId );
 
 			FunctionInfo *fi = &prg->rtd->functionInfo[funcId];
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CALL_WV " << fi->name << endl;
+			cerr << "IN_CALL_WC " << fi->name << endl;
 			#endif
 
 			push( 0 ); /* Return value. */
 			push( (SW)instr );
 			push( (SW)frame );
 
-			instr = prg->rtd->frameInfo[fi->frameId].code;
+			instr = prg->rtd->frameInfo[fi->frameId].codeWC;
 			frame = ptop();
 			break;
 		}
diff --git a/colm/compile.cpp b/colm/compile.cpp
index 0cbd7125..ed2c6803 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1718,20 +1718,20 @@ void ParseData::addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList )
 	}
 }
 
-void ParseData::addProdRHSLoads( Definition *prod, long codeInsertPos )
+void ParseData::addProdRHSLoads( Definition *prod, long codeInsertPos, CodeVect &code )
 {
-	CodeVect code;
+	CodeVect loads;
 	long position = 0;
 	for ( ProdElList::Iter rhsEl = *prod->prodElList; rhsEl.lte(); rhsEl++, position++ ) {
 		if ( rhsEl->type == PdaFactor::ReferenceType ) {
 			if ( rhsEl->objField->beenReferenced ) {
-				code.append ( IN_INIT_RHS_EL );
-				code.appendHalf( position );
-				code.appendHalf( rhsEl->objField->offset );
+				loads.append ( IN_INIT_RHS_EL );
+				loads.appendHalf( position );
+				loads.appendHalf( rhsEl->objField->offset );
 			}
 		}
 	}
-	prod->redBlock->code.insert( codeInsertPos, code );
+	code.insert( codeInsertPos, loads );
 }
 
 void ParseData::addMatchLength( ObjectDef *frame, KlangEl *lel )
@@ -1955,7 +1955,7 @@ void ParseData::compileReductionCode( Definition *prod )
 	long frameSize = curLocalFrame->size();
 	block->code.setHalf( 1, frameSize );
 
-	addProdRHSLoads( prod, afterAllocFrame );
+	addProdRHSLoads( prod, afterAllocFrame, block->code );
 
 	block->code.append( IN_POP_LOCALS );
 	block->code.appendHalf( block->frameId );
@@ -2068,7 +2068,7 @@ void ParseData::compileRootBlock( )
 	 * block, but we need an empty local frame for the compile. */
 	compileContext = CompileRoot;
 	curLocalFrame = rootLocalFrame;
-	revertOn = true;
+	revertOn = false;
 
 	/* The block needs a frame id. */
 	block->frameId = nextFrameId++;
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 12685b04..0793574d 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -681,7 +681,7 @@ struct ParseData
 	void addMatchText( ObjectDef *frame, KlangEl *lel );
 	void addMatchLength( ObjectDef *frame, KlangEl *lel );
 	void addTransTokVar( ObjectDef *frame, KlangEl *lel );
-	void addProdRHSLoads( Definition *prod, long pos );
+	void addProdRHSLoads( Definition *prod, long pos, CodeVect &code );
 	void addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList );
 	void addProdRedObjectVar( ObjectDef *localFrame, KlangEl *langEl );
 	void addProdObjects();
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 67ac95b8..9d49d314 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1559,21 +1559,18 @@ struct LangStmt
 struct CodeBlock
 {
 	CodeBlock( StmtList *stmtList ) 
-		: stmtList(stmtList), localFrame(0), frameId(-1) {}
+		: frameId(-1), stmtList(stmtList), localFrame(0) {}
 
 	void compile( ParseData *pd, CodeVect &code );
 
+	long frameId;
 	StmtList *stmtList;
 	ObjectDef *localFrame;
 	CharSet trees;
 
-	/* Write revert version. */
-	CodeVect code;
-	long frameId;
-
-	/* Write commit versions. */
-	CodeVect codeWC;
-	long frameIdWC;
+	/* Each frame has two versions of 
+	 * the code: revert and commit. */
+	CodeVect code, codeWC;
 };
 
 struct Function
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index aa135470..538ed313 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1284,12 +1284,12 @@ void ParseData::makeRuntimeData()
 		if ( block != 0 ) {
 			runtimeData->functionInfo[func->funcId].frameId = block->frameId;
 
-			runtimeData->frameInfo[block->frameId].codeWC = block->codeWC.data;
-			runtimeData->frameInfo[block->frameId].codeLenWC = block->codeWC.length();
-
 			runtimeData->frameInfo[block->frameId].code = block->code.data;
 			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
 
+			runtimeData->frameInfo[block->frameId].codeWC = block->codeWC.data;
+			runtimeData->frameInfo[block->frameId].codeLenWC = block->codeWC.length();
+
 			runtimeData->frameInfo[block->frameId].trees = block->trees.data;
 			runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
 		}
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 3b04ef13..3344a0f6 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -99,14 +99,14 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 	 */
 	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
 		/* FIXME: horrible code cloning going on here. */
-		if ( runtimeData->frameInfo[i].codeLenWC > 0 ) {
-			out << "Code code_" << i << "_wc[] = {\n\t";
+		if ( runtimeData->frameInfo[i].codeLen > 0 ) {
+			out << "Code code_" << i << "[] = {\n\t";
 
-			Code *block = runtimeData->frameInfo[i].codeWC;
-			for ( int j = 0; j < runtimeData->frameInfo[i].codeLenWC; j++ ) {
+			Code *block = runtimeData->frameInfo[i].code;
+			for ( int j = 0; j < runtimeData->frameInfo[i].codeLen; j++ ) {
 				out << (unsigned long) block[j];
 
-				if ( j < runtimeData->frameInfo[i].codeLenWC-1 ) {
+				if ( j < runtimeData->frameInfo[i].codeLen-1 ) {
 					out << ", ";
 					if ( (j+1) % 8 == 0 )
 						out << "\n\t";
@@ -115,14 +115,14 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 			out << "\n};\n\n";
 		}
 
-		if ( runtimeData->frameInfo[i].codeLen > 0 ) {
-			out << "Code code_" << i << "[] = {\n\t";
+		if ( runtimeData->frameInfo[i].codeLenWC > 0 ) {
+			out << "Code code_" << i << "_wc[] = {\n\t";
 
-			Code *block = runtimeData->frameInfo[i].code;
-			for ( int j = 0; j < runtimeData->frameInfo[i].codeLen; j++ ) {
+			Code *block = runtimeData->frameInfo[i].codeWC;
+			for ( int j = 0; j < runtimeData->frameInfo[i].codeLenWC; j++ ) {
 				out << (unsigned long) block[j];
 
-				if ( j < runtimeData->frameInfo[i].codeLen-1 ) {
+				if ( j < runtimeData->frameInfo[i].codeLenWC-1 ) {
 					out << ", ";
 					if ( (j+1) % 8 == 0 )
 						out << "\n\t";
@@ -206,15 +206,15 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
 		out << "\t{ ";
 
-		if ( runtimeData->frameInfo[i].codeLenWC > 0 )
-			out << "code_" << i << "_wc, ";
+		if ( runtimeData->frameInfo[i].codeLen > 0 )
+			out << "code_" << i << ", ";
 		else
 			out << "0, ";
 
 		out << runtimeData->frameInfo[i].codeLenWC << ", ";
 
-		if ( runtimeData->frameInfo[i].codeLen > 0 )
-			out << "code_" << i << ", ";
+		if ( runtimeData->frameInfo[i].codeLenWC > 0 )
+			out << "code_" << i << "_wc, ";
 		else
 			out << "0, ";
 
-- 
cgit v1.2.1


From ac5de86f48a71ae57fcab8c66942f40e886b9d34 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 5 Nov 2008 23:39:27 +0000
Subject: more work on the specialization of frame code into codeWV and codeWC

---
 colm/bytecode.cpp   |  4 +--
 colm/compile.cpp    | 93 ++++++++++++++++++++++++++++++-----------------------
 colm/fsmrun.cpp     |  4 +--
 colm/parsetree.h    |  2 +-
 colm/pdabuild.cpp   | 27 +++++++++-------
 colm/pdacodegen.cpp | 21 ++++++------
 colm/pdarun.cpp     |  2 +-
 colm/pdarun.h       |  4 +--
 8 files changed, 84 insertions(+), 73 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 17c9390e..b5582b67 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -2593,7 +2593,7 @@ again:
 			push( (SW)instr );
 			push( (SW)frame );
 
-			instr = prg->rtd->frameInfo[fi->frameId].code;
+			instr = prg->rtd->frameInfo[fi->frameId].codeWV;
 			frame = ptop();
 			break;
 		}
@@ -2675,7 +2675,7 @@ again:
 			/* Now set up the first yeild. */
 			uiter->ref.kid = 0;
 			uiter->stackSize = uiter->stackRoot - ptop();
-			uiter->resume = prg->rtd->frameInfo[fi->frameId].code;
+			uiter->resume = prg->rtd->frameInfo[fi->frameId].codeWV;
 			uiter->frame = &uiter->stackRoot[-IFR_AA];
 
 			upref_uiter_args( frame, fi->argSize );
diff --git a/colm/compile.cpp b/colm/compile.cpp
index ed2c6803..beab23ac 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1942,26 +1942,28 @@ void ParseData::compileReductionCode( Definition *prod )
 	revertOn = true;
 	block->frameId = nextFrameId++;
 
+	CodeVect &code = block->codeWV;
+
 	/* Add the alloc frame opcode. We don't have the right 
 	 * frame size yet. We will fill it in later. */
-	block->code.append( IN_INIT_LOCALS );
-	block->code.appendHalf( 0 );
-	long afterAllocFrame = block->code.length();
+	code.append( IN_INIT_LOCALS );
+	code.appendHalf( 0 );
+	long afterAllocFrame = code.length();
 
 	/* Compile the reduce block. */
-	block->compile( this, block->code );
+	block->compile( this, code );
 
 	/* We have the frame size now. Set in the alloc frame instruction. */
 	long frameSize = curLocalFrame->size();
-	block->code.setHalf( 1, frameSize );
+	code.setHalf( 1, frameSize );
 
-	addProdRHSLoads( prod, afterAllocFrame, block->code );
+	addProdRHSLoads( prod, afterAllocFrame, code );
 
-	block->code.append( IN_POP_LOCALS );
-	block->code.appendHalf( block->frameId );
-	block->code.appendHalf( frameSize );
+	code.append( IN_POP_LOCALS );
+	code.appendHalf( block->frameId );
+	code.appendHalf( frameSize );
 
-	block->code.append( IN_STOP );
+	code.append( IN_STOP );
 
 	/* Now that compilation is done variables are referenced. Make the local
 	 * trees descriptor. */
@@ -1991,23 +1993,25 @@ void ParseData::compileTranslateBlock( KlangEl *langEl )
 	initFunction( uniqueTypeInt, curLocalFrame, "send_ignore",
 			IN_IGNORE, IN_IGNORE, uniqueTypeAny, true );
 
+	CodeVect &code = block->codeWV;
+
 	/* Add the alloc frame opcode. We don't have the right 
 	 * frame size yet. We will fill it in later. */
-	block->code.append( IN_INIT_LOCALS );
-	block->code.appendHalf( 0 );
+	code.append( IN_INIT_LOCALS );
+	code.appendHalf( 0 );
 
 	/* Set the local frame and compile the reduce block. */
-	block->compile( this, block->code );
+	block->compile( this, code );
 
 	/* We have the frame size now. Set in the alloc frame instruction. */
 	long frameSize = curLocalFrame->size();
-	block->code.setHalf( 1, frameSize );
+	code.setHalf( 1, frameSize );
 
-	block->code.append( IN_POP_LOCALS );
-	block->code.appendHalf( block->frameId );
-	block->code.appendHalf( frameSize );
+	code.append( IN_POP_LOCALS );
+	code.appendHalf( block->frameId );
+	code.appendHalf( frameSize );
 
-	block->code.append( IN_STOP );
+	code.append( IN_STOP );
 
 	/* Now that compilation is done variables are referenced. Make the local
 	 * trees descriptor. */
@@ -2035,23 +2039,25 @@ void ParseData::compilePreEof( TokenRegion *region )
 	initFunction( uniqueTypeInt, curLocalFrame, "send_ignore",
 			IN_IGNORE, IN_IGNORE, uniqueTypeAny, true );
 
+	CodeVect &code = block->codeWV;
+
 	/* Add the alloc frame opcode. We don't have the right 
 	 * frame size yet. We will fill it in later. */
-	block->code.append( IN_INIT_LOCALS );
-	block->code.appendHalf( 0 );
+	code.append( IN_INIT_LOCALS );
+	code.appendHalf( 0 );
 
 	/* Set the local frame and compile the reduce block. */
-	block->compile( this, block->code );
+	block->compile( this, code );
 
 	/* We have the frame size now. Set in the alloc frame instruction. */
 	long frameSize = curLocalFrame->size();
-	block->code.setHalf( 1, frameSize );
+	code.setHalf( 1, frameSize );
 
-	block->code.append( IN_POP_LOCALS );
-	block->code.appendHalf( block->frameId );
-	block->code.appendHalf( frameSize );
+	code.append( IN_POP_LOCALS );
+	code.appendHalf( block->frameId );
+	code.appendHalf( frameSize );
 
-	block->code.append( IN_STOP );
+	code.append( IN_STOP );
 
 	/* Now that compilation is done variables are referenced. Make the local
 	 * trees descriptor. */
@@ -2073,22 +2079,25 @@ void ParseData::compileRootBlock( )
 	/* The block needs a frame id. */
 	block->frameId = nextFrameId++;
 
+	/* The root block is not reverted. */
+	CodeVect &code = block->codeWC;
+
 	/* Add the alloc frame opcode. We don't have the right 
 	 * frame size yet. We will fill it in later. */
-	block->code.append( IN_INIT_LOCALS );
-	block->code.appendHalf( 0 );
+	code.append( IN_INIT_LOCALS );
+	code.appendHalf( 0 );
 
-	block->compile( this, block->code );
+	block->compile( this, code );
 
 	/* We have the frame size now. Store it in frame init. */
 	long frameSize = curLocalFrame->size();
-	block->code.setHalf( 1, frameSize );
+	code.setHalf( 1, frameSize );
 
-	block->code.append( IN_POP_LOCALS );
-	block->code.appendHalf( block->frameId );
-	block->code.appendHalf( frameSize );
+	code.append( IN_POP_LOCALS );
+	code.appendHalf( block->frameId );
+	code.appendHalf( frameSize );
 
-	block->code.append( IN_STOP );
+	code.append( IN_STOP );
 
 	/* Make the local trees descriptor. */
 	findLocalTrees( block->trees );
@@ -2291,25 +2300,27 @@ void ParseData::compileUserIter( Function *func )
 
 	makeFuncVisible( func, true );
 
+	CodeVect &code = block->codeWV;
+
 	/* Add the alloc frame opcode. We don't have the right 
 	 * frame size yet. We will fill it in later. */
-	block->code.append( IN_INIT_LOCALS );
-	block->code.appendHalf( 0 );
+	code.append( IN_INIT_LOCALS );
+	code.appendHalf( 0 );
 
 	/* Compile the block. */
-	block->compile( this, block->code );
+	block->compile( this, code );
 
 	/* We have the frame size now. Set in the alloc frame instruction. */
 	int frameSize = func->localFrame->size();
-	block->code.setHalf( 1, frameSize );
+	code.setHalf( 1, frameSize );
 
 	/* Check for a return statement. */
 	if ( block->stmtList->length() == 0 ||
 			block->stmtList->tail->type != LangStmt::YieldType )
 	{
 		/* Push the return value. */
-		block->code.append( IN_LOAD_NIL );
-		block->code.append( IN_YIELD );
+		code.append( IN_LOAD_NIL );
+		code.append( IN_YIELD );
 	}
 
 	/* Now that compilation is done variables are referenced. Make the local
@@ -2375,7 +2386,7 @@ void ParseData::compileFunction( Function *func )
 
 	/* Compile once for revert. */
 	revertOn = true;
-	compileFunction( func, block->code );
+	compileFunction( func, block->codeWV );
 
 	/* Compile once for commit. */
 	revertOn = false;
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 6e89e888..993936f6 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -359,7 +359,7 @@ void FsmRun::sendEOF( )
 		cerr << "HAVE PRE_EOF BLOCK" << endl;
 		#endif
 
-		Code *code = parser->tables->gbl->frameInfo[frameId].code;
+		Code *code = parser->tables->gbl->frameInfo[frameId].codeWV;
 	
 		/* Execute the translation. */
 		Execution execution( prg, parser->reverseCode, 
@@ -486,7 +486,7 @@ void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bind
 
 	/* Find the code. */
 	Code *code = parser->tables->gbl->frameInfo[
-			parser->tables->gbl->lelInfo[id].frameId].code;
+			parser->tables->gbl->lelInfo[id].frameId].codeWV;
 	
 	/* Execute the translation. */
 	Execution execution( prg, parser->reverseCode, 
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 9d49d314..72beac98 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1570,7 +1570,7 @@ struct CodeBlock
 
 	/* Each frame has two versions of 
 	 * the code: revert and commit. */
-	CodeVect code, codeWC;
+	CodeVect codeWV, codeWC;
 };
 
 struct Function
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 538ed313..c81fb8e4 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1167,12 +1167,12 @@ void ParseData::makeRuntimeData()
 		runtimeData->rootCodeLen = 0;
 	}
 	else {
-		runtimeData->rootCode = rootCodeBlock->code.data;
-		runtimeData->rootCodeLen = rootCodeBlock->code.length();
+		runtimeData->rootCode = rootCodeBlock->codeWC.data;
+		runtimeData->rootCodeLen = rootCodeBlock->codeWC.length();
 	}
 
-	runtimeData->frameInfo[rootCodeBlock->frameId].code = 0;
-	runtimeData->frameInfo[rootCodeBlock->frameId].codeLen = 0;
+	runtimeData->frameInfo[rootCodeBlock->frameId].codeWV = 0;
+	runtimeData->frameInfo[rootCodeBlock->frameId].codeLenWV = 0;
 	runtimeData->frameInfo[rootCodeBlock->frameId].trees = rootCodeBlock->trees.data;
 	runtimeData->frameInfo[rootCodeBlock->frameId].treesLen = rootCodeBlock->trees.length();
 
@@ -1193,8 +1193,9 @@ void ParseData::makeRuntimeData()
 		CodeBlock *block = prod->redBlock;
 		if ( block != 0 ) {
 			runtimeData->prodInfo[count].frameId = block->frameId;
-			runtimeData->frameInfo[block->frameId].code = block->code.data;
-			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+			runtimeData->frameInfo[block->frameId].codeWV = block->codeWV.data;
+			runtimeData->frameInfo[block->frameId].codeLenWV = block->codeWV.length();
+
 			runtimeData->frameInfo[block->frameId].trees = block->trees.data;
 			runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
 		}
@@ -1220,8 +1221,9 @@ void ParseData::makeRuntimeData()
 		CodeBlock *block = reg->preEofBlock;
 		if ( block != 0 ) {
 			runtimeData->regionInfo[regId].eofFrameId = block->frameId;
-			runtimeData->frameInfo[block->frameId].code = block->code.data;
-			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+			runtimeData->frameInfo[block->frameId].codeWV = block->codeWV.data;
+			runtimeData->frameInfo[block->frameId].codeLenWV = block->codeWV.length();
+
 			runtimeData->frameInfo[block->frameId].trees = block->trees.data;
 			runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
 		}
@@ -1247,8 +1249,9 @@ void ParseData::makeRuntimeData()
 			CodeBlock *block = lel->transBlock;
 			if ( block != 0 ) {
 				runtimeData->lelInfo[i].frameId = block->frameId;
-				runtimeData->frameInfo[block->frameId].code = block->code.data;
-				runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+				runtimeData->frameInfo[block->frameId].codeWV = block->codeWV.data;
+				runtimeData->frameInfo[block->frameId].codeLenWV = block->codeWV.length();
+
 				runtimeData->frameInfo[block->frameId].trees = block->trees.data;
 				runtimeData->frameInfo[block->frameId].treesLen = block->trees.length();
 			}
@@ -1284,8 +1287,8 @@ void ParseData::makeRuntimeData()
 		if ( block != 0 ) {
 			runtimeData->functionInfo[func->funcId].frameId = block->frameId;
 
-			runtimeData->frameInfo[block->frameId].code = block->code.data;
-			runtimeData->frameInfo[block->frameId].codeLen = block->code.length();
+			runtimeData->frameInfo[block->frameId].codeWV = block->codeWV.data;
+			runtimeData->frameInfo[block->frameId].codeLenWV = block->codeWV.length();
 
 			runtimeData->frameInfo[block->frameId].codeWC = block->codeWC.data;
 			runtimeData->frameInfo[block->frameId].codeLenWC = block->codeWC.length();
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 3344a0f6..399209a8 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -99,14 +99,14 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 	 */
 	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
 		/* FIXME: horrible code cloning going on here. */
-		if ( runtimeData->frameInfo[i].codeLen > 0 ) {
-			out << "Code code_" << i << "[] = {\n\t";
+		if ( runtimeData->frameInfo[i].codeLenWV > 0 ) {
+			out << "Code code_" << i << "_wv[] = {\n\t";
 
-			Code *block = runtimeData->frameInfo[i].code;
-			for ( int j = 0; j < runtimeData->frameInfo[i].codeLen; j++ ) {
+			Code *block = runtimeData->frameInfo[i].codeWV;
+			for ( int j = 0; j < runtimeData->frameInfo[i].codeLenWV; j++ ) {
 				out << (unsigned long) block[j];
 
-				if ( j < runtimeData->frameInfo[i].codeLen-1 ) {
+				if ( j < runtimeData->frameInfo[i].codeLenWV-1 ) {
 					out << ", ";
 					if ( (j+1) % 8 == 0 )
 						out << "\n\t";
@@ -206,25 +206,22 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 	for ( int i = 0; i < runtimeData->numFrames; i++ ) {
 		out << "\t{ ";
 
-		if ( runtimeData->frameInfo[i].codeLen > 0 )
-			out << "code_" << i << ", ";
+		if ( runtimeData->frameInfo[i].codeLenWV > 0 )
+			out << "code_" << i << "_wv, ";
 		else
 			out << "0, ";
-
-		out << runtimeData->frameInfo[i].codeLenWC << ", ";
+		out << runtimeData->frameInfo[i].codeLenWV << ", ";
 
 		if ( runtimeData->frameInfo[i].codeLenWC > 0 )
 			out << "code_" << i << "_wc, ";
 		else
 			out << "0, ";
-
-		out << runtimeData->frameInfo[i].codeLen << ", ";
+		out << runtimeData->frameInfo[i].codeLenWC << ", ";
 
 		if ( runtimeData->frameInfo[i].treesLen > 0 )
 			out << "trees_" << i << ", ";
 		else
 			out << "0, ";
-
 		out << runtimeData->frameInfo[i].treesLen << ", ";
 
 		out << " }";
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 828596a9..b7708c38 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -416,7 +416,7 @@ again:
 
 			/* Execution environment for the reduction code. */
 			Execution execution( prg, reverseCode, 
-					this, fi->code, redLel->tree, 0 );
+					this, fi->codeWV, redLel->tree, 0 );
 
 			/* Take a copy of the lhs and store it in alg. May need it during
 			 * reverse parsing. */
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 5dfe230c..f32c178e 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -349,8 +349,8 @@ struct ProdInfo
 
 struct FrameInfo
 {
-	Code *code;
-	long codeLen;
+	Code *codeWV;
+	long codeLenWV;
 	Code *codeWC;
 	long codeLenWC;
 	char *trees;
-- 
cgit v1.2.1


From e3fc2ae83a576bf0dca0a313d06fe9a9e4b35715 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 6 Nov 2008 01:33:59 +0000
Subject: The revertOn flag is now passed to parser. But there are problems ...
 compiling a function twice overpopulates accumulated data structures.

---
 colm/bytecode.cpp  | 10 ++++++----
 colm/compile.cpp   |  1 +
 colm/parsedata.cpp |  4 ++--
 colm/pdarun.cpp    |  6 +++---
 colm/pdarun.h      |  7 +++++--
 5 files changed, 17 insertions(+), 11 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index b5582b67..fc4f862b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -118,10 +118,10 @@ void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 }
 
 Tree *parse( Tree **&sp, Program *prg, Stream *stream, 
-		long parserId, long stopId, CodeVect *&cv )
+		long parserId, long stopId, CodeVect *&cv, bool revertOn )
 {
 	PdaTables *tables = prg->rtd->parsers[parserId];
-	PdaRun parser( sp, prg, tables, stream->scanner, stopId );
+	PdaRun parser( sp, prg, tables, stream->scanner, stopId, revertOn );
 	parser.run();
 	parser.commit();
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
@@ -137,7 +137,7 @@ void undo_parse( Tree **&sp, Program *prg, Stream *stream,
 		long parserId, Tree *tree, CodeVect *rev )
 {
 	PdaTables *tables = prg->rtd->parsers[parserId];
-	PdaRun parser( sp, prg, tables, stream->scanner, 0 );
+	PdaRun parser( sp, prg, tables, stream->scanner, 0, false );
 	parser.undoParse( tree, rev );
 }
 
@@ -1649,8 +1649,10 @@ again:
 		}
 		case IN_PARSE: {
 			Half parserId, stopId;
+			uchar revertOn;
 			read_half( parserId );
 			read_half( stopId );
+			read_byte( revertOn );
 
 			#ifdef COLM_LOG_BYTECODE
 			cerr << "IN_PARSE " << parserId << " " << stopId << endl;
@@ -1659,7 +1661,7 @@ again:
 			/* Comes back from parse upreffed. */
 			CodeVect *cv;
 			Tree *stream = pop();
-			Tree *res = parse( sp, prg, (Stream*)stream, parserId, stopId, cv );
+			Tree *res = parse( sp, prg, (Stream*)stream, parserId, stopId, cv, revertOn );
 			push( res );
 
 			/* Single unit. */
diff --git a/colm/compile.cpp b/colm/compile.cpp
index beab23ac..3e293acb 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1002,6 +1002,7 @@ UniqueType *LangTerm::evaluateParse( ParseData *pd, CodeVect &code, bool stop )
 		code.appendHalf( ut->langEl->id );
 	else 
 		code.appendHalf( 0 );
+	code.append( pd->revertOn );
 	return ut;
 }
 
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index c564b02f..3fadf73d 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1636,7 +1636,7 @@ void ParseData::parsePatterns()
 		InputStreamRepl in( repl );
 		fsmRun.attachInputStream( &in );
 
-		repl->pdaRun = new PdaRun( 0, &program, repl->langEl->pdaTables, &fsmRun, 0 );
+		repl->pdaRun = new PdaRun( 0, &program, repl->langEl->pdaTables, &fsmRun, 0, false );
 		repl->pdaRun->run();
 
 		//#ifdef COLM_LOG_COMPILE
@@ -1649,7 +1649,7 @@ void ParseData::parsePatterns()
 		InputStreamPattern in( pat );
 		fsmRun.attachInputStream( &in );
 
-		pat->pdaRun = new PdaRun( 0, &program, pat->langEl->pdaTables, &fsmRun, 0 );
+		pat->pdaRun = new PdaRun( 0, &program, pat->langEl->pdaTables, &fsmRun, 0, false );
 		pat->pdaRun->run();
 
 		//#ifdef COLM_LOG_COMPILE
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index b7708c38..d058df73 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -260,9 +260,9 @@ void PdaRun::commit()
 	assert( sp == root );
 
 	/* We cannot always clear all the rcode here. We may need to backup over
-	 * the parse statement. In the future we should compute when it is safe to
-	 * do so, but for now just leave everything until later. */
-//	rcode_downref_all( root, prg, allReverseCode );
+	 * the parse statement. We depend on the context flag. */
+	if ( !revertOn )
+		rcode_downref_all( root, prg, allReverseCode );
 }
 
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index f32c178e..8f6f2c26 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -445,7 +445,7 @@ typedef Vector<Tree*> Bindings;
 struct PdaRun
 {
 	PdaRun( Tree **root, Program *prg, PdaTables *tables, 
-			FsmRun *scanner, long stopTarget )
+			FsmRun *scanner, long stopTarget, bool revertOn )
 	:
 		root(root),
 		prg(prg),
@@ -454,7 +454,8 @@ struct PdaRun
 		stopParsing(false),
 		stopTarget(stopTarget),
 		queue(0),
-		queueLast(0)
+		queueLast(0),
+		revertOn(revertOn)
 	{
 	}
 
@@ -506,6 +507,8 @@ struct PdaRun
 	Kid *queue, *queueLast;
 
 	Bindings bindings;
+
+	bool revertOn;
 };
 
 void xml_print_list( RuntimeData *runtimeData, Kid *lel, int depth );
-- 
cgit v1.2.1


From a9e75a2620a9ccd7f19534c251d318d4ffccd72f Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 6 Nov 2008 19:14:17 +0000
Subject: The compile functions should be const. We need to call them more than
 once to compile WV and WC code so they should not be modifying the AST.

Create the object field for the iterator at parse time with all the other field
creations. We need this once we start doing multiple compiles. But still create
the type reference for the iterator variable at compile time since it is
dependent on the iterator call lookup and all call lookups are done at compile
time.

We also need to turn off the unscoping of the iterator variable so we can
support multiple compiles. Eventually we will need a proper scoping solution and
this was just a little hack for one case.
---
 colm/compile.cpp | 133 ++++++++++++++++++++++++-------------------------------
 colm/lmparse.kl  |  12 ++++-
 colm/parsetree.h |  86 ++++++++++++++++++-----------------
 3 files changed, 111 insertions(+), 120 deletions(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index 3e293acb..84f2c3e5 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -299,7 +299,7 @@ void ObjectDef::initField( ParseData *pd, ObjField *field )
 }
 
 UniqueType *LangVarRef::loadFieldInstr( ParseData *pd, CodeVect &code, 
-		ObjectDef *inObject, ObjField *el, bool forWriting, bool revert )
+		ObjectDef *inObject, ObjField *el, bool forWriting, bool revert ) const
 {
 	/* Ensure that the field is referenced. */
 	inObject->referenceField( pd, el );
@@ -350,7 +350,7 @@ ObjectDef *objDefFromUT( ParseData *pd, UniqueType *ut )
 }
 
 void LangVarRef::loadQualification( ParseData *pd, CodeVect &code, 
-		ObjectDef *rootObj, int lastPtrInQual, bool forWriting, bool revert )
+		ObjectDef *rootObj, int lastPtrInQual, bool forWriting, bool revert ) const
 {
 	/* Start the search from the root object. */
 	ObjectDef *searchObjDef = rootObj;
@@ -421,7 +421,7 @@ void LangVarRef::loadQualification( ParseData *pd, CodeVect &code,
 }
 
 void LangVarRef::loadGlobalObj( ParseData *pd, CodeVect &code, 
-		int lastPtrInQual, bool forWriting )
+		int lastPtrInQual, bool forWriting ) const
 {
 	/* Start the search in the global object. */
 	ObjectDef *rootObj = pd->globalObjectDef;
@@ -444,14 +444,14 @@ void LangVarRef::loadGlobalObj( ParseData *pd, CodeVect &code,
 }
 
 void LangVarRef::loadLocalObj( ParseData *pd, CodeVect &code, 
-		int lastPtrInQual, bool forWriting )
+		int lastPtrInQual, bool forWriting ) const
 {
 	/* Start the search in the local frame. */
 	ObjectDef *rootObj = pd->curLocalFrame;
 	loadQualification( pd, code, rootObj, lastPtrInQual, forWriting, false );
 }
 
-bool LangVarRef::isLocalRef( ParseData *pd )
+bool LangVarRef::isLocalRef( ParseData *pd ) const
 {
 	if ( qual->length() > 0 ) {
 		if ( pd->curLocalFrame->objFieldMap->find( qual->data[0].data ) != 0 )
@@ -466,7 +466,7 @@ bool LangVarRef::isLocalRef( ParseData *pd )
 }
 
 void LangVarRef::loadObj( ParseData *pd, CodeVect &code, 
-		int lastPtrInQual, bool forWriting )
+		int lastPtrInQual, bool forWriting ) const
 {
 	if ( isLocalRef( pd ) )
 		loadLocalObj( pd, code, lastPtrInQual, forWriting );
@@ -522,7 +522,7 @@ VarRefLookup LangVarRef::lookupQualification( ParseData *pd, ObjectDef *rootDef
 	return VarRefLookup( lastPtrInQual, firstConstPart, searchObjDef );
 }
 
-VarRefLookup LangVarRef::lookupObj( ParseData *pd )
+VarRefLookup LangVarRef::lookupObj( ParseData *pd ) const
 {
 	ObjectDef *rootDef;
 	if ( isLocalRef( pd ) )
@@ -533,7 +533,7 @@ VarRefLookup LangVarRef::lookupObj( ParseData *pd )
 	return lookupQualification( pd, rootDef );
 }
 
-VarRefLookup LangVarRef::lookupField( ParseData *pd )
+VarRefLookup LangVarRef::lookupField( ParseData *pd ) const
 {
 	/* Lookup the object that the field is in. */
 	VarRefLookup lookup = lookupObj( pd );
@@ -554,7 +554,7 @@ VarRefLookup LangVarRef::lookupField( ParseData *pd )
 	return lookup;
 }
 
-VarRefLookup LangVarRef::lookupMethod( ParseData *pd )
+VarRefLookup LangVarRef::lookupMethod( ParseData *pd ) const
 {
 	/* Lookup the object that the field is in. */
 	VarRefLookup lookup = lookupObj( pd );
@@ -572,7 +572,7 @@ VarRefLookup LangVarRef::lookupMethod( ParseData *pd )
 }
 
 void LangVarRef::setFieldInstr( ParseData *pd, CodeVect &code, 
-		ObjectDef *inObject, ObjField *el, UniqueType *exprUT, bool revert )
+		ObjectDef *inObject, ObjField *el, UniqueType *exprUT, bool revert ) const
 {
 	/* Ensure that the field is referenced. */
 	inObject->referenceField( pd, el );
@@ -620,7 +620,7 @@ bool castAssignment( ParseData *pd, CodeVect &code, UniqueType *destUT,
 }
 
 void LangVarRef::setField( ParseData *pd, CodeVect &code, 
-		ObjectDef *inObject, UniqueType *exprUT, bool revert )
+		ObjectDef *inObject, UniqueType *exprUT, bool revert ) const
 {
 	ObjFieldMapEl *objDefMapEl = inObject->objFieldMap->find( name );
 	if ( objDefMapEl == 0 )
@@ -631,7 +631,7 @@ void LangVarRef::setField( ParseData *pd, CodeVect &code,
 }
 
 void LangVarRef::setFieldIter( ParseData *pd, CodeVect &code, 
-		ObjectDef *inObject, UniqueType *objUT, UniqueType *exprType, bool revert )
+		ObjectDef *inObject, UniqueType *objUT, UniqueType *exprType, bool revert ) const
 {
 	ObjFieldMapEl *objDefMapEl = inObject->objFieldMap->find( name );
 	if ( objDefMapEl == 0 )
@@ -642,7 +642,7 @@ void LangVarRef::setFieldIter( ParseData *pd, CodeVect &code,
 	code.appendHalf( el->offset );
 }
 
-UniqueType *LangVarRef::evaluate( ParseData *pd, CodeVect &code, bool forWriting )
+UniqueType *LangVarRef::evaluate( ParseData *pd, CodeVect &code, bool forWriting ) const
 {
 	/* Lookup the loadObj. */
 	VarRefLookup lookup = lookupField( pd );
@@ -658,7 +658,7 @@ UniqueType *LangVarRef::evaluate( ParseData *pd, CodeVect &code, bool forWriting
 }
 
 /* Return the field referenced. */
-ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code )
+ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code ) const
 {
 	/* Lookup the loadObj. */
 	VarRefLookup lookup = lookupField( pd );
@@ -692,7 +692,7 @@ ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code )
 }
 
 ObjField **LangVarRef::evaluateArgs( ParseData *pd, CodeVect &code, 
-		VarRefLookup &lookup, ExprVect *args )
+		VarRefLookup &lookup, ExprVect *args ) const
 {
 	/* Parameter list is given only for user defined methods. Otherwise it
 	 * will be null. */
@@ -746,7 +746,7 @@ ObjField **LangVarRef::evaluateArgs( ParseData *pd, CodeVect &code,
 	return paramRefs;
 }
 
-void LangVarRef::resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs )
+void LangVarRef::resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs ) const
 {
 	/* Parameter list is given only for user defined methods. Otherwise it
 	 * will be null. */
@@ -757,7 +757,7 @@ void LangVarRef::resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField
 }
 
 
-void LangVarRef::callOperation( ParseData *pd, CodeVect &code, VarRefLookup &lookup )
+void LangVarRef::callOperation( ParseData *pd, CodeVect &code, VarRefLookup &lookup ) const
 {
 	/* This is for writing if it is a non-const builtin. */
 	bool forWriting = lookup.objMethod->func == 0 && 
@@ -782,7 +782,7 @@ void LangVarRef::callOperation( ParseData *pd, CodeVect &code, VarRefLookup &loo
 		code.appendHalf( lookup.objMethod->funcId );
 }
 
-UniqueType *LangVarRef::evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args )
+UniqueType *LangVarRef::evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args ) const
 {
 	/* Evaluate the object. */
 	VarRefLookup lookup = lookupMethod( pd );
@@ -800,7 +800,7 @@ UniqueType *LangVarRef::evaluateCall( ParseData *pd, CodeVect &code, ExprVect *a
 	return lookup.uniqueType;
 }
 
-UniqueType *LangTerm::evaluateMatch( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluateMatch( ParseData *pd, CodeVect &code ) const
 {
 	/* Add the vars bound by the pattern into the local scope. */
 	for ( PatternItemList::Iter item = *pattern->list; item.lte(); item++ ) {
@@ -835,7 +835,7 @@ UniqueType *LangTerm::evaluateMatch( ParseData *pd, CodeVect &code )
 	return ut;
 }
 
-UniqueType *LangTerm::evaluateNew( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluateNew( ParseData *pd, CodeVect &code ) const
 {
 	/* Evaluate the expression. */
 	UniqueType *ut = expr->evaluate( pd, code );
@@ -846,7 +846,7 @@ UniqueType *LangTerm::evaluateNew( ParseData *pd, CodeVect &code )
 	return pd->findUniqueType( TYPE_PTR, ut->langEl );
 }
 
-void LangTerm::assignFieldArgs( ParseData *pd, CodeVect &code, UniqueType *replUT )
+void LangTerm::assignFieldArgs( ParseData *pd, CodeVect &code, UniqueType *replUT ) const
 {
 	/* Now assign the field initializations. Note that we need to do this in
 	 * reverse because the last expression evaluated is at the top of the
@@ -877,7 +877,7 @@ void LangTerm::assignFieldArgs( ParseData *pd, CodeVect &code, UniqueType *replU
 	}
 }
 
-UniqueType *LangTerm::evaluateTreeConstruct( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluateTreeConstruct( ParseData *pd, CodeVect &code ) const
 {
 	/* Evaluate the initialization expressions. */
 	if ( fieldInitArgs != 0 && fieldInitArgs->length() > 0 ) {
@@ -924,7 +924,7 @@ UniqueType *LangTerm::evaluateTreeConstruct( ParseData *pd, CodeVect &code )
 }
 
 
-UniqueType *LangTerm::evaluateTermConstruct( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluateTermConstruct( ParseData *pd, CodeVect &code ) const
 {
 	/* Going to make this replacement directly. Take it out of the list of
 	 * replacements so that we don't try to parse it. */
@@ -951,7 +951,7 @@ UniqueType *LangTerm::evaluateTermConstruct( ParseData *pd, CodeVect &code )
 	return replUT;
 }
 
-bool LangTerm::constructTermFromString( ParseData *pd )
+bool LangTerm::constructTermFromString( ParseData *pd ) const
 {
 	UniqueType *replUT = typeRef->lookupType( pd );
 	if ( replUT->typeId == TYPE_TREE && replUT->langEl->id < pd->firstNonTermId ) {
@@ -967,7 +967,7 @@ bool LangTerm::constructTermFromString( ParseData *pd )
 	return false;
 }
 
-UniqueType *LangTerm::evaluateConstruct( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluateConstruct( ParseData *pd, CodeVect &code ) const
 {
 	/* If the type is a token and the replacement contains just a string then
 	 * construct a token using the text of the string. Otherwise do a normal
@@ -978,7 +978,7 @@ UniqueType *LangTerm::evaluateConstruct( ParseData *pd, CodeVect &code )
 		return evaluateTreeConstruct( pd, code );
 }
 
-UniqueType *LangTerm::evaluateParse( ParseData *pd, CodeVect &code, bool stop )
+UniqueType *LangTerm::evaluateParse( ParseData *pd, CodeVect &code, bool stop ) const
 {
 	UniqueType *ut = typeRef->lookupType( pd );
 	if ( ut->typeId != TYPE_TREE )
@@ -1006,7 +1006,7 @@ UniqueType *LangTerm::evaluateParse( ParseData *pd, CodeVect &code, bool stop )
 	return ut;
 }
 
-UniqueType *LangTerm::evaluate( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluate( ParseData *pd, CodeVect &code ) const
 {
 	switch ( type ) {
 		case VarRefType:
@@ -1084,7 +1084,7 @@ UniqueType *LangTerm::evaluate( ParseData *pd, CodeVect &code )
 	return 0;
 }
 
-UniqueType *LangExpr::evaluate( ParseData *pd, CodeVect &code )
+UniqueType *LangExpr::evaluate( ParseData *pd, CodeVect &code ) const
 {
 	switch ( type ) {
 		case BinaryType: {
@@ -1258,7 +1258,7 @@ UniqueType *LangExpr::evaluate( ParseData *pd, CodeVect &code )
 }
 
 void LangVarRef::assignValue( ParseData *pd, CodeVect &code, 
-		UniqueType *exprUT )
+		UniqueType *exprUT ) const
 {
 	/* Lookup the left hand side of the assignment. */
 	VarRefLookup lookup = lookupField( pd );
@@ -1292,7 +1292,7 @@ void LangVarRef::assignValue( ParseData *pd, CodeVect &code,
 		setField( pd, code, lookup.inObject, exprUT, revert );
 }
 
-UniqueType *LangTerm::evaluateMakeToken( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluateMakeToken( ParseData *pd, CodeVect &code ) const
 {
 //	if ( pd->compileContext != ParseData::CompileTranslation )
 //		error(loc) << "make_token can be used only in a translation block" << endp;
@@ -1320,7 +1320,7 @@ UniqueType *LangTerm::evaluateMakeToken( ParseData *pd, CodeVect &code )
 	return pd->uniqueTypeAny;
 }
 
-UniqueType *LangTerm::evaluateMakeTree( ParseData *pd, CodeVect &code )
+UniqueType *LangTerm::evaluateMakeTree( ParseData *pd, CodeVect &code ) const
 {
 	if ( pd->compileContext != ParseData::CompileTranslation )
 		error(loc) << "make_tree can be used only in a translation block" << endp;
@@ -1345,16 +1345,15 @@ UniqueType *LangTerm::evaluateMakeTree( ParseData *pd, CodeVect &code )
 	return pd->uniqueTypeAny;
 }
 
-void LangStmt::compileForIterBody( ParseData *pd, CodeVect &code, 
-		ObjField *iterObjField, LangVarRef *iterVarRef, 
-		UniqueType *iterUT )
+void LangStmt::compileForIterBody( ParseData *pd, 
+		CodeVect &code, UniqueType *iterUT ) const
 {
 	/* Remember the top of the loop. */
 	long top = code.length();
 
 	/* Advance */
 	code.append( iterUT->iterDef->inAdvance );
-	code.appendHalf( iterObjField->offset );
+	code.appendHalf( objField->offset );
 
 	/* Test: jump past the while block if false. Note that we don't have the
 	 * distance yet. */
@@ -1373,7 +1372,7 @@ void LangStmt::compileForIterBody( ParseData *pd, CodeVect &code,
 
 	/* Add the cleanup for the current loop. */
 	loopCleanup.append( iterUT->iterDef->inDestroy );
-	loopCleanup.appendHalf( iterObjField->offset );
+	loopCleanup.appendHalf( objField->offset );
 
 	/* Push the loop cleanup. */
 	CodeVect *oldLoopCleanup = pd->loopCleanup;
@@ -1403,34 +1402,14 @@ void LangStmt::compileForIterBody( ParseData *pd, CodeVect &code,
 
 	/* Destroy the iterator. */
 	code.append( iterUT->iterDef->inDestroy );
-	code.appendHalf( iterObjField->offset );
-
-	unscopeIterVariable( pd, iterObjField );
-}
-
-ObjField *LangStmt::createIterVariable( ParseData *pd, TypeRef *iterTypeRef )
-{
-	/* Check for redeclaration. */
-	if ( pd->curLocalFrame->objFieldMap->find( name ) != 0 )
-		error(loc) << "variable " << name << " redeclared" << endp;
-
-	/* Create the field and insert it into the field map. */
-	ObjField *iterObjField = new ObjField( loc, iterTypeRef, name );
-	pd->curLocalFrame->objFieldMap->insert( name, iterObjField );
-	pd->curLocalFrame->initField( pd, iterObjField );
-	return iterObjField;
+	code.appendHalf( objField->offset );
 }
 
-void LangStmt::unscopeIterVariable( ParseData *pd, ObjField *iterObjField )
-{
-	pd->curLocalFrame->objFieldMap->detach( name );
-}
-
-LangTerm *LangStmt::chooseDefaultIter( ParseData *pd )
+LangTerm *LangStmt::chooseDefaultIter( ParseData *pd, LangTerm *fromVarRef ) const
 {
 	/* Lookup the lang term and decide what iterator to use based
 	 * on its type. */
-	VarRefLookup lookup = langTerm->varRef->lookupField( pd );
+	VarRefLookup lookup = fromVarRef->varRef->lookupField( pd );
 	
 	if ( lookup.inObject->type != ObjectDef::FrameType )
 		error(loc) << "root of iteration must be a local" << endp;
@@ -1452,7 +1431,7 @@ LangTerm *LangStmt::chooseDefaultIter( ParseData *pd )
 	/* The parameters. */
 	ExprVect *callExprVect = new ExprVect;
 	LangExpr *callExpr = new LangExpr( new LangTerm( 
-			LangTerm::VarRefType, langTerm->varRef ) );
+			LangTerm::VarRefType, fromVarRef->varRef ) );
 	callExprVect->append( callExpr );
 
 	LangTerm *callLangTerm = new LangTerm( callVarRef, callExprVect );
@@ -1460,10 +1439,11 @@ LangTerm *LangStmt::chooseDefaultIter( ParseData *pd )
 	return callLangTerm;
 }
 
-void LangStmt::compileForIter( ParseData *pd, CodeVect &code )
+void LangStmt::compileForIter( ParseData *pd, CodeVect &code ) const
 {
-	if ( langTerm->type != LangTerm::MethodCallType )
-		langTerm = chooseDefaultIter( pd );
+	LangTerm *iterCallTerm = langTerm;
+	if ( iterCallTerm->type != LangTerm::MethodCallType )
+		iterCallTerm = chooseDefaultIter( pd, langTerm );
 
 	/* The type we are searching for. */
 	UniqueType *searchUT = typeRef->lookupType( pd );
@@ -1471,29 +1451,32 @@ void LangStmt::compileForIter( ParseData *pd, CodeVect &code )
 	/* 
 	 * Declare the iterator variable.
 	 */
-	VarRefLookup lookup = langTerm->varRef->lookupMethod( pd );
+	VarRefLookup lookup = iterCallTerm->varRef->lookupMethod( pd );
 	if ( lookup.objMethod->iterDef == 0 ) {
 		error(loc) << "attempt to iterate using something "
 				"that is not an iterator" << endp;
 	}
 
-	/* Type ref and object field for the iterator. */
+	/* Now that we have done the iterator call lookup we can make the type
+	 * reference for the object field. */
 	TypeRef *iterTypeRef = new TypeRef( loc, lookup.objMethod->iterDef, typeRef );
-	ObjField *iterObjField = createIterVariable( pd, iterTypeRef );
+	objField->typeRef = iterTypeRef;
+
+	/* Also force the field to be initialized. */
+	pd->curLocalFrame->initField( pd, objField );
 
 	/* 
 	 * Create the iterator from the local var.
 	 */
 
-	LangVarRef *iterVarRef = new LangVarRef( loc, new QualItemVect, name ); 
 	UniqueType *iterUT = iterTypeRef->lookupType( pd );
 
 	/* Evaluate and push the arguments. */
-	ObjField **paramRefs = langTerm->varRef->evaluateArgs( 
-			pd, code, lookup, langTerm->args );
+	ObjField **paramRefs = iterCallTerm->varRef->evaluateArgs( 
+			pd, code, lookup, iterCallTerm->args );
 
 	code.append( iterUT->iterDef->inCreate );
-	code.appendHalf( iterObjField->offset );
+	code.appendHalf( objField->offset );
 	if ( lookup.objMethod->func != 0 )
 		code.appendHalf( lookup.objMethod->func->funcId );
 
@@ -1504,13 +1487,13 @@ void LangStmt::compileForIter( ParseData *pd, CodeVect &code )
 			code.appendHalf( searchUT->langEl->id );
 	}
 
-	compileForIterBody( pd, code, iterObjField, iterVarRef, iterUT );
+	compileForIterBody( pd, code, iterUT );
 
-	langTerm->varRef->resetActiveRefs( pd, lookup, paramRefs );
+	iterCallTerm->varRef->resetActiveRefs( pd, lookup, paramRefs );
 	delete[] paramRefs;
 }
 
-void LangStmt::compileWhile( ParseData *pd, CodeVect &code )
+void LangStmt::compileWhile( ParseData *pd, CodeVect &code ) const
 {
 	/* Generate code for the while test. Remember the top. */
 	long top = code.length();
@@ -1543,7 +1526,7 @@ void LangStmt::compileWhile( ParseData *pd, CodeVect &code )
 	pd->breakJumps.empty();
 }
 
-void LangStmt::compile( ParseData *pd, CodeVect &code )
+void LangStmt::compile( ParseData *pd, CodeVect &code ) const
 {
 	switch ( type ) {
 		case PrintType: 
@@ -1670,7 +1653,7 @@ void LangStmt::compile( ParseData *pd, CodeVect &code )
 	}
 }
 
-void CodeBlock::compile( ParseData *pd, CodeVect &code )
+void CodeBlock::compile( ParseData *pd, CodeVect &code ) const
 {
 	for ( StmtList::Iter stmt = *stmtList; stmt.lte(); stmt++ )
 		stmt->compile( pd, code );
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 06d19aa0..728bdd76 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -943,8 +943,18 @@ statement: KW_While code_expr block_or_single
 	};
 statement: KW_For TK_Word ':' type_ref KW_In iter_call block_or_single
 	final {
+		/* Check for redeclaration. */
+		if ( pd->curLocalFrame->objFieldMap->find( $2->data ) != 0 )
+			error( $2->loc ) << "variable " << $2->data << " redeclared" << endp;
+
+		/* Note that we pass in a null type reference. This type is dependent
+		 * on the result of the iter_call lookup since it must contain a reference
+		 * to the iterator that is called. This lookup is done at compile time. */
+		ObjField *iterField = new ObjField( $2->loc, (TypeRef*)0, $2->data );
+		pd->curLocalFrame->objFieldMap->insert( $2->data, iterField );
+
 		$$->stmt = new LangStmt( $1->loc, LangStmt::ForIterType, 
-			$2->data, $4->typeRef, $6->langTerm, $7->stmtList );
+				iterField, $4->typeRef, $6->langTerm, $7->stmtList );
 	};
 statement: KW_Return code_expr
 	final {
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 72beac98..ac6043a5 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1317,40 +1317,40 @@ struct LangVarRef
 		: loc(loc), qual(qual), name(name) {}
 
 	UniqueType *loadFieldInstr( ParseData *pd, CodeVect &code, ObjectDef *inObject,
-			ObjField *el, bool forWriting, bool revert );
+			ObjField *el, bool forWriting, bool revert ) const;
 	void setFieldInstr( ParseData *pd, CodeVect &code, ObjectDef *inObject, 
-			ObjField *el, UniqueType *exprUT, bool revert );
+			ObjField *el, UniqueType *exprUT, bool revert ) const;
 
-	VarRefLookup lookupMethod( ParseData *pd );
-	VarRefLookup lookupField( ParseData *pd );
+	VarRefLookup lookupMethod( ParseData *pd ) const;
+	VarRefLookup lookupField( ParseData *pd ) const;
 
 	VarRefLookup lookupQualification( ParseData *pd, ObjectDef *rootDef ) const;
-	VarRefLookup lookupObj( ParseData *pd );
+	VarRefLookup lookupObj( ParseData *pd ) const;
 
-	bool isLocalRef( ParseData *pd );
+	bool isLocalRef( ParseData *pd ) const;
 	void loadQualification( ParseData *pd, CodeVect &code, ObjectDef *rootObj, 
-			int lastPtrInQual, bool forWriting, bool revert );
+			int lastPtrInQual, bool forWriting, bool revert ) const;
 	void loadLocalObj( ParseData *pd, CodeVect &code, 
-			int lastPtrInQual, bool forWriting );
+			int lastPtrInQual, bool forWriting ) const;
 	void loadGlobalObj( ParseData *pd, CodeVect &code, 
-			int lastPtrInQual, bool forWriting );
-	void loadObj( ParseData *pd, CodeVect &code, int lastPtrInQual, bool forWriting );
+			int lastPtrInQual, bool forWriting ) const;
+	void loadObj( ParseData *pd, CodeVect &code, int lastPtrInQual, bool forWriting ) const;
 
 	void setFieldIter( ParseData *pd, CodeVect &code, 
-			ObjectDef *inObject, UniqueType *objUT, UniqueType *exprType, bool revert );
+			ObjectDef *inObject, UniqueType *objUT, UniqueType *exprType, bool revert ) const;
 	void setFieldSearch( ParseData *pd, CodeVect &code, 
-			ObjectDef *inObject, UniqueType *exprType );
+			ObjectDef *inObject, UniqueType *exprType ) const;
 	void setField( ParseData *pd, CodeVect &code, 
-			ObjectDef *inObject, UniqueType *type, bool revert );
+			ObjectDef *inObject, UniqueType *type, bool revert ) const;
 
-	void assignValue( ParseData *pd, CodeVect &code, UniqueType *exprUT );
+	void assignValue( ParseData *pd, CodeVect &code, UniqueType *exprUT ) const;
 	ObjField **evaluateArgs( ParseData *pd, CodeVect &code, 
-			VarRefLookup &lookup, ExprVect *args );
-	void callOperation( ParseData *pd, CodeVect &code, VarRefLookup &lookup );
-	UniqueType *evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args );
-	UniqueType *evaluate( ParseData *pd, CodeVect &code, bool forWriting = false );
-	ObjField *evaluateRef( ParseData *pd, CodeVect &code );
-	void resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs );
+			VarRefLookup &lookup, ExprVect *args ) const;
+	void callOperation( ParseData *pd, CodeVect &code, VarRefLookup &lookup ) const;
+	UniqueType *evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args ) const;
+	UniqueType *evaluate( ParseData *pd, CodeVect &code, bool forWriting = false ) const;
+	ObjField *evaluateRef( ParseData *pd, CodeVect &code ) const;
+	void resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs ) const;
 
 	InputLoc loc;
 	QualItemVect *qual;
@@ -1416,17 +1416,17 @@ struct LangTerm
 	LangTerm( Type type, LangExpr *expr )
 		: type(type), expr(expr) {}
 
-	UniqueType *evaluateParse( ParseData *pd, CodeVect &code, bool stop );
-	UniqueType *evaluateNew( ParseData *pd, CodeVect &code );
-	UniqueType *evaluateConstruct( ParseData *pd, CodeVect &code );
-	UniqueType *evaluateTreeConstruct( ParseData *pd, CodeVect &code );
-	UniqueType *evaluateTermConstruct( ParseData *pd, CodeVect &code );
-	bool constructTermFromString( ParseData *pd );
-	UniqueType *evaluateMatch( ParseData *pd, CodeVect &code );
-	UniqueType *evaluate( ParseData *pd, CodeVect &code );
-	void assignFieldArgs( ParseData *pd, CodeVect &code, UniqueType *replUT );
-	UniqueType *evaluateMakeToken( ParseData *pd, CodeVect &code );
-	UniqueType *evaluateMakeTree( ParseData *pd, CodeVect &code );
+	UniqueType *evaluateParse( ParseData *pd, CodeVect &code, bool stop ) const;
+	UniqueType *evaluateNew( ParseData *pd, CodeVect &code ) const;
+	UniqueType *evaluateConstruct( ParseData *pd, CodeVect &code ) const;
+	UniqueType *evaluateTreeConstruct( ParseData *pd, CodeVect &code ) const;
+	UniqueType *evaluateTermConstruct( ParseData *pd, CodeVect &code ) const;
+	bool constructTermFromString( ParseData *pd ) const;
+	UniqueType *evaluateMatch( ParseData *pd, CodeVect &code ) const;
+	UniqueType *evaluate( ParseData *pd, CodeVect &code ) const;
+	void assignFieldArgs( ParseData *pd, CodeVect &code, UniqueType *replUT ) const;
+	UniqueType *evaluateMakeToken( ParseData *pd, CodeVect &code ) const;
+	UniqueType *evaluateMakeTree( ParseData *pd, CodeVect &code ) const;
 
 	InputLoc loc;
 	Type type;
@@ -1458,7 +1458,7 @@ struct LangExpr
 	LangExpr( LangTerm *term )
 		: type(TermType), term(term) {}
 
-	UniqueType *evaluate( ParseData *pd, CodeVect &code );
+	UniqueType *evaluate( ParseData *pd, CodeVect &code ) const;
 
 	InputLoc loc;
 	Type type;
@@ -1519,22 +1519,20 @@ struct LangStmt
 		type(type), varRef(varRef), expr(0), replacement(replacement), 
 		exprPtrVect(0), next(0) {}
 
-	LangStmt( const InputLoc &loc, Type type, const String &varName, 
+	/* ForIterType */
+	LangStmt( const InputLoc &loc, Type type, ObjField *objField, 
 			TypeRef *typeRef, LangTerm *langTerm, StmtList *stmtList ) : 
-		loc(loc), type(type), langTerm(langTerm), typeRef(typeRef), 
-		stmtList(stmtList), name(varName), next(0) {}
+		loc(loc), type(type), langTerm(langTerm), objField(objField), typeRef(typeRef), 
+		stmtList(stmtList), next(0) {}
 
 	LangStmt( Type type ) : 
 		type(type), next(0) {}
 
-	LangTerm *chooseDefaultIter( ParseData *pd );
-	void compileWhile( ParseData *pd, CodeVect &code );
-	void unscopeIterVariable( ParseData *pd, ObjField *iterObjField );
-	ObjField *createIterVariable( ParseData *pd, TypeRef *iterTypeRef );
-	void compileForIterBody( ParseData *pd, CodeVect &code, 
-			ObjField *iterObjField, LangVarRef *iterVarRef, UniqueType *iterUT );
-	void compileForIter( ParseData *pd, CodeVect &code );
-	void compile( ParseData *pd, CodeVect &code );
+	LangTerm *chooseDefaultIter( ParseData *pd, LangTerm *fromVarRef ) const;
+	void compileWhile( ParseData *pd, CodeVect &code ) const;
+	void compileForIterBody( ParseData *pd, CodeVect &code, UniqueType *iterUT ) const;
+	void compileForIter( ParseData *pd, CodeVect &code ) const;
+	void compile( ParseData *pd, CodeVect &code ) const;
 
 	InputLoc loc;
 	Type type;
@@ -1561,7 +1559,7 @@ struct CodeBlock
 	CodeBlock( StmtList *stmtList ) 
 		: frameId(-1), stmtList(stmtList), localFrame(0) {}
 
-	void compile( ParseData *pd, CodeVect &code );
+	void compile( ParseData *pd, CodeVect &code ) const;
 
 	long frameId;
 	StmtList *stmtList;
-- 
cgit v1.2.1


From c9aed990d4a391c10eb32282ffa88fa6576c25d2 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 6 Nov 2008 22:56:23 +0000
Subject: Stop using AF_IGNORE, a peek into lelInfo is the right way to
 determine if a tree is to be ignored.

---
 colm/bytecode.cpp |  2 --
 colm/bytecode.h   |  3 +--
 colm/fsmrun.cpp   | 10 +++++++---
 3 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index fc4f862b..5f7c4dab 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -100,8 +100,6 @@ void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 		tree->id = prg->rtd->lelInfo[tree->id].termDupId;
 
 	tree->alg->flags |= AF_ARTIFICIAL;
-	if ( ignore )
-		tree->alg->flags |= AF_IGNORE;
 
 	/* FIXME: Do we need to remove the ignore tokens 
 	 * at this point? Will it cause a leak? */
diff --git a/colm/bytecode.h b/colm/bytecode.h
index ad0a7faa..aa5d185d 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -247,8 +247,7 @@ typedef unsigned char uchar;
 #define AF_ARTIFICIAL  0x8
 #define AF_NAMED       0x10
 #define AF_GROUP_MEM   0x20
-#define AF_IGNORE      0x40
-#define AF_HAS_RCODE   0x80
+#define AF_HAS_RCODE   0x40
 
 /*
  * Call stack.
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 993936f6..de85591d 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -326,11 +326,13 @@ void FsmRun::sendBack( Kid *input )
  * generated from a single action. */
 void set_AF_GROUP_MEM( PdaRun *parser )
 {
-	/* Set AF_GROUP_MEM now. */
+	LangElInfo *lelInfo = parser->prg->rtd->lelInfo;
+
 	long sendCount = 0;
 	Kid *queued = parser->queue;
 	while ( queued != 0 ) {
-		if ( !(queued->tree->alg->flags & AF_IGNORE) ) {
+		/* Only bother with non-ignore tokens. */
+		if ( !lelInfo[queued->tree->id].ignore ) {
 			if ( sendCount > 0 )
 				queued->tree->alg->flags |= AF_GROUP_MEM;
 			sendCount += 1;
@@ -387,6 +389,8 @@ void FsmRun::sendEOF( )
 
 void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 {
+	LangElInfo *lelInfo = fsmRun->prg->rtd->lelInfo;
+
 	while ( parser->queue != 0 ) {
 		/* Pull an item to send off the queue. */
 		Kid *send = parser->queue;
@@ -394,7 +398,7 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 
 		/* Must clear next, since the parsing algorithm uses it. */
 		send->next = 0;
-		if ( send->tree->alg->flags & AF_IGNORE ) {
+		if ( lelInfo[send->tree->id].ignore ) {
 			#ifdef COLM_LOG_PARSE
 			cerr << "ignoring queued item: " << 
 					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
-- 
cgit v1.2.1


From 89fbf86288761cf9464aefb78705f8a16cbb967f Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 6 Nov 2008 23:39:24 +0000
Subject: Added the _notoken language element. This ignore token will be sent
 when a generation action doesn't send anything (ignored or real) and there is
 reverse code.

---
 colm/parsedata.h  |  2 +-
 colm/pdabuild.cpp | 13 +++++++++++--
 2 files changed, 12 insertions(+), 3 deletions(-)

diff --git a/colm/parsedata.h b/colm/parsedata.h
index 0793574d..f1808595 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -200,7 +200,6 @@ struct KlangEl : public DListEl<KlangEl>
 
 	GenericType *generic;
 
-
 	long parserId;
 };
 
@@ -778,6 +777,7 @@ struct ParseData
 	KlangEl *streamKlangEl;
 	KlangEl *anyKlangEl;
 	KlangEl *rootKlangEl;
+	KlangEl *noTokenEl;
 	KlangEl *eofKlangEl;
 	KlangEl *errorKlangEl;
 	KlangEl *defaultCharKlangEl;
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index c81fb8e4..98df9af1 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -203,6 +203,17 @@ void ParseData::makeKlangElIds()
 			ptrKlangEl->name, ptrKlangEl );
 	assert( ptrMapEl != 0 );
 
+	/* Make a "_notoken" language element. This element is used when a
+	 * generation action fails to generate anything, but there is reverse code
+	 * that needs to be associated with a language element. This allows us to
+	 * always associate reverse code with the first language element produced
+	 * after a generation action. */
+	noTokenEl = new KlangEl( rootNamespace, strdup("_notoken"), KlangEl::Term );
+	noTokenEl->ignore = true;
+	langEls.prepend( noTokenEl );
+	SymbolMapEl *noTokenMapEl = rootNamespace->symbolMap.insert( noTokenEl->name, noTokenEl );
+	assert( noTokenMapEl != 0 );
+
 	/* Make the EOF language element. */
 	eofKlangEl = new KlangEl( rootNamespace, strdup("_eof"), KlangEl::Term );
 	langEls.prepend( eofKlangEl );
@@ -215,8 +226,6 @@ void ParseData::makeKlangElIds()
 	SymbolMapEl *anyMapEl = rootNamespace->symbolMap.insert( anyKlangEl->name, anyKlangEl );
 	assert( anyMapEl != 0 );
 
-	/* Make a translate token language element. */
-
 	/* Make terminal language elements corresponding to each nonterminal in
 	 * the grammar. */
 	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
-- 
cgit v1.2.1


From 1624689f25b16426d150f65d1f7d47bf9d5629b8 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 7 Nov 2008 16:53:27 +0000
Subject: function movement.

---
 colm/fsmrun.cpp | 63 +++++++++++++++++++++++++++++----------------------------
 1 file changed, 32 insertions(+), 31 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index de85591d..ef45022b 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -341,6 +341,38 @@ void set_AF_GROUP_MEM( PdaRun *parser )
 	}
 }
 
+void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
+{
+	LangElInfo *lelInfo = fsmRun->prg->rtd->lelInfo;
+
+	while ( parser->queue != 0 ) {
+		/* Pull an item to send off the queue. */
+		Kid *send = parser->queue;
+		parser->queue = parser->queue->next;
+
+		/* Must clear next, since the parsing algorithm uses it. */
+		send->next = 0;
+		if ( lelInfo[send->tree->id].ignore ) {
+			#ifdef COLM_LOG_PARSE
+			cerr << "ignoring queued item: " << 
+					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
+			#endif
+			
+			parser->ignore( send->tree );
+			fsmRun->prg->kidPool.free( send );
+		}
+		else {
+			#ifdef COLM_LOG_PARSE
+			cerr << "sending queue item: " << 
+					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
+			#endif
+
+			send_handle_error( fsmRun, parser, send );
+		}
+	}
+}
+
+
 void FsmRun::sendEOF( )
 {
 	#ifdef COLM_LOG_PARSE
@@ -387,37 +419,6 @@ void FsmRun::sendEOF( )
 	cs = tables->entryByRegion[region];
 }
 
-void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
-{
-	LangElInfo *lelInfo = fsmRun->prg->rtd->lelInfo;
-
-	while ( parser->queue != 0 ) {
-		/* Pull an item to send off the queue. */
-		Kid *send = parser->queue;
-		parser->queue = parser->queue->next;
-
-		/* Must clear next, since the parsing algorithm uses it. */
-		send->next = 0;
-		if ( lelInfo[send->tree->id].ignore ) {
-			#ifdef COLM_LOG_PARSE
-			cerr << "ignoring queued item: " << 
-					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
-			#endif
-			
-			parser->ignore( send->tree );
-			fsmRun->prg->kidPool.free( send );
-		}
-		else {
-			#ifdef COLM_LOG_PARSE
-			cerr << "sending queue item: " << 
-					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
-			#endif
-
-			send_handle_error( fsmRun, parser, send );
-		}
-	}
-}
-
 void FsmRun::sendToken( long id )
 {
 	#ifdef COLM_LOG_PARSE
-- 
cgit v1.2.1


From 8e568f07ea6f54fb5e9ad61f264a4f29972fb693 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 7 Nov 2008 20:19:21 +0000
Subject: Reverse code is now transferred to the allReverseCode buffer after
 each execution. This is enabled by adding a no-token if there is reverse code
 but nothing left in the queue after a generation action.

---
 colm/bytecode.cpp   |   4 +-
 colm/fsmrun.cpp     | 159 ++++++++++++++++++++++++++++++----------------------
 colm/parsedata.h    |   2 +-
 colm/pdabuild.cpp   |  32 +++++------
 colm/pdacodegen.cpp |   3 +-
 colm/pdarun.cpp     |   2 +-
 colm/pdarun.h       |   3 +-
 7 files changed, 112 insertions(+), 93 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 5f7c4dab..092ac299 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -376,7 +376,7 @@ void Program::run()
 		cerr << "freeing the root reverse code" << endl;
 		#endif
 
-		bool hasrcode = makeReverseCode( allReverseCode, reverseCode );
+		bool hasrcode = make_reverse_code( allReverseCode, reverseCode );
 		if ( hasrcode )
 			rcode_downref( root, this, allReverseCode->data );
 		delete allReverseCode;
@@ -635,7 +635,7 @@ void Execution::execute( Tree **root )
 	assert( sp == root );
 }
 
-bool makeReverseCode( CodeVect *all, CodeVect &reverseCode )
+bool make_reverse_code( CodeVect *all, CodeVect &reverseCode )
 {
 	/* Do we need to revert the left hand side? */
 
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index ef45022b..82a8d483 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -322,6 +322,27 @@ void FsmRun::sendBack( Kid *input )
 	prg->kidPool.free( input );
 }
 
+/* If no token was generated but there is reverse code then we must generate
+ * a fake token so we can attach the reverse code to it. */
+void add_notoken( Program *prg, PdaRun *parser )
+{
+	/* Check if there was anything generated. */
+	if ( parser->queue == 0 && parser->reverseCode.length() > 0 ) {
+		#ifdef COLM_LOG_PARSE
+		cerr << "found reverse code but no token, sending _notoken" << endl;
+		#endif
+
+		Tree *tree = prg->treePool.allocate();
+		tree->refs = 1;
+		tree->id = prg->rtd->noTokenId;
+		tree->tokdata = 0;
+
+		parser->queue = prg->kidPool.allocate();
+		parser->queue->tree = tree;
+		parser->queue->next = 0;
+	}
+}
+
 /* Sets the AF_GROUP_MEM so the backtracker can tell which tokens were sent
  * generated from a single action. */
 void set_AF_GROUP_MEM( PdaRun *parser )
@@ -372,53 +393,6 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 	}
 }
 
-
-void FsmRun::sendEOF( )
-{
-	#ifdef COLM_LOG_PARSE
-	cerr << "token: _EOF" << endl;
-	#endif
-
-	Kid *input = prg->kidPool.allocate();
-	input->tree = prg->treePool.allocate();
-	input->tree->alg = prg->algPool.allocate();
-
-	input->tree->refs = 1;
-	input->tree->id = parser->tables->gbl->eofId;
-
-	bool ctxDepParsing = prg->ctxDepParsing;
-	long frameId = parser->tables->gbl->regionInfo[region].eofFrameId;
-	if ( ctxDepParsing && frameId >= 0 ) {
-		#ifdef COLM_LOG_PARSE
-		cerr << "HAVE PRE_EOF BLOCK" << endl;
-		#endif
-
-		Code *code = parser->tables->gbl->frameInfo[frameId].codeWV;
-	
-		/* Execute the translation. */
-		Execution execution( prg, parser->reverseCode, 
-				parser, code, 0, 0 );
-		execution.execute( parser->root );
-
-		/* Mark generated tokens as belonging to a group. */
-		set_AF_GROUP_MEM( parser );
-
-		/* Send the generated tokens. */
-		send_queued_tokens( this, parser );
-	}
-
-	parser->send( input );
-
-	if ( parser->errCount > 0 ) {
-		parser->parse_error( parser->tables->gbl->eofId, input->tree ) << 
-				"parse error" << endp;
-	}
-
-	tokstart = 0;
-	region = parser->getNextRegion();
-	cs = tables->entryByRegion[region];
-}
-
 void FsmRun::sendToken( long id )
 {
 	#ifdef COLM_LOG_PARSE
@@ -477,6 +451,30 @@ void FsmRun::sendNamedLangEl()
 	send_handle_error( this, parser, input );
 }
 
+void execute_generation_action( Program *prg, PdaRun *parser, Code *code, Head *tokdata )
+{
+	/* Execute the translation. */
+	Execution execution( prg, parser->reverseCode, parser, code, 0, tokdata );
+	execution.execute( parser->root );
+
+	/* If there is reverse code but nothing generated we need a noToken. */
+	add_notoken( prg, parser );
+
+	/* If there is reverse code then add_notoken will guarantee that the
+	 * queue is not empty. Pull the reverse code out and store in the
+	 * token. */
+	Tree *tree = parser->queue->tree;
+	bool hasrcode = make_reverse_code( parser->allReverseCode, parser->reverseCode );
+	if ( hasrcode ) {
+		if ( tree->alg == 0 )
+			tree->alg = prg->algPool.allocate();
+		tree->alg->flags |= AF_HAS_RCODE;
+	}
+
+	/* Mark generated tokens as belonging to a group. */
+	set_AF_GROUP_MEM( parser );
+}
+
 /* 
  * Not supported:
  *  -invoke failure (the backtracker)
@@ -492,18 +490,13 @@ void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bind
 	/* Find the code. */
 	Code *code = parser->tables->gbl->frameInfo[
 			parser->tables->gbl->lelInfo[id].frameId].codeWV;
-	
-	/* Execute the translation. */
-	Execution execution( prg, parser->reverseCode, 
-			parser, code, 0, tokdata );
-	execution.execute( parser->root );
+
+	/* Execute the action and process the queue. */
+	execute_generation_action( prg, parser, code, tokdata );
 
 	/* Finished with the match text. */
 	string_free( prg, tokdata );
 
-	/* Mark generated tokens as belonging to a group. */
-	set_AF_GROUP_MEM( parser );
-
 	/* Send the queued tokens. */
 	send_queued_tokens( this, parser );
 }
@@ -580,11 +573,6 @@ void PdaRun::send( Kid *input )
 		ignore->next = child;
 	}
 		
-	/* Pull the reverse code out and store in the token. */
-	bool hasrcode = makeReverseCode( allReverseCode, reverseCode );
-	if ( hasrcode )
-		input->tree->alg->flags |= AF_HAS_RCODE;
-
 	parseToken( input );
 }
 
@@ -626,14 +614,6 @@ void PdaRun::ignore( Tree *tree )
 	Kid *ignore = prg->kidPool.allocate();
 	ignore->tree = tree;
 
-	/* Pull the reverse code out and store in the token. */
-	bool hasrcode = makeReverseCode( allReverseCode, reverseCode );
-	if ( hasrcode ) {
-		if ( tree->alg == 0 )
-			tree->alg = prg->algPool.allocate();
-		tree->alg->flags |= AF_HAS_RCODE;
-	}
-
 	/* Prepend it to the list of ignore tokens. */
 	ignore->next = accumIgnore;
 	accumIgnore = ignore;
@@ -706,6 +686,49 @@ Head *FsmRun::extractToken( long length )
 	return tokdata;
 }
 
+void FsmRun::sendEOF( )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "token: _EOF" << endl;
+	#endif
+
+	Kid *input = prg->kidPool.allocate();
+	input->tree = prg->treePool.allocate();
+	input->tree->alg = prg->algPool.allocate();
+
+	input->tree->refs = 1;
+	input->tree->id = parser->tables->gbl->eofId;
+
+	bool ctxDepParsing = prg->ctxDepParsing;
+	long frameId = parser->tables->gbl->regionInfo[region].eofFrameId;
+	if ( ctxDepParsing && frameId >= 0 ) {
+		#ifdef COLM_LOG_PARSE
+		cerr << "HAVE PRE_EOF BLOCK" << endl;
+		#endif
+
+		/* Get the code for the pre-eof block. */
+		Code *code = parser->tables->gbl->frameInfo[frameId].codeWV;
+
+		/* Execute the action and process the queue. */
+		execute_generation_action( prg, parser, code, 0 );
+
+		/* Send the generated tokens. */
+		send_queued_tokens( this, parser );
+	}
+
+	parser->send( input );
+
+	if ( parser->errCount > 0 ) {
+		parser->parse_error( parser->tables->gbl->eofId, input->tree ) << 
+				"parse error" << endp;
+	}
+
+	tokstart = 0;
+	region = parser->getNextRegion();
+	cs = tables->entryByRegion[region];
+}
+
+
 void FsmRun::attachInputStream( InputStream *in )
 {
 	/* Run buffers need to stick around because 
diff --git a/colm/parsedata.h b/colm/parsedata.h
index f1808595..5912e8e6 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -777,7 +777,7 @@ struct ParseData
 	KlangEl *streamKlangEl;
 	KlangEl *anyKlangEl;
 	KlangEl *rootKlangEl;
-	KlangEl *noTokenEl;
+	KlangEl *noTokenKlangEl;
 	KlangEl *eofKlangEl;
 	KlangEl *errorKlangEl;
 	KlangEl *defaultCharKlangEl;
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 98df9af1..c77a74a9 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -208,10 +208,11 @@ void ParseData::makeKlangElIds()
 	 * that needs to be associated with a language element. This allows us to
 	 * always associate reverse code with the first language element produced
 	 * after a generation action. */
-	noTokenEl = new KlangEl( rootNamespace, strdup("_notoken"), KlangEl::Term );
-	noTokenEl->ignore = true;
-	langEls.prepend( noTokenEl );
-	SymbolMapEl *noTokenMapEl = rootNamespace->symbolMap.insert( noTokenEl->name, noTokenEl );
+	noTokenKlangEl = new KlangEl( rootNamespace, strdup("_notoken"), KlangEl::Term );
+	noTokenKlangEl->ignore = true;
+	langEls.prepend( noTokenKlangEl );
+	SymbolMapEl *noTokenMapEl = rootNamespace->symbolMap.insert( 
+			noTokenKlangEl->name, noTokenKlangEl );
 	assert( noTokenMapEl != 0 );
 
 	/* Make the EOF language element. */
@@ -252,27 +253,19 @@ void ParseData::makeKlangElIds()
 	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
 		/* Must be a term, and not any of the special reserved terminals.
 		 * Remember if the non terminal is a user non terminal. */
-		if ( lel->type == KlangEl::Term && lel != eofKlangEl && lel != errorKlangEl ) {
+		if ( lel->type == KlangEl::Term && 
+				lel != eofKlangEl && 
+				lel != errorKlangEl &&
+				lel != noTokenKlangEl )
+		{
 			lel->isUserTerm = true;
 			lel->id = nextSymbolId++;
 		}
 	}
 
-	/* Next assign to the eof token, which we always create. */
+	/* Next assign to the eof and notoken elements, which we always create. */
 	eofKlangEl->id = nextSymbolId++;
-
-	/* First pass assigns to the user terminals. */
-	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
-		if ( lel->id < 0 ) {
-			/* Must be a term, and not any of the special reserved terminals.
-			 * Remember if the non terminal is a user non terminal. */
-			if ( lel->type == KlangEl::Term && lel != eofKlangEl && lel != errorKlangEl ) {
-				assert( false );
-				lel->isUserTerm = true;
-				lel->id = nextSymbolId++;
-			}
-		}
-	}
+	noTokenKlangEl->id = nextSymbolId++;
 
 	/* Possibly assign to the error language element. */
 	if ( errorKlangEl != 0 )
@@ -1385,6 +1378,7 @@ void ParseData::makeRuntimeData()
 	runtimeData->stringId = strKlangEl->id;
 	runtimeData->anyId = anyKlangEl->id;
 	runtimeData->eofId = eofKlangEl->id;
+	runtimeData->noTokenId = noTokenKlangEl->id;
 }
 
 /* Borrow alg->state for mapsTo. */
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 399209a8..8067dc06 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -406,7 +406,8 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 		"	" << runtimeData->integerId << ",\n"
 		"	" << runtimeData->stringId << ",\n"
 		"	" << runtimeData->anyId << ",\n"
-		"	" << runtimeData->eofId << "\n"
+		"	" << runtimeData->eofId << ",\n"
+		"	" << runtimeData->noTokenId << "\n"
 		"};\n"
 		"\n";
 }
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index d058df73..ef22665e 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -427,7 +427,7 @@ again:
 			execution.execute( root );
 
 			/* Pull out the reverse code, if any. */
-			bool hasrcode = makeReverseCode( allReverseCode, reverseCode );
+			bool hasrcode = make_reverse_code( allReverseCode, reverseCode );
 			if ( hasrcode )
 				redAlg->flags |= AF_HAS_RCODE;
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 8f6f2c26..ccb0290a 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -410,6 +410,7 @@ struct RuntimeData
 	long stringId;
 	long anyId;
 	long eofId;
+	long noTokenId;
 };
 
 struct PdaTables
@@ -438,7 +439,7 @@ struct PdaTables
 	RuntimeData *gbl;
 };
 
-bool makeReverseCode( CodeVect *all, CodeVect &reverseCode );
+bool make_reverse_code( CodeVect *all, CodeVect &reverseCode );
 
 typedef Vector<Tree*> Bindings;
 
-- 
cgit v1.2.1


From 8669467abf4ccdbbdcd522467082098725af96c4 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 7 Nov 2008 21:08:38 +0000
Subject: Split the IN_PARSE instruction into _WV and _WC versions instead of
 using a flag. The _WC version should not write the reverse code.

After executing the root code assert reverseCode as empty. The root code should
not be calling any _WC code unless it calls a parse.
---
 colm/bytecode.cpp | 46 +++++++++++++++++++++++++++++++++-------------
 colm/bytecode.h   |  3 ++-
 colm/compile.cpp  | 11 +++++++++--
 3 files changed, 44 insertions(+), 16 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 092ac299..98e7713d 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -115,7 +115,7 @@ void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 	}
 }
 
-Tree *parse( Tree **&sp, Program *prg, Stream *stream, 
+Tree *call_parser( Tree **&sp, Program *prg, Stream *stream, 
 		long parserId, long stopId, CodeVect *&cv, bool revertOn )
 {
 	PdaTables *tables = prg->rtd->parsers[parserId];
@@ -126,8 +126,14 @@ Tree *parse( Tree **&sp, Program *prg, Stream *stream,
 	tree_upref( tree );
 	parser.clean();
 
-	/* Return the reverse code. */
-	cv = parser.allReverseCode;
+	/* Maybe return the reverse code. */
+	if ( revertOn )
+		cv = parser.allReverseCode;
+	else {
+		delete parser.allReverseCode;
+		cv = 0;
+	}
+
 	return tree;
 }
 
@@ -367,7 +373,6 @@ void Program::run()
 
 	if ( rtd->rootCodeLen > 0 ) {
 		CodeVect reverseCode;
-		CodeVect *allReverseCode = new CodeVect;
 		Execution execution( this, reverseCode, 0, rtd->rootCode, 0, 0 );
 		execution.execute( root );
 
@@ -376,10 +381,9 @@ void Program::run()
 		cerr << "freeing the root reverse code" << endl;
 		#endif
 
-		bool hasrcode = make_reverse_code( allReverseCode, reverseCode );
-		if ( hasrcode )
-			rcode_downref( root, this, allReverseCode->data );
-		delete allReverseCode;
+		/* The root code should all be commit code and reverseCode
+		 * should be empty. */
+		assert( reverseCode.length() == 0 );
 	}
 
 	/* Clear */
@@ -1645,21 +1649,19 @@ again:
 			tree_downref( prg, sp, tree );
 			break;
 		}
-		case IN_PARSE: {
+		case IN_PARSE_WV: {
 			Half parserId, stopId;
-			uchar revertOn;
 			read_half( parserId );
 			read_half( stopId );
-			read_byte( revertOn );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PARSE " << parserId << " " << stopId << endl;
+			cerr << "IN_PARSE_WV " << parserId << " " << stopId << endl;
 			#endif
 
 			/* Comes back from parse upreffed. */
 			CodeVect *cv;
 			Tree *stream = pop();
-			Tree *res = parse( sp, prg, (Stream*)stream, parserId, stopId, cv, revertOn );
+			Tree *res = call_parser( sp, prg, (Stream*)stream, parserId, stopId, cv, true );
 			push( res );
 
 			/* Single unit. */
@@ -1672,6 +1674,24 @@ again:
 			reverseCode.append( 15 );
 			break;
 		}
+		case IN_PARSE_WC: {
+			Half parserId, stopId;
+			read_half( parserId );
+			read_half( stopId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_PARSE_WC " << parserId << " " << stopId << endl;
+			#endif
+
+			/* Comes back from parse upreffed. */
+			CodeVect *cv;
+			Tree *stream = pop();
+			Tree *res = call_parser( sp, prg, (Stream*)stream, parserId, stopId, cv, false );
+			push( res );
+
+			tree_downref( prg, sp, (Tree*)stream );
+			break;
+		}
 		case IN_STREAM_PULL: {
 			#ifdef COLM_LOG_BYTECODE
 			cerr << "IN_STREAM_PULL" << endl;
diff --git a/colm/bytecode.h b/colm/bytecode.h
index aa5d185d..cef37666 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -200,7 +200,8 @@ typedef unsigned char uchar;
 #define IN_MAKE_TOKEN            0x96
 #define IN_MAKE_TREE             0xb2
 #define IN_CONSTRUCT_TERM        0x9a
-#define IN_PARSE                 0xb1
+#define IN_PARSE_WV              0xb1
+#define IN_PARSE_WC              0xbe
 #define IN_PARSE_BKT             0xb3
 #define IN_STREAM_PULL           0xb4
 #define IN_STREAM_PULL_BKT       0xb5
diff --git a/colm/compile.cpp b/colm/compile.cpp
index 84f2c3e5..c5a07b2f 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -996,13 +996,20 @@ UniqueType *LangTerm::evaluateParse( ParseData *pd, CodeVect &code, bool stop )
 	 * the type. */
 	ut->langEl->parserId = pd->nextParserId++;
 
-	code.append( IN_PARSE );
+	/* Parse instruction, dependent on whether or not we are
+	 * producing revert or commit code. */
+	if ( pd->revertOn )
+		code.append( IN_PARSE_WV );
+	else
+		code.append( IN_PARSE_WC );
+
+	/* The id of the parser, followed by the stop id. */
 	code.appendHalf( ut->langEl->parserId );
 	if ( stop )
 		code.appendHalf( ut->langEl->id );
 	else 
 		code.appendHalf( 0 );
-	code.append( pd->revertOn );
+
 	return ut;
 }
 
-- 
cgit v1.2.1


From d38cf34e03b6801e58713368e708d25b0a9e79e5 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 7 Nov 2008 23:02:00 +0000
Subject: Removed upref_uiter_args from IN_UITER_CREATE. Seems to be left over
 from a time before reference args and the upreffing of trees as they are
 pushed onto the stack.

---
 colm/bytecode.cpp | 12 ------------
 1 file changed, 12 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 98e7713d..78a95edc 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -198,16 +198,6 @@ void downref_local_trees( Program *prg, Tree **sp, Tree **frame, char *trees, lo
 	}
 }
 
-void upref_uiter_args( Tree **frame, long nargs )
-{
-	for ( long l = IFR_AA; l < IFR_AA + nargs; l++ ) {
-		#ifdef COLM_LOG_BYTECODE
-		cerr << "upref local " << l << endl;
-		#endif
-		tree_upref( local(l) );
-	}
-}
-
 UserIter *uiter_create( Tree **&sp, Program *prg, FunctionInfo *fi, long searchId )
 {
 	pushn( sizeof(UserIter) / sizeof(Word) );
@@ -2697,8 +2687,6 @@ again:
 			uiter->stackSize = uiter->stackRoot - ptop();
 			uiter->resume = prg->rtd->frameInfo[fi->frameId].codeWV;
 			uiter->frame = &uiter->stackRoot[-IFR_AA];
-
-			upref_uiter_args( frame, fi->argSize );
 			break;
 		}
 		case IN_UITER_DESTROY: {
-- 
cgit v1.2.1


From ef7a4e1818ac2e0d80bb3beb8cd80ab51a98548e Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 8 Nov 2008 00:36:14 +0000
Subject: User iterator calls now distinguish between _WV and _WC code.

---
 colm/bytecode.cpp | 52 +++++++++++++++++++++++++++++++++++++++++++++-------
 colm/bytecode.h   |  3 ++-
 colm/compile.cpp  | 49 ++++++++++++++++++++++++++++++++++---------------
 colm/parsedata.h  |  1 +
 colm/parsetree.h  |  3 ++-
 5 files changed, 84 insertions(+), 24 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 78a95edc..b8dfdbe2 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -207,6 +207,20 @@ UserIter *uiter_create( Tree **&sp, Program *prg, FunctionInfo *fi, long searchI
 	return uiter;
 }
 
+void uiter_init( Program *prg, Tree **sp, UserIter *uiter, 
+		FunctionInfo *fi, bool revertOn )
+{
+	/* Set up the first yeild so when we resume it starts at the beginning. */
+	uiter->ref.kid = 0;
+	uiter->stackSize = uiter->stackRoot - ptop();
+	uiter->frame = &uiter->stackRoot[-IFR_AA];
+
+	if ( revertOn )
+		uiter->resume = prg->rtd->frameInfo[fi->frameId].codeWV;
+	else
+		uiter->resume = prg->rtd->frameInfo[fi->frameId].codeWC;
+}
+
 void tree_iter_destroy( Tree **&sp, TreeIter *iter )
 {
 	long curStackSize = iter->stackRoot - ptop();
@@ -2657,7 +2671,35 @@ again:
 			}
 			break;
 		}
-		case IN_UITER_CREATE: {
+		case IN_UITER_CREATE_WV: {
+			short field;
+			Half funcId, searchId;
+			read_half( field );
+			read_half( funcId );
+			read_half( searchId );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_UITER_CREATE_WV " << field << " " << 
+					funcId << " " << searchId << endl;
+			#endif
+
+			FunctionInfo *fi = prg->rtd->functionInfo + funcId;
+			UserIter *uiter = uiter_create( sp, prg, fi, searchId );
+			local(field) = (SW) uiter;
+
+			/* This is a setup similar to as a call, only the frame structure
+			 * is slightly different for user iterators. We aren't going to do
+			 * the call. We don't need to set up the return ip because the
+			 * uiter advance will set it. The frame we need to do because it
+			 * is set once for the lifetime of the iterator. */
+			push( 0 );            /* Return instruction pointer,  */
+			push( (SW)iframe ); /* Return iframe. */
+			push( (SW)frame );  /* Return frame. */
+
+			uiter_init( prg, sp, uiter, fi, true );
+			break;
+		}
+		case IN_UITER_CREATE_WC: {
 			short field;
 			Half funcId, searchId;
 			read_half( field );
@@ -2665,7 +2707,7 @@ again:
 			read_half( searchId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_CREATE " << field << " " << 
+			cerr << "IN_UITER_CREATE_WC " << field << " " << 
 					funcId << " " << searchId << endl;
 			#endif
 
@@ -2682,11 +2724,7 @@ again:
 			push( (SW)iframe ); /* Return iframe. */
 			push( (SW)frame );  /* Return frame. */
 
-			/* Now set up the first yeild. */
-			uiter->ref.kid = 0;
-			uiter->stackSize = uiter->stackRoot - ptop();
-			uiter->resume = prg->rtd->frameInfo[fi->frameId].codeWV;
-			uiter->frame = &uiter->stackRoot[-IFR_AA];
+			uiter_init( prg, sp, uiter, fi, false );
 			break;
 		}
 		case IN_UITER_DESTROY: {
diff --git a/colm/bytecode.h b/colm/bytecode.h
index cef37666..38358c59 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -117,7 +117,8 @@ typedef unsigned char uchar;
 #define IN_TRITER_DESTROY        0x41
 
 #define IN_UITER_DESTROY         0x52
-#define IN_UITER_CREATE          0x53
+#define IN_UITER_CREATE_WV       0x53
+#define IN_UITER_CREATE_WC       0xbf
 #define IN_UITER_ADVANCE         0x54
 #define IN_UITER_GET_CUR_R       0x55
 #define IN_UITER_GET_CUR_WC      0x56
diff --git a/colm/compile.cpp b/colm/compile.cpp
index c5a07b2f..269b73ba 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -54,7 +54,8 @@ IterDef::IterDef( Type type ) :
 	useSearchUT(false)
 {
 	if ( type == Tree ) {
-		inCreate = IN_TRITER_FROM_REF;
+		inCreateWV = IN_TRITER_FROM_REF;
+		inCreateWC = IN_TRITER_FROM_REF;
 		inDestroy = IN_TRITER_DESTROY;
 		inAdvance = IN_TRITER_ADVANCE;
 
@@ -65,7 +66,8 @@ IterDef::IterDef( Type type ) :
 		useSearchUT = true;
 	}
 	else if ( type == Child ) {
-		inCreate = IN_TRITER_FROM_REF;
+		inCreateWV = IN_TRITER_FROM_REF;
+		inCreateWC = IN_TRITER_FROM_REF;
 		inDestroy = IN_TRITER_DESTROY;
 		inAdvance = IN_TRITER_NEXT_CHILD;
 
@@ -76,7 +78,8 @@ IterDef::IterDef( Type type ) :
 		useSearchUT = true;
 	}
 	else if ( type == RevChild ) {
-		inCreate = IN_TRITER_FROM_REF;
+		inCreateWV = IN_TRITER_FROM_REF;
+		inCreateWC = IN_TRITER_FROM_REF;
 		inDestroy = IN_TRITER_DESTROY;
 		inAdvance = IN_TRITER_PREV_CHILD;
 
@@ -95,7 +98,8 @@ IterDef::IterDef( Type type, Function *func ) :
 	func(func),
 	useFuncId(true),
 	useSearchUT(true),
-	inCreate(IN_UITER_CREATE),
+	inCreateWV(IN_UITER_CREATE_WV),
+	inCreateWC(IN_UITER_CREATE_WC),
 	inDestroy(IN_UITER_DESTROY),
 	inAdvance(IN_UITER_ADVANCE),
 	inGetCurR(IN_UITER_GET_CUR_R),
@@ -1482,7 +1486,11 @@ void LangStmt::compileForIter( ParseData *pd, CodeVect &code ) const
 	ObjField **paramRefs = iterCallTerm->varRef->evaluateArgs( 
 			pd, code, lookup, iterCallTerm->args );
 
-	code.append( iterUT->iterDef->inCreate );
+	if ( pd->revertOn )
+		code.append( iterUT->iterDef->inCreateWV );
+	else
+		code.append( iterUT->iterDef->inCreateWC );
+
 	code.appendHalf( objField->offset );
 	if ( lookup.objMethod->func != 0 )
 		code.appendHalf( lookup.objMethod->func->funcId );
@@ -2280,19 +2288,10 @@ void ParseData::makeFuncVisible( Function *func, bool isUserIter )
 	globalObjectDef->objMethodMap->insert( func->name, objMethod );
 }
 
-void ParseData::compileUserIter( Function *func )
+void ParseData::compileUserIter( Function *func, CodeVect &code )
 {
 	CodeBlock *block = func->codeBlock;
 
-	compileContext = CompileFunction;
-	curFunction = func;
-	revertOn = true;
-	block->frameId = nextFrameId++;
-
-	makeFuncVisible( func, true );
-
-	CodeVect &code = block->codeWV;
-
 	/* Add the alloc frame opcode. We don't have the right 
 	 * frame size yet. We will fill it in later. */
 	code.append( IN_INIT_LOCALS );
@@ -2313,6 +2312,26 @@ void ParseData::compileUserIter( Function *func )
 		code.append( IN_LOAD_NIL );
 		code.append( IN_YIELD );
 	}
+}
+
+void ParseData::compileUserIter( Function *func )
+{
+	CodeBlock *block = func->codeBlock;
+
+	/* Set up the context. */
+	compileContext = CompileFunction;
+	curFunction = func;
+	block->frameId = nextFrameId++;
+
+	/* Process the params, etc. */
+	makeFuncVisible( func, true );
+
+	/* Compile for revert and commit. */
+	revertOn = true;
+	compileUserIter( func, block->codeWV );
+
+	revertOn = false;
+	compileUserIter( func, block->codeWC );
 
 	/* Now that compilation is done variables are referenced. Make the local
 	 * trees descriptor. */
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 5912e8e6..4d6cce79 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -728,6 +728,7 @@ struct ParseData
 	void compileFunction( Function *func, CodeVect &code );
 	void compileFunction( Function *func );
 
+	void compileUserIter( Function *func, CodeVect &code );
 	void compileUserIter( Function *func );
 	void compilePreEof( TokenRegion *region );
 	void compileRootBlock();
diff --git a/colm/parsetree.h b/colm/parsetree.h
index ac6043a5..b25a691c 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1015,7 +1015,8 @@ struct IterDef
 	bool useFuncId;
 	bool useSearchUT;
 
-	Code inCreate;
+	Code inCreateWV;
+	Code inCreateWC;
 	Code inDestroy;
 	Code inAdvance;
 
-- 
cgit v1.2.1


From 3ba29973c2e9c97072d0733c5eb3bf543a1f85ce Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 8 Nov 2008 19:07:15 +0000
Subject: A global commit with revertOn cannot clear the parsed fields from
 Alg. Shown by commitbt.lm test.

---
 colm/pdarun.cpp  |  21 ++++++++++-
 test/commitbt.in |   1 +
 test/commitbt.lm | 110 +++++++++++++++++++++++++++++++++++++++++++++++++++++++
 3 files changed, 130 insertions(+), 2 deletions(-)
 create mode 100644 test/commitbt.in
 create mode 100644 test/commitbt.lm

diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index ef22665e..43618025 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -102,6 +102,20 @@ long PdaRun::stackTopTarget()
 	return state;
 }
 
+/*
+ * Local commit:
+ * 		-clears reparse flags underneath
+ * 		-must be possible to backtrack after
+ * Global commit (revertOn)
+ * 		-clears all reparse flags
+ * 		-must be possible to backtrack after
+ * Global commit (!revertOn)
+ * 		-clears all reparse flags
+ * 		-clears all 'parsed' reverse code
+ * 		-clears all reverse code
+ * 		-clears all alg structures
+ */
+
 bool beenCommitted( Kid *kid )
 {
 	return kid->tree->alg->flags & AF_COMMITTED;
@@ -204,7 +218,7 @@ head:
 
 	/* Commit */
 	#ifdef COLM_LOG_PARSE
-	cerr << "rev free visiting: " << 
+	cerr << "parsed_downref_kid visiting: " << 
 			prg->rtd->lelInfo[lel->tree->id].name << endl;
 	#endif
 
@@ -251,7 +265,10 @@ void PdaRun::commit()
 	while ( topLevel > 0 ) {
 		kid = (Kid*)vm_pop();
 		commitKid( sp, kid );
-		parsed_downref_kid( sp, prg, kid );
+
+		/* Can't do this here. See commitbt.lm. */
+		/* parsed_downref_kid( sp, prg, kid ); */
+
 		topLevel -= 1;
 	}
 
diff --git a/test/commitbt.in b/test/commitbt.in
new file mode 100644
index 00000000..24a7dece
--- /dev/null
+++ b/test/commitbt.in
@@ -0,0 +1 @@
+1 2 3 *
\ No newline at end of file
diff --git a/test/commitbt.lm b/test/commitbt.lm
new file mode 100644
index 00000000..75172b4b
--- /dev/null
+++ b/test/commitbt.lm
@@ -0,0 +1,110 @@
+#
+# Local commit:
+# 		-clears reparse flags underneath
+# 		-must be possible to backtrack after
+# Global commit (revertOn)
+# 		-clears all reparse flags
+# 		-must be possible to backtrack after
+# Global commit (!revertOn)
+# 		-clears all reparse flags
+# 		-clears all 'parsed' reverse code
+# 		-clears all reverse code
+# 		-clears all alg structures
+#
+
+# This test shows that a global commit with revertOn cannot clear 'parsed'
+# items because it must entertain the possibility of backtracking.
+
+lex start
+{
+	ignore /[\t\n ]+/
+	literal '^', '|', '-', ',', ':', '!', '?', '.'
+	literal '(', ')', '{', '}', '*', '&', '+'
+
+	literal '--', ':>', ':>>', '<:', '->', '**'
+
+	token word /[a-zA-Z_][a-zA-Z0-9_]*/
+	token uint /[0-9]+/
+}
+
+
+def expression [term expression_op*]
+
+def expression_op
+	['|' term]
+|	['&' term]
+|	['-' term]
+|	['--' term]
+
+def term [factor_rep term_rest]
+
+# This list is done manually to get shortest match.
+def term_rest
+	[]
+|	[term_op term_rest]
+
+def term_op
+	[factor_rep]
+|	['.' factor_rep]
+|	[':>' factor_rep]
+|	[':>>' factor_rep]
+|	['<:' factor_rep]
+
+def factor_rep 
+	[factor_neg factor_rep_op*]
+
+def factor_rep_op
+	['*']
+|	['**']
+|	['?']
+|	['+']
+|	['{' factor_rep_num '}']
+|	['{' ',' factor_rep_num '}']
+|	['{' factor_rep_num ',' '}']
+|	['{' factor_rep_num ',' factor_rep_num '}']
+
+def factor_rep_num [uint]
+
+def factor_neg 
+	['!' factor_neg]
+|	['^' factor_neg]
+|	[factor]
+
+def factor 
+	[alphabet_num]
+|	[word]
+|	['(' expression ')']
+
+def alphabet_num 
+	[uint]
+
+global int i
+
+def suint
+	int i
+	[uint]
+	{
+		lhs.i = 0
+		i = 1
+		lhs = construct suint "1"
+	}
+
+def sub
+	[suint* '*']
+
+token item
+	sub S
+	/[0-9]+/
+	{
+		str M = pull(stdin, match_length)
+		sub S = parse sub(stdin)
+		send( make_token( typeid item, M, S ) )
+	}
+
+def stuff
+	[item* '!']
+|	[sub]
+
+stuff S = parse stuff(stdin)
+
+print_xml( S )
-- 
cgit v1.2.1


From e1ba7adb9e25c9b6c28d1b4159724b0afcb68c24 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 8 Nov 2008 22:17:23 +0000
Subject: Now downreffing all 'parsed' trees on a full commit only when revert
 is not on.

Some conversion to C functions.
---
 colm/bytecode.cpp | 12 ++++----
 colm/bytecode.h   |  8 +++--
 colm/pdarun.cpp   | 90 ++++++++++++++++++++++++++++++++++---------------------
 3 files changed, 67 insertions(+), 43 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index b8dfdbe2..7636160f 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -121,7 +121,7 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 	PdaTables *tables = prg->rtd->parsers[parserId];
 	PdaRun parser( sp, prg, tables, stream->scanner, stopId, revertOn );
 	parser.run();
-	parser.commit();
+	full_commit( &parser );
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
 	tree_upref( tree );
 	parser.clean();
@@ -412,7 +412,7 @@ Execution::Execution( Program *prg, CodeVect &reverseCode,
 	}
 }
 
-void rcode_downref_all( Tree **sp, Program *prg, CodeVect *rev )
+void rcode_downref_all( Program *prg, Tree **sp, CodeVect *rev )
 {
 	while ( rev->length() > 0 ) {
 		/* Read the length */
@@ -425,14 +425,14 @@ void rcode_downref_all( Tree **sp, Program *prg, CodeVect *rev )
 		prcode = rev->data + start;
 
 		/* Execute it. */
-		rcode_downref( sp, prg, prcode );
+		rcode_downref( prg, sp, prcode );
 
 		/* Backup over it. */
 		rev->tabLen -= len + 4;
 	}
 }
 
-void rcode_downref( Tree **sp, Program *prg, Code *instr )
+void rcode_downref( Program *prg, Tree **sp, Code *instr )
 {
 again:
 	switch ( *instr++ ) {
@@ -449,8 +449,8 @@ again:
 			cerr << "IN_PARSE_BKT " << parserId << endl;
 			#endif
 
-			parsed_downref( sp, prg, tree );
-			rcode_downref_all( sp, prg, (CodeVect*)wrev );
+			parsed_downref( prg, sp, tree );
+			rcode_downref_all( prg, sp, (CodeVect*)wrev );
 			tree_downref( prg, sp, stream );
 			tree_downref( prg, sp, tree );
 			delete (CodeVect*)wrev;
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 38358c59..3e45a79a 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -418,9 +418,11 @@ Word cmp_string( Head *s1, Head *s2 );
 
 Head *int_to_str( Program *prg, Word i );
 
-void rcode_downref( Tree **stack_root, Program *prg, Code *instr );
-void rcode_downref_all( Tree **stack_root, Program *prg, CodeVect *cv );
-void parsed_downref( Tree **root, Program *prg, Tree *tree );
+void rcode_downref( Program *prg, Tree **stack_root, Code *instr );
+void rcode_downref_all( Program *prg, Tree **stack_root, CodeVect *cv );
+void parsed_downref( Program *prg, Tree **root, Tree *tree );
+void parsed_downref_all( PdaRun *parser );
+void full_commit( PdaRun *parser );
 
 bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool checkNext );
 Head *make_literal( Program *prg, long litoffset );
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 43618025..8fbeba97 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -116,20 +116,15 @@ long PdaRun::stackTopTarget()
  * 		-clears all alg structures
  */
 
-bool beenCommitted( Kid *kid )
+bool been_committed( Kid *kid )
 {
 	return kid->tree->alg->flags & AF_COMMITTED;
 }
 
-bool beenFreed( Kid *kid )
-{
-	return kid->tree->alg->flags & AF_REV_FREED;
-}
-
 /* The top level of the stack is linked right-to-left. Trees underneath are
  * left to right natural order. */
 
-void PdaRun::commitKid( Tree **root, Kid *lel )
+void commit_kid( PdaRun *parser, Tree **root, Kid *lel )
 {
 	Alg *alg = 0;
 	Tree *tree = 0;
@@ -145,10 +140,10 @@ head:
 	/* Recurse only on non-generated trees. */
 	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
 		vm_push( (Tree*)lel );
-		lel = tree_child( prg, tree );
+		lel = tree_child( parser->prg, tree );
 
 		while ( lel != 0 ) {
-			if ( !beenCommitted( lel ) )
+			if ( !been_committed( lel ) )
 				goto head;
 
 			upwards:
@@ -161,18 +156,18 @@ head:
 	/* Commit */
 	#ifdef COLM_LOG_PARSE
 	cerr << "commit visiting: " << 
-			prg->rtd->lelInfo[lel->tree->id].name << endl;
+			parser->prg->rtd->lelInfo[lel->tree->id].name << endl;
 	#endif
 
 	alg = lel->tree->alg;
 
 	/* Reset retries. */
 	if ( alg->retry_lower > 0 ) {
-		numRetry -= 1;
+		parser->numRetry -= 1;
 		alg->retry_lower = 0;
 	}
 	if ( alg->retry_upper > 0 ) {
-		numRetry -= 1;
+		parser->numRetry -= 1;
 		alg->retry_upper = 0;
 	}
 	alg->flags |= AF_COMMITTED;
@@ -180,10 +175,47 @@ head:
 	if ( sp != root )
 		goto upwards;
 
-	numRetry = 0;
+	parser->numRetry = 0;
 	assert( sp == root );
 }
 
+void full_commit( PdaRun *parser )
+{
+	#ifdef COLM_LOG_PARSE
+	cerr << "running full commit" << endl;
+	#endif
+	
+	Tree **sp = parser->root;
+	Kid *kid = parser->stackTop;
+	long topLevel = 0;
+	while ( kid != 0 && !been_committed( kid ) ) {
+		vm_push( (Tree*)kid );
+		kid = kid->next;
+		topLevel += 1;
+	}
+
+	while ( topLevel > 0 ) {
+		kid = (Kid*)vm_pop();
+		commit_kid( parser, sp, kid );
+		topLevel -= 1;
+	}
+
+	/* After running the commit the the stack should be where it 
+	 * was when we started. */
+	assert( sp == parser->root );
+
+	/* We cannot always clear all the rcode here. We may need to backup over
+	 * the parse statement. We depend on the context flag. */
+	if ( !parser->revertOn ) {
+		parsed_downref_all( parser );
+		rcode_downref_all( parser->prg, parser->root, parser->allReverseCode );
+	}
+}
+
+bool been_freed( Kid *kid )
+{
+	return kid->tree->alg->flags & AF_REV_FREED;
+}
 
 /* The top level of the stack is linked right-to-left. Trees underneath are
  * left to right natural order. */
@@ -206,7 +238,7 @@ head:
 		lel = tree_child( prg, tree );
 
 		while ( lel != 0 ) {
-			if ( !beenFreed( lel ) )
+			if ( !been_freed( lel ) )
 				goto head;
 
 			upwards:
@@ -235,7 +267,7 @@ head:
 	assert( sp == root );
 }
 
-void parsed_downref( Tree **root, Program *prg, Tree *tree )
+void parsed_downref( Program *prg, Tree **root, Tree *tree )
 {
 	#ifdef COLM_LOG_PARSE
 	cerr << "running parsed_downref on tree" << endl;
@@ -247,16 +279,16 @@ void parsed_downref( Tree **root, Program *prg, Tree *tree )
 	parsed_downref_kid( root, prg, &kid );
 }
 
-void PdaRun::commit()
+void parsed_downref_all( PdaRun *parser )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "running full commit" << endl;
+	cerr << "running full parsed_downref" << endl;
 	#endif
 	
-	Tree **sp = root;
-	Kid *kid = stackTop;
+	Tree **sp = parser->root;
+	Kid *kid = parser->stackTop;
 	long topLevel = 0;
-	while ( kid != 0 && !beenCommitted( kid ) ) {
+	while ( kid != 0 && !been_freed( kid ) ) {
 		vm_push( (Tree*)kid );
 		kid = kid->next;
 		topLevel += 1;
@@ -264,25 +296,15 @@ void PdaRun::commit()
 
 	while ( topLevel > 0 ) {
 		kid = (Kid*)vm_pop();
-		commitKid( sp, kid );
-
-		/* Can't do this here. See commitbt.lm. */
-		/* parsed_downref_kid( sp, prg, kid ); */
-
+		parsed_downref_kid( sp, parser->prg, kid );
 		topLevel -= 1;
 	}
 
-	/* Affter running the commit the the stack should be where it 
+	/* After running the commit the the stack should be where it 
 	 * was when we started. */
-	assert( sp == root );
-
-	/* We cannot always clear all the rcode here. We may need to backup over
-	 * the parse statement. We depend on the context flag. */
-	if ( !revertOn )
-		rcode_downref_all( root, prg, allReverseCode );
+	assert( sp == parser->root );
 }
 
-
 /*
  * shift:         retry goes into lower of shifted node.
  * reduce:        retry goes into upper of reduced node.
@@ -362,7 +384,7 @@ again:
 	}
 
 	if ( tables->commitLen[pos] != 0 )
-		commit();
+		full_commit( this );
 
 	if ( *action & act_rb ) {
 		int objectLength, reduction = *action >> 2;
-- 
cgit v1.2.1


From fac60a6b6e1cc360d9aaa04e53c9f37cb927f3bf Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 8 Nov 2008 23:27:26 +0000
Subject: Name change: gbl -> rtd.

---
 colm/fsmrun.cpp   | 46 +++++++++++++++++++++++-----------------------
 colm/pdabuild.cpp |  2 +-
 colm/pdarun.cpp   | 34 +++++++++++++++++-----------------
 colm/pdarun.h     |  2 +-
 4 files changed, 42 insertions(+), 42 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 82a8d483..8c6b3aed 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -193,7 +193,7 @@ void FsmRun::queueBack( Kid *input )
 
 	if ( alg->flags & AF_GROUP_MEM ) {
 		#ifdef COLM_LOG_PARSE
-		LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
 		cerr << "queuing back: " << lelInfo[input->tree->id].name << endl;
 		#endif
 
@@ -237,7 +237,7 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 	/* Ignore tokens are queued in reverse order. */
 	while ( tree_is_ignore( prg, ignore ) ) {
 		#ifdef COLM_LOG_PARSE
-		LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
 		cerr << "sending back: " << lelInfo[ignore->tree->id].name;
 		if ( ignore->tree->alg != 0 && ignore->tree->alg->flags & AF_ARTIFICIAL )
 			cerr << " (artificial)";
@@ -269,7 +269,7 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 void FsmRun::sendBack( Kid *input )
 {
 	#ifdef COLM_LOG_PARSE
-	LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
 	cerr << "sending back: " << lelInfo[input->tree->id].name;
 	if ( input->tree->alg->flags & AF_ARTIFICIAL )
 		cerr << " (artificial)";
@@ -307,7 +307,7 @@ void FsmRun::sendBack( Kid *input )
 	sendBackIgnore( tree_ignore( prg, input->tree ) );
 
 	/* If eof was just sent back remember that it needs to be sent again. */
-	if ( input->tree->id == parser->tables->gbl->eofId )
+	if ( input->tree->id == parser->tables->rtd->eofId )
 		eofSent = false;
 
 	/* If the item is bound then store remove it from the bindings array. */
@@ -376,7 +376,7 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 		if ( lelInfo[send->tree->id].ignore ) {
 			#ifdef COLM_LOG_PARSE
 			cerr << "ignoring queued item: " << 
-					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
+					parser->tables->rtd->lelInfo[send->tree->id].name << endl;
 			#endif
 			
 			parser->ignore( send->tree );
@@ -385,7 +385,7 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 		else {
 			#ifdef COLM_LOG_PARSE
 			cerr << "sending queue item: " << 
-					parser->tables->gbl->lelInfo[send->tree->id].name << endl;
+					parser->tables->rtd->lelInfo[send->tree->id].name << endl;
 			#endif
 
 			send_handle_error( fsmRun, parser, send );
@@ -396,11 +396,11 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 void FsmRun::sendToken( long id )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "token: " << parser->tables->gbl->lelInfo[id].name << endl;
+	cerr << "token: " << parser->tables->rtd->lelInfo[id].name << endl;
 	#endif
 
 	bool ctxDepParsing = prg->ctxDepParsing;
-	LangElInfo *lelInfo = parser->tables->gbl->lelInfo;
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
 
 	/* Make the token data. */
 	long length = p-tokstart;
@@ -439,7 +439,7 @@ void FsmRun::sendNamedLangEl()
 		klangEl = klangEl->termDup;
 	
 	#ifdef COLM_LOG_PARSE
-	cerr << "named langEl: " << parser->tables->gbl->lelInfo[klangEl->id].name << endl;
+	cerr << "named langEl: " << parser->tables->rtd->lelInfo[klangEl->id].name << endl;
 	#endif
 
 	/* Copy the token data. */
@@ -484,12 +484,12 @@ void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bind
 {
 	#ifdef COLM_LOG_PARSE
 	cerr << "generation action: " << 
-			parser->tables->gbl->lelInfo[id].name << endl;
+			parser->tables->rtd->lelInfo[id].name << endl;
 	#endif
 
 	/* Find the code. */
-	Code *code = parser->tables->gbl->frameInfo[
-			parser->tables->gbl->lelInfo[id].frameId].codeWV;
+	Code *code = parser->tables->rtd->frameInfo[
+			parser->tables->rtd->lelInfo[id].frameId].codeWV;
 
 	/* Execute the action and process the queue. */
 	execute_generation_action( prg, parser, code, tokdata );
@@ -504,7 +504,7 @@ void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bind
 Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 {
 	/* Make the token object. */
-	long objectLength = parser->tables->gbl->lelInfo[id].objectLength;
+	long objectLength = parser->tables->rtd->lelInfo[id].objectLength;
 	Kid *attrs = alloc_attrs( prg, objectLength );
 
 	Kid *input = 0;
@@ -604,7 +604,7 @@ void send_handle_error( FsmRun *fsmRun, PdaRun *parser, Kid *input )
 
 	#ifdef COLM_LOG_PARSE
 	cerr << "new token region: " << 
-			parser->tables->gbl->regionInfo[fsmRun->region].name << endl;
+			parser->tables->rtd->regionInfo[fsmRun->region].name << endl;
 	#endif
 }
 
@@ -622,7 +622,7 @@ void PdaRun::ignore( Tree *tree )
 void FsmRun::sendIgnore( long id )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "ignoring: " << parser->tables->gbl->lelInfo[id].name << endl;
+	cerr << "ignoring: " << parser->tables->rtd->lelInfo[id].name << endl;
 	#endif
 
 	/* Make the ignore string. */
@@ -697,17 +697,17 @@ void FsmRun::sendEOF( )
 	input->tree->alg = prg->algPool.allocate();
 
 	input->tree->refs = 1;
-	input->tree->id = parser->tables->gbl->eofId;
+	input->tree->id = parser->tables->rtd->eofId;
 
 	bool ctxDepParsing = prg->ctxDepParsing;
-	long frameId = parser->tables->gbl->regionInfo[region].eofFrameId;
+	long frameId = parser->tables->rtd->regionInfo[region].eofFrameId;
 	if ( ctxDepParsing && frameId >= 0 ) {
 		#ifdef COLM_LOG_PARSE
 		cerr << "HAVE PRE_EOF BLOCK" << endl;
 		#endif
 
 		/* Get the code for the pre-eof block. */
-		Code *code = parser->tables->gbl->frameInfo[frameId].codeWV;
+		Code *code = parser->tables->rtd->frameInfo[frameId].codeWV;
 
 		/* Execute the action and process the queue. */
 		execute_generation_action( prg, parser, code, 0 );
@@ -719,7 +719,7 @@ void FsmRun::sendEOF( )
 	parser->send( input );
 
 	if ( parser->errCount > 0 ) {
-		parser->parse_error( parser->tables->gbl->eofId, input->tree ) << 
+		parser->parse_error( parser->tables->rtd->eofId, input->tree ) << 
 				"parse error" << endp;
 	}
 
@@ -848,9 +848,9 @@ long FsmRun::run( PdaRun *destParser )
 
 			/* Check for a default token in the region. If one is there
 			 * then send it and continue with the processing loop. */
-			if ( parser->tables->gbl->regionInfo[region].defaultToken >= 0 ) {
+			if ( parser->tables->rtd->regionInfo[region].defaultToken >= 0 ) {
 				tokstart = tokend = p;
-				sendToken( parser->tables->gbl->regionInfo[region].defaultToken );
+				sendToken( parser->tables->rtd->regionInfo[region].defaultToken );
 				continue;
 			}
 
@@ -869,7 +869,7 @@ long FsmRun::run( PdaRun *destParser )
 				cs = tables->entryByRegion[region];
 				#ifdef COLM_LOG_PARSE
 				cerr << "new token region: " << 
-						parser->tables->gbl->regionInfo[region].name << endl;
+						parser->tables->rtd->regionInfo[region].name << endl;
 				#endif
 				continue;
 			}
@@ -892,7 +892,7 @@ long FsmRun::run( PdaRun *destParser )
 					cs = tables->entryByRegion[region];
 					#ifdef COLM_LOG_PARSE
 					cerr << "new token region: " << 
-							parser->tables->gbl->regionInfo[region].name << endl;
+							parser->tables->rtd->regionInfo[region].name << endl;
 					#endif
 					continue;
 				}
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index c77a74a9..a95399c9 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1658,7 +1658,7 @@ PdaTables *ParseData::makePdaTables( PdaGraph *pdaGraph )
 	}
 
 	/* Get a pointer to the (yet unfilled) global runtime data. */
-	pdaTables->gbl = runtimeData;
+	pdaTables->rtd = runtimeData;
 
 	return pdaTables;
 }
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 8fbeba97..795a95f6 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -353,7 +353,7 @@ again:
 
 	if ( *action & act_sb ) {
 		#ifdef COLM_LOG_PARSE
-		cerr << "shifted: " << tables->gbl->lelInfo[lel->tree->id].name;
+		cerr << "shifted: " << tables->rtd->lelInfo[lel->tree->id].name;
 		#endif
 		input = input->next;
 		lel->tree->alg->state = cs;
@@ -361,10 +361,10 @@ again:
 		stackTop = lel;
 
 		/* If shifting a termDup then change it to the nonterm. */
-		if ( lel->tree->id < tables->gbl->firstNonTermId &&
-				tables->gbl->lelInfo[lel->tree->id].termDupId > 0 )
+		if ( lel->tree->id < tables->rtd->firstNonTermId &&
+				tables->rtd->lelInfo[lel->tree->id].termDupId > 0 )
 		{
-			lel->tree->id = tables->gbl->lelInfo[lel->tree->id].termDupId;
+			lel->tree->id = tables->rtd->lelInfo[lel->tree->id].termDupId;
 			lel->tree->alg->flags |= AF_GENERATED;
 		}
 
@@ -399,7 +399,7 @@ again:
 		redAlg = prg->algPool.allocate();
 
 		redLel->tree->refs = 1;
-		redLel->tree->id = tables->gbl->prodInfo[reduction].lhsId;
+		redLel->tree->id = tables->rtd->prodInfo[reduction].lhsId;
 
 		redLel->next = 0;
 		redAlg->causeReduce = 0;
@@ -408,11 +408,11 @@ again:
 		lel->tree->alg->retry_lower = 0;
 
 		/* Allocate the attributes. */
-		objectLength = tables->gbl->lelInfo[redLel->tree->id].objectLength;
+		objectLength = tables->rtd->lelInfo[redLel->tree->id].objectLength;
 		attrs = alloc_attrs( prg, objectLength );
 
 		/* Build the list of children. */
-		rhsLen = tables->gbl->prodInfo[reduction].length;
+		rhsLen = tables->rtd->prodInfo[reduction].length;
 		child = last = 0;
 		for ( int r = 0; r < rhsLen; r++ ) {
 			child = stackTop;
@@ -425,7 +425,7 @@ again:
 
 		#ifdef COLM_LOG_PARSE
 		cerr << "reduced: "
-				<< tables->gbl->prodInfo[reduction].name
+				<< tables->rtd->prodInfo[reduction].name
 				<< " rhsLen: " << rhsLen;
 		#endif
 		if ( action[1] == 0 )
@@ -449,9 +449,9 @@ again:
 
 		assert( redLel->tree->refs == 1 );
 
-		if ( prg->ctxDepParsing && tables->gbl->prodInfo[reduction].frameId >= 0 ) {
+		if ( prg->ctxDepParsing && tables->rtd->prodInfo[reduction].frameId >= 0 ) {
 			/* Frame info for reduction. */
-			FrameInfo *fi = &tables->gbl->frameInfo[tables->gbl->prodInfo[reduction].frameId];
+			FrameInfo *fi = &tables->rtd->frameInfo[tables->rtd->prodInfo[reduction].frameId];
 
 			/* Execution environment for the reduction code. */
 			Execution execution( prg, reverseCode, 
@@ -485,7 +485,7 @@ again:
 		if ( induceReject ) {
 			#ifdef COLM_LOG_PARSE
 			cerr << "error induced during reduction of " <<
-					tables->gbl->lelInfo[redLel->tree->id].name << endl;
+					tables->rtd->lelInfo[redLel->tree->id].name << endl;
 			#endif
 			redLel->tree->alg->state = cs;
 			redLel->next = stackTop;
@@ -560,12 +560,12 @@ parseError:
 
 		/* Either we are dealing with a terminal that was
 		 * shifted or a nonterminal that was reduced. */
-		if ( stackTop->tree->id < tables->gbl->firstNonTermId || 
+		if ( stackTop->tree->id < tables->rtd->firstNonTermId || 
 				(stackTop->tree->alg->flags & AF_GENERATED) )
 		{
 			#ifdef COLM_LOG_PARSE
 			cerr << "backing up over effective terminal: " <<
-					tables->gbl->lelInfo[stackTop->tree->id].name << endl;
+					tables->rtd->lelInfo[stackTop->tree->id].name << endl;
 			#endif
 
 			/* Pop the item from the stack. */
@@ -573,7 +573,7 @@ parseError:
 
 			/* Undo the translation from termDup. */
 			if ( undoLel->tree->alg->flags & AF_GENERATED ) {
-				undoLel->tree->id = tables->gbl->lelInfo[undoLel->tree->id].termDupId;
+				undoLel->tree->id = tables->rtd->lelInfo[undoLel->tree->id].termDupId;
 				undoLel->tree->alg->flags &= ~AF_GENERATED;
 			}
 
@@ -584,7 +584,7 @@ parseError:
 		else {
 			#ifdef COLM_LOG_PARSE
 			cerr << "backing up over non-terminal: " <<
-					tables->gbl->lelInfo[stackTop->tree->id].name << endl;
+					tables->rtd->lelInfo[stackTop->tree->id].name << endl;
 			#endif
 
 			/* Take the alg out of undoLel. */
@@ -666,9 +666,9 @@ ostream &PdaRun::parse_error( int tokId, Tree *tree )
 {
 	cerr << "error:" << fsmRun->line << ": at token ";
 	if ( tokId < 128 )
-		cerr << "\"" << tables->gbl->lelInfo[tokId].name << "\"";
+		cerr << "\"" << tables->rtd->lelInfo[tokId].name << "\"";
 	else 
-		cerr << tables->gbl->lelInfo[tokId].name;
+		cerr << tables->rtd->lelInfo[tokId].name;
 	if ( string_length( tree->tokdata ) > 0 ) {
 		cerr << " with data \"";
 		cerr.write( string_data( tree->tokdata ), 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index ccb0290a..c78538de 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -436,7 +436,7 @@ struct PdaTables
 	int numCommitLen;
 	int numRegionItems;
 
-	RuntimeData *gbl;
+	RuntimeData *rtd;
 };
 
 bool make_reverse_code( CodeVect *all, CodeVect &reverseCode );
-- 
cgit v1.2.1


From 8bd44760137d615df994e1773d98d894139b7422 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 9 Nov 2008 00:27:56 +0000
Subject: Only store the original tree in Alg::parsed if the tree was changed.

---
 colm/pdarun.cpp | 14 ++++++++++----
 1 file changed, 10 insertions(+), 4 deletions(-)

diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 795a95f6..0fa9d028 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -122,8 +122,7 @@ bool been_committed( Kid *kid )
 }
 
 /* The top level of the stack is linked right-to-left. Trees underneath are
- * left to right natural order. */
-
+ * linked left-to-right. */
 void commit_kid( PdaRun *parser, Tree **root, Kid *lel )
 {
 	Alg *alg = 0;
@@ -459,8 +458,8 @@ again:
 
 			/* Take a copy of the lhs and store it in alg. May need it during
 			 * reverse parsing. */
-			redAlg->parsed = redLel->tree;
-			tree_upref( redAlg->parsed );
+			Tree *parsed = redLel->tree;
+			tree_upref( parsed );
 
 			/* Execute it. */
 			execution.execute( root );
@@ -474,6 +473,13 @@ again:
 			 * while in the environment. */
 			redLel->tree = execution.lhs;
 
+			/* If the lhs changed then store the original, otherwise downref
+			 * since we took a copy above. */
+			if ( parsed != redLel->tree )
+				redAlg->parsed = parsed;
+			else
+				tree_downref( prg, root, parsed );
+
 			/* Perhaps the execution environment is telling us we need to
 			 * reject the reduction. */
 			induceReject = execution.reject;
-- 
cgit v1.2.1


From f4d8fc2a9ece4efc584028ab0353df9a5f459808 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 9 Nov 2008 17:47:29 +0000
Subject: The order of node visitation in the commit code was changed. It was
 previously motivated by the need to execute final actions in kelbt. These
 were executed in the same order that try actions were executed in.

Now we want to walk the undo code stack as we commit so instead visit in the
order that unparsing would visit in: rightmost, topmost.
---
 colm/bytecode.cpp |  2 +-
 colm/bytecode.h   |  2 +-
 colm/pdarun.cpp   | 66 +++++++++++++++++++++++++++----------------------------
 3 files changed, 35 insertions(+), 35 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 7636160f..8edd1df0 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -121,7 +121,7 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 	PdaTables *tables = prg->rtd->parsers[parserId];
 	PdaRun parser( sp, prg, tables, stream->scanner, stopId, revertOn );
 	parser.run();
-	full_commit( &parser );
+	commit_full( &parser );
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
 	tree_upref( tree );
 	parser.clean();
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 3e45a79a..796af736 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -422,7 +422,7 @@ void rcode_downref( Program *prg, Tree **stack_root, Code *instr );
 void rcode_downref_all( Program *prg, Tree **stack_root, CodeVect *cv );
 void parsed_downref( Program *prg, Tree **root, Tree *tree );
 void parsed_downref_all( PdaRun *parser );
-void full_commit( PdaRun *parser );
+void commit_full( PdaRun *parser );
 
 bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool checkNext );
 Head *make_literal( Program *prg, long litoffset );
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 0fa9d028..00cbb975 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -136,22 +136,6 @@ head:
 	if ( alg->parsed != 0 )
 		tree = alg->parsed;
 
-	/* Recurse only on non-generated trees. */
-	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
-		vm_push( (Tree*)lel );
-		lel = tree_child( parser->prg, tree );
-
-		while ( lel != 0 ) {
-			if ( !been_committed( lel ) )
-				goto head;
-
-			upwards:
-			lel = lel->next;
-		}
-
-		lel = (Kid*)vm_pop();
-	}
-
 	/* Commit */
 	#ifdef COLM_LOG_PARSE
 	cerr << "commit visiting: " << 
@@ -171,14 +155,41 @@ head:
 	}
 	alg->flags |= AF_COMMITTED;
 
-	if ( sp != root )
-		goto upwards;
+	/* Recurse only on non-generated trees. */
+	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
+		vm_push( (Tree*)lel );
+		lel = tree_child( parser->prg, tree );
+
+		if ( lel != 0 ) {
+			while ( lel != 0 ) {
+				vm_push( (Tree*)lel );
+				lel = lel->next;
+			}
+
+			backwards:
+			lel = (Kid*)vm_pop();
+			if ( !been_committed( lel ) )
+				goto head;
+		}
+
+		upwards:
+		lel = (Kid*)vm_pop();
+	}
+
+
+	if ( sp != root ) {
+		Kid *next = (Kid*)vm_top();
+		if ( next->next == lel )
+			goto backwards;
+		else
+			goto upwards;
+	}
 
 	parser->numRetry = 0;
 	assert( sp == root );
 }
 
-void full_commit( PdaRun *parser )
+void commit_full( PdaRun *parser )
 {
 	#ifdef COLM_LOG_PARSE
 	cerr << "running full commit" << endl;
@@ -186,23 +197,12 @@ void full_commit( PdaRun *parser )
 	
 	Tree **sp = parser->root;
 	Kid *kid = parser->stackTop;
-	long topLevel = 0;
-	while ( kid != 0 && !been_committed( kid ) ) {
-		vm_push( (Tree*)kid );
-		kid = kid->next;
-		topLevel += 1;
-	}
 
-	while ( topLevel > 0 ) {
-		kid = (Kid*)vm_pop();
+	while ( kid != 0 && !been_committed( kid ) ) {
 		commit_kid( parser, sp, kid );
-		topLevel -= 1;
+		kid = kid->next;
 	}
 
-	/* After running the commit the the stack should be where it 
-	 * was when we started. */
-	assert( sp == parser->root );
-
 	/* We cannot always clear all the rcode here. We may need to backup over
 	 * the parse statement. We depend on the context flag. */
 	if ( !parser->revertOn ) {
@@ -383,7 +383,7 @@ again:
 	}
 
 	if ( tables->commitLen[pos] != 0 )
-		full_commit( this );
+		commit_full( this );
 
 	if ( *action & act_rb ) {
 		int objectLength, reduction = *action >> 2;
-- 
cgit v1.2.1


From 1c9e0e428092035b88770b5ee013b7f8e6d180c5 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 10 Nov 2008 21:27:43 +0000
Subject: Added a RESTORE_LHS reverse instruction that is added to the reverse
 code when lhs changes in a reduction. We then traverse the allReverseCode
 backwards during a commit to fetch the 'parsed' tree. Currently asserting
 this is identical to Alg::parsed. Eventually we will get rid of Alg::parsed.
 There are still some problems.

---
 colm/bytecode.cpp |  17 +++++++++
 colm/bytecode.h   |   2 +
 colm/pdarun.cpp   | 108 +++++++++++++++++++++++++++++++++++++-----------------
 3 files changed, 93 insertions(+), 34 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 8edd1df0..63fd3903 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -436,6 +436,14 @@ void rcode_downref( Program *prg, Tree **sp, Code *instr )
 {
 again:
 	switch ( *instr++ ) {
+		case IN_RESTORE_LHS: {
+			Tree *lhs;
+			read_tree( lhs );
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_RESTORE_LHS" << endl;
+			#endif
+			break;
+		}
 		case IN_PARSE_BKT: {
 			Half parserId;
 			Tree *stream, *tree;
@@ -698,6 +706,15 @@ void Execution::execute( Tree **&sp, Code *instr )
 {
 again:
 	switch ( *instr++ ) {
+		case IN_RESTORE_LHS: {
+			Tree *lhs;
+			read_tree( lhs );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_RESTORE_LHS" << endl;
+			#endif
+			break;
+		}
 		case IN_LOAD_NIL: {
 			#ifdef COLM_LOG_BYTECODE
 			cerr << "IN_LOAD_NIL" << endl;
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 796af736..36a79266 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -37,6 +37,8 @@ using std::ostream;
 typedef unsigned long ulong;
 typedef unsigned char uchar;
 
+#define IN_RESTORE_LHS           0xc0
+
 #define IN_LOAD_INT              0x01
 #define IN_LOAD_STR              0x02
 #define IN_LOAD_NIL              0x03
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 00cbb975..25a088f8 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -40,6 +40,23 @@ using std::endl;
 #define upper 0xffff0000
 #define reject() induceReject = 1
 
+#define read_word_p( i, p ) do { \
+	i = ((Word)  p[0]); \
+	i |= ((Word) p[1]) << 8; \
+	i |= ((Word) p[2]) << 16; \
+	i |= ((Word) p[3]) << 24; \
+} while(0)
+
+#define read_tree_p( i, p ) do { \
+	Word w; \
+	w = ((Word)  p[0]); \
+	w |= ((Word) p[1]) << 8; \
+	w |= ((Word) p[2]) << 16; \
+	w |= ((Word) p[3]) << 24; \
+	i = (Tree*)w; \
+} while(0)
+
+
 Tree *PdaRun::getParsedRoot( bool stop )
 {
 	return stop ? stackTop->tree : stackTop->next->tree;
@@ -123,26 +140,41 @@ bool been_committed( Kid *kid )
 
 /* The top level of the stack is linked right-to-left. Trees underneath are
  * linked left-to-right. */
-void commit_kid( PdaRun *parser, Tree **root, Kid *lel )
+void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&prcode )
 {
 	Alg *alg = 0;
 	Tree *tree = 0;
 	Tree **sp = root;
+	Tree *restore = 0;
 
 head:
+	/* Commit */
+	#ifdef COLM_LOG_PARSE
+	cerr << "commit visiting: " << 
+			parser->prg->rtd->lelInfo[lel->tree->id].name << endl;
+	#endif
+
 	/* Load up the parsed tree. */
 	tree = lel->tree;
 	alg = tree->alg;
 	if ( alg->parsed != 0 )
 		tree = alg->parsed;
 
-	/* Commit */
-	#ifdef COLM_LOG_PARSE
-	cerr << "commit visiting: " << 
-			parser->prg->rtd->lelInfo[lel->tree->id].name << endl;
-	#endif
+	restore = 0;
+	if ( alg->flags & AF_HAS_RCODE ) {
+		prcode -= 4;
+		Word len;
+		read_word_p( len, prcode );
+		prcode -= len;
+
+		if ( *prcode == IN_RESTORE_LHS ) {
+			cout << "has restore_lhs" << endl;
+			read_tree_p( restore, (prcode+1) );
+		}
+
+	}
+	assert( alg->parsed == restore );
 
-	alg = lel->tree->alg;
 
 	/* Reset retries. */
 	if ( alg->retry_lower > 0 ) {
@@ -156,7 +188,7 @@ head:
 	alg->flags |= AF_COMMITTED;
 
 	/* Recurse only on non-generated trees. */
-	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
+	if ( !(alg->flags & AF_GENERATED) && tree_child( parser->prg, tree ) != 0 ) {
 		vm_push( (Tree*)lel );
 		lel = tree_child( parser->prg, tree );
 
@@ -165,24 +197,25 @@ head:
 				vm_push( (Tree*)lel );
 				lel = lel->next;
 			}
+		}
+	}
+
+backup:
+	if ( sp != root ) {
+		Kid *next = (Kid*)vm_pop();
+		if ( next->next == lel ) {
+			/* Moving backwards. */
+			lel = next;
 
-			backwards:
-			lel = (Kid*)vm_pop();
 			if ( !been_committed( lel ) )
 				goto head;
 		}
+		else {
+			/* Moving upwards. */
+			lel = next;
+		}
 
-		upwards:
-		lel = (Kid*)vm_pop();
-	}
-
-
-	if ( sp != root ) {
-		Kid *next = (Kid*)vm_top();
-		if ( next->next == lel )
-			goto backwards;
-		else
-			goto upwards;
+		goto backup;
 	}
 
 	parser->numRetry = 0;
@@ -198,8 +231,10 @@ void commit_full( PdaRun *parser )
 	Tree **sp = parser->root;
 	Kid *kid = parser->stackTop;
 
+	Code *prcode = parser->allReverseCode->data + parser->allReverseCode->length();
+
 	while ( kid != 0 && !been_committed( kid ) ) {
-		commit_kid( parser, sp, kid );
+		commit_kid( parser, sp, kid, prcode );
 		kid = kid->next;
 	}
 
@@ -464,22 +499,27 @@ again:
 			/* Execute it. */
 			execution.execute( root );
 
-			/* Pull out the reverse code, if any. */
-			bool hasrcode = make_reverse_code( allReverseCode, reverseCode );
-			if ( hasrcode )
-				redAlg->flags |= AF_HAS_RCODE;
-
 			/* Transfer the lhs from the environment to redLel. It is uprefed
 			 * while in the environment. */
 			redLel->tree = execution.lhs;
 
 			/* If the lhs changed then store the original, otherwise downref
 			 * since we took a copy above. */
-			if ( parsed != redLel->tree )
+			if ( parsed != redLel->tree ) {
 				redAlg->parsed = parsed;
+				reverseCode.append( IN_RESTORE_LHS );
+				reverseCode.appendWord( (Word)parsed );
+				reverseCode.append( 5 );
+			}
 			else
 				tree_downref( prg, root, parsed );
 
+			/* Pull out the reverse code, if any. */
+			bool hasrcode = make_reverse_code( allReverseCode, reverseCode );
+			if ( hasrcode )
+				redAlg->flags |= AF_HAS_RCODE;
+
+
 			/* Perhaps the execution environment is telling us we need to
 			 * reject the reduction. */
 			induceReject = execution.reject;
@@ -598,6 +638,12 @@ parseError:
 			assert( alg != 0 );
 			undoLel->tree->alg = 0;
 
+			if ( alg->parsed != 0 ) {
+				/* Get the lhs, it may have been reverted. */
+				tree_downref( prg, root, undoLel->tree );
+				undoLel->tree = alg->parsed;
+			}
+
 			/* Check for an execution environment. */
 			if ( alg->flags & AF_HAS_RCODE ) {
 				Execution execution( prg, reverseCode, this, 0, 0, 0 );
@@ -607,12 +653,6 @@ parseError:
 				alg->flags &= ~AF_HAS_RCODE;
 			}
 
-			if ( alg->parsed != 0 ) {
-				/* Get the lhs, it may have been reverted. */
-				tree_downref( prg, root, undoLel->tree );
-				undoLel->tree = alg->parsed;
-			}
-
 			/* Warm fuzzies ... */
 			assert( undoLel == stackTop );
 
-- 
cgit v1.2.1


From eca13f865eb3d00191f1e88d0d83e5a8ef70c5b8 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 10 Nov 2008 23:22:13 +0000
Subject: Need to consider causeReduce when backing up over rcode in the
 commit function.

---
 colm/pdarun.cpp | 67 +++++++++++++++++++++++++++++++++++++++++++++++----------
 1 file changed, 56 insertions(+), 11 deletions(-)

diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 25a088f8..8f2193d4 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -138,14 +138,24 @@ bool been_committed( Kid *kid )
 	return kid->tree->alg->flags & AF_COMMITTED;
 }
 
+Code *backup_over_rcode( Code *rcode )
+{
+	Word len;
+	rcode -= 4;
+	read_word_p( len, rcode );
+	rcode -= len;
+	return rcode;
+}
+
 /* The top level of the stack is linked right-to-left. Trees underneath are
  * linked left-to-right. */
-void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&prcode )
+void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&rcode )
 {
 	Alg *alg = 0;
 	Tree *tree = 0;
 	Tree **sp = root;
 	Tree *restore = 0;
+	long causeReduce = 0;
 
 head:
 	/* Commit */
@@ -160,21 +170,50 @@ head:
 	if ( alg->parsed != 0 )
 		tree = alg->parsed;
 
+	/* Check for reverse code. */
 	restore = 0;
 	if ( alg->flags & AF_HAS_RCODE ) {
-		prcode -= 4;
-		Word len;
-		read_word_p( len, prcode );
-		prcode -= len;
-
-		if ( *prcode == IN_RESTORE_LHS ) {
-			cout << "has restore_lhs" << endl;
-			read_tree_p( restore, (prcode+1) );
+		/* If tree caused some reductions, now is not the right time to backup
+		 * over the reverse code. We need to backup over the reductions first. Store
+		 * the count of the reductions and do it when the count drops to zero. */
+		if ( alg->causeReduce > 0 ) {
+			/* The top reduce block does not correspond to this alg. */
+			#ifdef COLM_LOG_PARSE
+			cerr << "commit: causeReduce found, delaying backup: " << (long)alg->causeReduce << endl;
+			#endif
+			causeReduce = alg->causeReduce;
 		}
+		else {
+			rcode = backup_over_rcode( rcode );
 
+			if ( *rcode == IN_RESTORE_LHS ) {
+				#if COLM_LOG_PARSE
+				cerr << "commit: has restore_lhs" << endl;
+				#endif
+				read_tree_p( restore, (rcode+1) );
+			}
+		}
 	}
+
+	/* Assert that we have the right restore tree. */
 	assert( alg->parsed == restore );
 
+	/* Check causeReduce, might be time to backup over the reverse code
+	 * belonging to a nonterminal that caused previous reductions. */
+	if ( tree->id >= parser->tables->rtd->firstNonTermId &&
+			!(alg->flags & AF_GENERATED) && causeReduce > 0 )
+	{
+		causeReduce -= 1;
+
+		if ( causeReduce == 0 ) {
+			#ifdef COLM_LOG_PARSE
+			cerr << "commit: causeReduce dropped to zero, backing up over rcode" << endl;
+			#endif
+
+			/* Cause reduce just dropped down to zero. */
+			rcode = backup_over_rcode( rcode );
+		}
+	}
 
 	/* Reset retries. */
 	if ( alg->retry_lower > 0 ) {
@@ -231,10 +270,12 @@ void commit_full( PdaRun *parser )
 	Tree **sp = parser->root;
 	Kid *kid = parser->stackTop;
 
-	Code *prcode = parser->allReverseCode->data + parser->allReverseCode->length();
+	Code *rcode = parser->allReverseCode->data + parser->allReverseCode->length();
 
+	/* The top level of the stack is linked right to left. This is the
+	 * traversal order we need for committing. */
 	while ( kid != 0 && !been_committed( kid ) ) {
-		commit_kid( parser, sp, kid, prcode );
+		commit_kid( parser, sp, kid, rcode );
 		kid = kid->next;
 	}
 
@@ -506,6 +547,10 @@ again:
 			/* If the lhs changed then store the original, otherwise downref
 			 * since we took a copy above. */
 			if ( parsed != redLel->tree ) {
+				#ifdef COLM_LOG_PARSE
+				cerr << "lhs tree was modified, adding a restore instruction" << endl;
+				#endif
+
 				redAlg->parsed = parsed;
 				reverseCode.append( IN_RESTORE_LHS );
 				reverseCode.appendWord( (Word)parsed );
-- 
cgit v1.2.1


From 5c7d8263513519b09e2638eb9cb64be1cb6d6c51 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 11 Nov 2008 01:34:19 +0000
Subject: When committing we need to take into account the causeReduce of the
 next input item that is waiting in the parse function.

---
 colm/bytecode.cpp |  2 +-
 colm/bytecode.h   |  2 +-
 colm/pdarun.cpp   | 23 +++++++++++++++--------
 3 files changed, 17 insertions(+), 10 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 63fd3903..32627b5b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -121,7 +121,7 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 	PdaTables *tables = prg->rtd->parsers[parserId];
 	PdaRun parser( sp, prg, tables, stream->scanner, stopId, revertOn );
 	parser.run();
-	commit_full( &parser );
+	commit_full( &parser, 0 );
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
 	tree_upref( tree );
 	parser.clean();
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 36a79266..b46c8e40 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -424,7 +424,7 @@ void rcode_downref( Program *prg, Tree **stack_root, Code *instr );
 void rcode_downref_all( Program *prg, Tree **stack_root, CodeVect *cv );
 void parsed_downref( Program *prg, Tree **root, Tree *tree );
 void parsed_downref_all( PdaRun *parser );
-void commit_full( PdaRun *parser );
+void commit_full( PdaRun *parser, long commitReduce );
 
 bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool checkNext );
 Head *make_literal( Program *prg, long litoffset );
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 8f2193d4..ba5d6042 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -149,13 +149,12 @@ Code *backup_over_rcode( Code *rcode )
 
 /* The top level of the stack is linked right-to-left. Trees underneath are
  * linked left-to-right. */
-void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&rcode )
+void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&rcode, long &causeReduce )
 {
 	Alg *alg = 0;
 	Tree *tree = 0;
 	Tree **sp = root;
 	Tree *restore = 0;
-	long causeReduce = 0;
 
 head:
 	/* Commit */
@@ -200,8 +199,9 @@ head:
 
 	/* Check causeReduce, might be time to backup over the reverse code
 	 * belonging to a nonterminal that caused previous reductions. */
-	if ( tree->id >= parser->tables->rtd->firstNonTermId &&
-			!(alg->flags & AF_GENERATED) && causeReduce > 0 )
+	if ( causeReduce > 0 && 
+			tree->id >= parser->tables->rtd->firstNonTermId &&
+			!(alg->flags & AF_GENERATED) )
 	{
 		causeReduce -= 1;
 
@@ -261,7 +261,7 @@ backup:
 	assert( sp == root );
 }
 
-void commit_full( PdaRun *parser )
+void commit_full( PdaRun *parser, long causeReduce )
 {
 	#ifdef COLM_LOG_PARSE
 	cerr << "running full commit" << endl;
@@ -275,7 +275,7 @@ void commit_full( PdaRun *parser )
 	/* The top level of the stack is linked right to left. This is the
 	 * traversal order we need for committing. */
 	while ( kid != 0 && !been_committed( kid ) ) {
-		commit_kid( parser, sp, kid, rcode );
+		commit_kid( parser, sp, kid, rcode, causeReduce );
 		kid = kid->next;
 	}
 
@@ -458,8 +458,15 @@ again:
 		#endif
 	}
 
-	if ( tables->commitLen[pos] != 0 )
-		commit_full( this );
+	if ( tables->commitLen[pos] != 0 ) {
+		long causeReduce = 0;
+		if ( input != 0 ) { 
+			Alg *alg = input->tree->alg;
+			if ( alg->flags & AF_HAS_RCODE )
+				causeReduce = alg->causeReduce;
+		}
+		commit_full( this, causeReduce );
+	}
 
 	if ( *action & act_rb ) {
 		int objectLength, reduction = *action >> 2;
-- 
cgit v1.2.1


From a5d3ee353957dce28dd0546d1e4a17921ab896e7 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 11 Nov 2008 04:38:10 +0000
Subject: need to call the parse function

---
 test/xml/xml.lm | 23 ++++++++++++-----------
 1 file changed, 12 insertions(+), 11 deletions(-)

diff --git a/test/xml/xml.lm b/test/xml/xml.lm
index c8749bab..803d4a5d 100644
--- a/test/xml/xml.lm
+++ b/test/xml/xml.lm
@@ -149,19 +149,20 @@ def document
 
 def start 
 	[document]
+
+start S = parse start(stdin)
+
+for Switch:tag in S {
+	if match Switch
+			["<lm_switch>" SwitchContent:content "</lm_switch>"]
 	{
-		for Switch:tag in lhs {
-			if match Switch
-					["<lm_switch>" SwitchContent:content "</lm_switch>"]
+		print( 'SWITCH\n' )
+		for Text:tag in SwitchContent {
+			if match Text
+					["<text>" TextContent:content "</text>"]
 			{
-				print( 'SWITCH\n' )
-				for Text:tag in SwitchContent {
-					if match Text
-							["<text>" TextContent:content "</text>"]
-					{
-						print( ' ', TextContent, '\n' )
-					}
-				}
+				print( ' ', TextContent, '\n' )
 			}
 		}
 	}
+}
-- 
cgit v1.2.1


From 0f9262ebc36d0c4ef787990b6bc8c891c32f32a7 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 11 Nov 2008 22:17:40 +0000
Subject: In XML output print the ignore tokens ahead of the token and on the
 same level. Also print the attributes with an attribute index number. The
 attribute names are not currently compiled into the output program.

---
 colm/bytecode.cpp |  2 +-
 colm/bytecode.h   |  4 +--
 colm/tree.cpp     | 95 ++++++++++++++++++++++++++++++++++++++++++-------------
 3 files changed, 76 insertions(+), 25 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 32627b5b..af229e24 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -784,7 +784,7 @@ again:
 			#endif
 
 			Tree *tree = pop();
-			xml_print_tree( sp, prg, tree );
+			print_xml_tree( sp, prg, tree );
 			tree_downref( prg, sp, tree );
 			break;
 		}
diff --git a/colm/bytecode.h b/colm/bytecode.h
index b46c8e40..9d207087 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -458,8 +458,8 @@ Tree *make_token( Tree **root, Program *prg, long nargs );
 void print_tree( Tree **&sp, Program *prg, Tree *tree );
 void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
 void print_str( Head *str );
-void xml_print_tree( Tree **&sp, Program *prg, Tree *tree );
-void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
+void print_xml_tree( Tree **&sp, Program *prg, Tree *tree );
+void print_xml_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
 
 long list_length( List *list );
 void list_append( Program *prg, List *list, Tree *val );
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 1206bf91..c9613b34 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -365,7 +365,9 @@ void print_str( Head *str )
 	cout.write( (char*)(str->data), str->length );
 }
 
-void print_ignore_list( Tree **&sp, Program *prg, Tree *tree )
+/* Note that this function causes recursion, thought it is not a big
+ * deal since the recursion it is only caused by nonterminals that are ignored. */
+void print_ignore_list( Tree **sp, Program *prg, Tree *tree )
 {
 	Kid *ignore = tree_ignore( prg, tree );
 
@@ -383,6 +385,7 @@ void print_ignore_list( Tree **&sp, Program *prg, Tree *tree )
 	}
 }
 
+
 void print_kid( ostream &out, Tree **&sp, Program *prg, Kid *kid, bool printIgnore )
 {
 	Tree **root = vm_ptop();
@@ -475,72 +478,120 @@ void xml_escape_data( const char *data, long len )
 	}
 }
 
-void xml_print_kid( Tree **&sp, Program *prg, Kid *kid, int depth )
+/* Might be a good idea to include this in the print_xml_kid function since
+ * it is recursive and can eat up stac, however it's probably not a big deal
+ * since the additional stack depth is only caused for nonterminals that are
+ * ignored. */
+void print_xml_ignore_list( Tree **sp, Program *prg, Tree *tree, long depth )
 {
+	Kid *ignore = tree_ignore( prg, tree );
+	while ( tree_is_ignore( prg, ignore ) ) {
+		print_xml_kid( sp, prg, ignore, depth );
+		ignore = ignore->next;
+	}
+}
+
+
+void print_xml_kid( Tree **&sp, Program *prg, Kid *kid, int depth )
+{
+	Kid *child;
 	Tree **root = vm_ptop();
-	int i = 0;
+	long i, objectLength;
+	LangElInfo *lelInfo = prg->rtd->lelInfo;
+
+	long kidNum = 0;;
 
 rec_call:
-	for ( i = 0; i < depth; i++ )
-		cout << "  ";
 
-	if ( kid->tree == 0 )
+	if ( kid->tree == 0 ) {
+		for ( i = 0; i < depth; i++ )
+			cout << "  ";
+
 		cout << "NIL" << endl;
+	}
 	else {
-		cout << '<' << prg->rtd->lelInfo[kid->tree->id].name;
-		if ( kid->tree->child != 0 ) {
+		/* First print the ignore tokens. */
+		print_xml_ignore_list( sp, prg, kid->tree, depth );
+
+		for ( i = 0; i < depth; i++ )
+			cout << "  ";
+
+		/* Open the tag. Afterwards we will either print data underneath it or
+		 * we will close it off immediately. */
+		cout << '<' << lelInfo[kid->tree->id].name;
+
+		/* If the parent kid is a repeat then skip this node and go
+		 * right to the first child (repeated item). */
+		if ( vm_ptop() != root ) {
+			objectLength = lelInfo[((Kid*)vm_top())->tree->id].objectLength;
+			if ( kidNum < objectLength )
+				cout << " attr=" << kidNum;
+		}
+
+		objectLength = lelInfo[kid->tree->id].objectLength;
+		child = tree_child( prg, kid->tree );
+		if ( objectLength > 0 || child != 0 ) {
 			cout << '>' << endl;
+			vm_push( (SW) kidNum );
 			vm_push( (SW) kid );
+
+			kidNum = 0;
 			kid = kid->tree->child;
 			while ( kid != 0 ) {
-				depth++;
-				goto rec_call;
-				rec_return:
-				depth--;
+				if ( kid->tree == 0 || !lelInfo[kid->tree->id].ignore ) {
+					depth++;
+					goto rec_call;
+					rec_return:
+					depth--;
+				}
+				
 				kid = kid->next;
+				kidNum += 1;
 
 				/* If the parent kid is a repeat then skip this node and go
 				 * right to the first child (repeated item). */
-				if ( prg->rtd->lelInfo[((Kid*)vm_top())->tree->id].repeat )
+				if ( lelInfo[((Kid*)vm_top())->tree->id].repeat )
 					kid = kid->tree->child;
 			}
+
 			kid = (Kid*) vm_pop();
+			kidNum = (long) vm_pop();
 
 			for ( i = 0; i < depth; i++ )
 				cout << "  ";
-			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+			cout << "</" << lelInfo[kid->tree->id].name << '>' << endl;
 		}
 		else if ( kid->tree->id == LEL_ID_PTR ) {
 			cout << '>' << (void*)((Pointer*)kid->tree)->value << 
-					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+					"</" << lelInfo[kid->tree->id].name << '>' << endl;
 		}
 		else if ( kid->tree->id == LEL_ID_BOOL ) {
 			if ( ((Int*)kid->tree)->value )
 				cout << ">true</";
 			else
 				cout << ">false</";
-			cout << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+			cout << lelInfo[kid->tree->id].name << '>' << endl;
 		}
 		else if ( kid->tree->id == LEL_ID_INT ) {
 			cout << '>' << ((Int*)kid->tree)->value << 
-					"</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+					"</" << lelInfo[kid->tree->id].name << '>' << endl;
 		}
 		else if ( kid->tree->id == LEL_ID_STR ) {
 			Head *head = (Head*) ((Str*)kid->tree)->value;
 
 			cout << '>';
 			xml_escape_data( (char*)(head->data), head->length );
-			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+			cout << "</" << lelInfo[kid->tree->id].name << '>' << endl;
 		}
 		else if ( 0 < kid->tree->id && kid->tree->id < prg->rtd->firstNonTermId &&
 				kid->tree->tokdata != 0 && 
 				string_length( kid->tree->tokdata ) > 0 && 
-				!prg->rtd->lelInfo[kid->tree->id].literal )
+				!lelInfo[kid->tree->id].literal )
 		{
 			cout << '>';
 			xml_escape_data( string_data( kid->tree->tokdata ), 
 					string_length( kid->tree->tokdata ) );
-			cout << "</" << prg->rtd->lelInfo[kid->tree->id].name << '>' << endl;
+			cout << "</" << lelInfo[kid->tree->id].name << '>' << endl;
 		}
 		else
 			cout << "/>" << endl;
@@ -550,12 +601,12 @@ rec_call:
 		goto rec_return;
 }
 
-void xml_print_tree( Tree **&sp, Program *prg, Tree *tree )
+void print_xml_tree( Tree **&sp, Program *prg, Tree *tree )
 {
 	Kid kid;
 	kid.tree = tree;
 	kid.next = 0;
-	xml_print_kid( sp, prg, &kid, 0 );
+	print_xml_kid( sp, prg, &kid, 0 );
 }
 
 void stream_free( Program *prg, Stream *s )
-- 
cgit v1.2.1


From 86c0c6b3be492f8e79795b55970f01a76c86802a Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 11 Nov 2008 23:07:57 +0000
Subject: Need a VM stack for parsing patterns. The VM stack is now used for
 more than just VM execution (eg: printing and deallocation).

---
 colm/bytecode.cpp  | 13 ++++++++++---
 colm/bytecode.h    |  2 ++
 colm/parsedata.cpp |  7 +++++--
 3 files changed, 17 insertions(+), 5 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index af229e24..ed305c9b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -350,6 +350,14 @@ void Program::allocGlobal()
 	global = tree;
 }
 
+Tree **stack_alloc()
+{
+	//return new Tree*[VM_STACK_SIZE];
+
+	return (Tree**)mmap( 0, sizeof(Tree*)*VM_STACK_SIZE,
+		PROT_READ | PROT_WRITE, MAP_ANONYMOUS | MAP_PRIVATE, 0, 0 );
+}
+
 void Program::run()
 {
 	assert( sizeof(Int)      <= sizeof(Tree) );
@@ -366,9 +374,8 @@ void Program::run()
 	 * Allocate the VM stack.
 	 */
 
-	//vm_stack = new Tree*[VM_STACK_SIZE];
-	Tree **vm_stack = (Tree**)mmap( 0, sizeof(Tree*)*VM_STACK_SIZE,
-		PROT_READ | PROT_WRITE, MAP_ANONYMOUS | MAP_PRIVATE, 0, 0 );
+	Tree **vm_stack = stack_alloc();
+
 	Tree **root = &vm_stack[VM_STACK_SIZE];
 
 	/*
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 9d207087..5126c04f 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -495,6 +495,8 @@ Tree *tree_search( Kid *kid, long id );
 Tree *tree_search( Tree *tree, long id );
 void split_ref( Tree **&sp, Program *prg, Ref *fromRef );
 
+Tree **stack_alloc();
+
 /*
  * Maps
  */
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 3fadf73d..7d42f03b 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1630,13 +1630,15 @@ void ParseData::parsePatterns()
 {
 	Program program( false, runtimeData );
 	FsmRun fsmRun( &program );
+	Tree **vm_stack = stack_alloc();
 
 	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
 		//cerr << "parsing replacement: " << repl->data << endl;
 		InputStreamRepl in( repl );
 		fsmRun.attachInputStream( &in );
 
-		repl->pdaRun = new PdaRun( 0, &program, repl->langEl->pdaTables, &fsmRun, 0, false );
+		repl->pdaRun = new PdaRun( vm_stack, &program,
+				repl->langEl->pdaTables, &fsmRun, 0, false );
 		repl->pdaRun->run();
 
 		//#ifdef COLM_LOG_COMPILE
@@ -1649,7 +1651,8 @@ void ParseData::parsePatterns()
 		InputStreamPattern in( pat );
 		fsmRun.attachInputStream( &in );
 
-		pat->pdaRun = new PdaRun( 0, &program, pat->langEl->pdaTables, &fsmRun, 0, false );
+		pat->pdaRun = new PdaRun( vm_stack, &program,
+				pat->langEl->pdaTables, &fsmRun, 0, false );
 		pat->pdaRun->run();
 
 		//#ifdef COLM_LOG_COMPILE
-- 
cgit v1.2.1


From f173d370d90ec09ec58d0453fdb4247ad98501e7 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 12 Nov 2008 00:13:42 +0000
Subject: Stop using parsed_downref and instead downref parsed in the
 rcode_downref under the RESTORE_LHS instruction. Just need to hook in the
 restore of lhs in the reverse code execution and the Alg::parsed field will
 just be a shadow.

---
 colm/bytecode.cpp |  2 +-
 colm/bytecode.h   |  9 +++--
 colm/pdarun.cpp   | 99 ++-----------------------------------------------------
 colm/tree.cpp     |  2 +-
 4 files changed, 9 insertions(+), 103 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index ed305c9b..f8aaf662 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -449,6 +449,7 @@ again:
 			#ifdef COLM_LOG_BYTECODE
 			cerr << "IN_RESTORE_LHS" << endl;
 			#endif
+			tree_downref( prg, sp, lhs );
 			break;
 		}
 		case IN_PARSE_BKT: {
@@ -464,7 +465,6 @@ again:
 			cerr << "IN_PARSE_BKT " << parserId << endl;
 			#endif
 
-			parsed_downref( prg, sp, tree );
 			rcode_downref_all( prg, sp, (CodeVect*)wrev );
 			tree_downref( prg, sp, stream );
 			tree_downref( prg, sp, tree );
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 5126c04f..9060d2da 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -247,11 +247,10 @@ typedef unsigned char uchar;
 
 #define AF_GENERATED   0x1
 #define AF_COMMITTED   0x2
-#define AF_REV_FREED   0x4
-#define AF_ARTIFICIAL  0x8
-#define AF_NAMED       0x10
-#define AF_GROUP_MEM   0x20
-#define AF_HAS_RCODE   0x40
+#define AF_ARTIFICIAL  0x4
+#define AF_NAMED       0x8
+#define AF_GROUP_MEM   0x10
+#define AF_HAS_RCODE   0x20
 
 /*
  * Call stack.
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index ba5d6042..a89f67b7 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -178,7 +178,8 @@ head:
 		if ( alg->causeReduce > 0 ) {
 			/* The top reduce block does not correspond to this alg. */
 			#ifdef COLM_LOG_PARSE
-			cerr << "commit: causeReduce found, delaying backup: " << (long)alg->causeReduce << endl;
+			cerr << "commit: causeReduce found, delaying backup: " << 
+					(long)alg->causeReduce << endl;
 			#endif
 			causeReduce = alg->causeReduce;
 		}
@@ -281,104 +282,10 @@ void commit_full( PdaRun *parser, long causeReduce )
 
 	/* We cannot always clear all the rcode here. We may need to backup over
 	 * the parse statement. We depend on the context flag. */
-	if ( !parser->revertOn ) {
-		parsed_downref_all( parser );
+	if ( !parser->revertOn )
 		rcode_downref_all( parser->prg, parser->root, parser->allReverseCode );
-	}
-}
-
-bool been_freed( Kid *kid )
-{
-	return kid->tree->alg->flags & AF_REV_FREED;
 }
 
-/* The top level of the stack is linked right-to-left. Trees underneath are
- * left to right natural order. */
-void parsed_downref_kid( Tree **root, Program *prg, Kid *lel )
-{
-	Alg *alg = 0;
-	Tree *tree = 0;
-	Tree **sp = root;
-
-head:
-	/* Load up the right tree. */
-	tree = lel->tree;
-	alg = tree->alg;
-	if ( alg->parsed != 0 )
-		tree = alg->parsed;
-
-	/* Recurse. */
-	if ( !(alg->flags & AF_GENERATED) && tree->child != 0 ) {
-		vm_push( (Tree*)lel );
-		lel = tree_child( prg, tree );
-
-		while ( lel != 0 ) {
-			if ( !been_freed( lel ) )
-				goto head;
-
-			upwards:
-			lel = lel->next;
-		}
-
-		lel = (Kid*)vm_pop();
-	}
-
-	/* Commit */
-	#ifdef COLM_LOG_PARSE
-	cerr << "parsed_downref_kid visiting: " << 
-			prg->rtd->lelInfo[lel->tree->id].name << endl;
-	#endif
-
-	alg = lel->tree->alg;
-
-	alg->flags |= AF_REV_FREED;
-
-	tree_downref( prg, sp, alg->parsed );
-	alg->parsed = 0;
-
-	if ( sp != root )
-		goto upwards;
-
-	assert( sp == root );
-}
-
-void parsed_downref( Program *prg, Tree **root, Tree *tree )
-{
-	#ifdef COLM_LOG_PARSE
-	cerr << "running parsed_downref on tree" << endl;
-	#endif
-
-	Kid kid;
-	kid.next = 0;
-	kid.tree = tree;
-	parsed_downref_kid( root, prg, &kid );
-}
-
-void parsed_downref_all( PdaRun *parser )
-{
-	#ifdef COLM_LOG_PARSE
-	cerr << "running full parsed_downref" << endl;
-	#endif
-	
-	Tree **sp = parser->root;
-	Kid *kid = parser->stackTop;
-	long topLevel = 0;
-	while ( kid != 0 && !been_freed( kid ) ) {
-		vm_push( (Tree*)kid );
-		kid = kid->next;
-		topLevel += 1;
-	}
-
-	while ( topLevel > 0 ) {
-		kid = (Kid*)vm_pop();
-		parsed_downref_kid( sp, parser->prg, kid );
-		topLevel -= 1;
-	}
-
-	/* After running the commit the the stack should be where it 
-	 * was when we started. */
-	assert( sp == parser->root );
-}
 
 /*
  * shift:         retry goes into lower of shifted node.
diff --git a/colm/tree.cpp b/colm/tree.cpp
index c9613b34..bb38ed6a 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -863,7 +863,7 @@ free_tree:
 		else { 
 			if ( tree->alg != 0 ) {
 				//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
-				vm_push( tree->alg->parsed );
+				//vm_push( tree->alg->parsed );
 				prg->algPool.free( tree->alg );
 			}
 			string_free( prg, tree->tokdata );
-- 
cgit v1.2.1


From f2ed2c24ae5a098755dfcad3610cd0add92e2127 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 12 Nov 2008 04:46:43 +0000
Subject: Use the result of the RESTORE_LHS after running undo code. Assert the
 result against Alg::parsed.

Fix of stack allocation for pattern and constructor parsing: need to compute the
root of the stack relative to the end of the memory allocation.
---
 colm/bytecode.cpp  |  7 ++++---
 colm/parsedata.cpp |  5 +++--
 colm/pdarun.cpp    | 18 +++++++++++-------
 3 files changed, 18 insertions(+), 12 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index f8aaf662..4cdaae80 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -375,7 +375,6 @@ void Program::run()
 	 */
 
 	Tree **vm_stack = stack_alloc();
-
 	Tree **root = &vm_stack[VM_STACK_SIZE];
 
 	/*
@@ -714,12 +713,14 @@ void Execution::execute( Tree **&sp, Code *instr )
 again:
 	switch ( *instr++ ) {
 		case IN_RESTORE_LHS: {
-			Tree *lhs;
-			read_tree( lhs );
+			Tree *restore;
+			read_tree( restore );
 
 			#ifdef COLM_LOG_BYTECODE
 			cerr << "IN_RESTORE_LHS" << endl;
 			#endif
+			assert( lhs == 0 );
+			lhs = restore;
 			break;
 		}
 		case IN_LOAD_NIL: {
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 7d42f03b..96ba9b7d 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1631,13 +1631,14 @@ void ParseData::parsePatterns()
 	Program program( false, runtimeData );
 	FsmRun fsmRun( &program );
 	Tree **vm_stack = stack_alloc();
+	Tree **root = &vm_stack[VM_STACK_SIZE];
 
 	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
 		//cerr << "parsing replacement: " << repl->data << endl;
 		InputStreamRepl in( repl );
 		fsmRun.attachInputStream( &in );
 
-		repl->pdaRun = new PdaRun( vm_stack, &program,
+		repl->pdaRun = new PdaRun( root, &program,
 				repl->langEl->pdaTables, &fsmRun, 0, false );
 		repl->pdaRun->run();
 
@@ -1651,7 +1652,7 @@ void ParseData::parsePatterns()
 		InputStreamPattern in( pat );
 		fsmRun.attachInputStream( &in );
 
-		pat->pdaRun = new PdaRun( vm_stack, &program,
+		pat->pdaRun = new PdaRun( root, &program,
 				pat->langEl->pdaTables, &fsmRun, 0, false );
 		pat->pdaRun->run();
 
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index a89f67b7..10904486 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -470,8 +470,11 @@ again:
 				reverseCode.appendWord( (Word)parsed );
 				reverseCode.append( 5 );
 			}
-			else
+			else {
+				/* No change in the the lhs. Just free the parsed copy we
+				 * took. */
 				tree_downref( prg, root, parsed );
+			}
 
 			/* Pull out the reverse code, if any. */
 			bool hasrcode = make_reverse_code( allReverseCode, reverseCode );
@@ -597,12 +600,6 @@ parseError:
 			assert( alg != 0 );
 			undoLel->tree->alg = 0;
 
-			if ( alg->parsed != 0 ) {
-				/* Get the lhs, it may have been reverted. */
-				tree_downref( prg, root, undoLel->tree );
-				undoLel->tree = alg->parsed;
-			}
-
 			/* Check for an execution environment. */
 			if ( alg->flags & AF_HAS_RCODE ) {
 				Execution execution( prg, reverseCode, this, 0, 0, 0 );
@@ -610,6 +607,13 @@ parseError:
 				/* Do the reverse exeuction. */
 				execution.rexecute( root, allReverseCode );
 				alg->flags &= ~AF_HAS_RCODE;
+
+				if ( execution.lhs != 0 ) {
+					/* Get the lhs, it may have been reverted. */
+					tree_downref( prg, root, undoLel->tree );
+					assert( execution.lhs == alg->parsed );
+					undoLel->tree = execution.lhs;
+				}
 			}
 
 			/* Warm fuzzies ... */
-- 
cgit v1.2.1


From a1d7c7a3417a3f432c4a99cbd7465aa4a74d4b7a Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 12 Nov 2008 04:55:08 +0000
Subject: Don't need to clear the entire vm_stack.

---
 colm/bytecode.cpp | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 4cdaae80..76ba7a0a 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -337,8 +337,7 @@ void Program::clear( Tree **vm_stack, Tree **sp )
 	mapElPool.clear();
 
 	//reverseCode.empty();
-
-	memset( vm_stack, 0, sizeof(Tree*) * VM_STACK_SIZE);
+	//memset( vm_stack, 0, sizeof(Tree*) * VM_STACK_SIZE);
 }
 
 void Program::allocGlobal()
-- 
cgit v1.2.1


From 97f2ed0beb69e23c89a0a607e6619b704ac2e13e Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 12 Nov 2008 16:46:26 +0000
Subject: In the commit code restore the tree from the tree pointer extracted
 from the RESTORE_LHS instruction. This is the last place where we are
 dependent on Alg::parsed.

---
 colm/pdarun.cpp | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 10904486..95690974 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -166,8 +166,6 @@ head:
 	/* Load up the parsed tree. */
 	tree = lel->tree;
 	alg = tree->alg;
-	if ( alg->parsed != 0 )
-		tree = alg->parsed;
 
 	/* Check for reverse code. */
 	restore = 0;
@@ -198,6 +196,9 @@ head:
 	/* Assert that we have the right restore tree. */
 	assert( alg->parsed == restore );
 
+	if ( restore != 0 )
+		tree = restore;
+
 	/* Check causeReduce, might be time to backup over the reverse code
 	 * belonging to a nonterminal that caused previous reductions. */
 	if ( causeReduce > 0 && 
@@ -481,7 +482,6 @@ again:
 			if ( hasrcode )
 				redAlg->flags |= AF_HAS_RCODE;
 
-
 			/* Perhaps the execution environment is telling us we need to
 			 * reject the reduction. */
 			induceReject = execution.reject;
-- 
cgit v1.2.1


From 84e1b37b013a6e6854348ff406a0c9e1707ba560 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 12 Nov 2008 17:02:15 +0000
Subject: Removed Alg::parsed.

---
 colm/pdarun.cpp | 5 -----
 colm/pdarun.h   | 1 -
 2 files changed, 6 deletions(-)

diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 95690974..1396bc35 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -193,9 +193,6 @@ head:
 		}
 	}
 
-	/* Assert that we have the right restore tree. */
-	assert( alg->parsed == restore );
-
 	if ( restore != 0 )
 		tree = restore;
 
@@ -466,7 +463,6 @@ again:
 				cerr << "lhs tree was modified, adding a restore instruction" << endl;
 				#endif
 
-				redAlg->parsed = parsed;
 				reverseCode.append( IN_RESTORE_LHS );
 				reverseCode.appendWord( (Word)parsed );
 				reverseCode.append( 5 );
@@ -611,7 +607,6 @@ parseError:
 				if ( execution.lhs != 0 ) {
 					/* Get the lhs, it may have been reverted. */
 					tree_downref( prg, root, undoLel->tree );
-					assert( execution.lhs == alg->parsed );
 					undoLel->tree = execution.lhs;
 				}
 			}
diff --git a/colm/pdarun.h b/colm/pdarun.h
index c78538de..ebb2bf89 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -40,7 +40,6 @@ struct FsmTables;
 struct Alg
 {
 	/* Parsing algorithm. */
-	Tree *parsed;
 	long state;
 	long region;
 	char causeReduce;
-- 
cgit v1.2.1


From 23c9f212b2cee0868905b1b2ea2c8c312a74c964 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 12 Nov 2008 20:52:12 +0000
Subject: Be a bit more careful about when we save and restore the original lhs
 parse tree. Doesn't impact memory usage much in the C++ parser unfortunately.

---
 colm/bytecode.cpp | 16 +++++++++++++
 colm/bytecode.h   |  5 ++++
 colm/compile.cpp  | 68 ++++++++++++++++++++++++++++++++++++++++---------------
 colm/parsedata.h  |  4 +++-
 colm/parsetree.h  |  7 ++++++
 colm/pdarun.cpp   | 18 ++++++---------
 6 files changed, 88 insertions(+), 30 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 76ba7a0a..1e0fa95b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -407,6 +407,7 @@ Execution::Execution( Program *prg, CodeVect &reverseCode,
 	code(code), 
 	frame(0), iframe(0),
 	lhs(lhs),
+	parsed(0),
 	matchText(matchText),
 	reject(false), 
 	reverseCode(reverseCode),
@@ -711,6 +712,21 @@ void Execution::execute( Tree **&sp, Code *instr )
 {
 again:
 	switch ( *instr++ ) {
+		case IN_SAVE_LHS: {
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_SAVE_LHS" << endl;
+			#endif
+
+			assert( lhs != 0 );
+
+			/* Save and upref before writing. We don't generate a restore
+			 * here. Instead in the parser we will check if it actually
+			 * changed and insert the instruction then. The presence of this
+			 * instruction here is just a conservative approximation.  */
+			parsed = lhs;
+			tree_upref( parsed );
+			break;
+		}
 		case IN_RESTORE_LHS: {
 			Tree *restore;
 			read_tree( restore );
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 9060d2da..9e0d4b73 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -37,6 +37,7 @@ using std::ostream;
 typedef unsigned long ulong;
 typedef unsigned char uchar;
 
+#define IN_SAVE_LHS              0xc1
 #define IN_RESTORE_LHS           0xc0
 
 #define IN_LOAD_INT              0x01
@@ -662,7 +663,11 @@ struct Execution
 	Code *code;
 	Tree **frame;
 	Tree **iframe;
+
+	/* The left hand side passed in and the saved left hand side in case we
+	 * need to preserve it for backtracking before we write to it. */
 	Tree *lhs;
+	Tree *parsed;
 
 	Head *matchText;
 	bool reject;
diff --git a/colm/compile.cpp b/colm/compile.cpp
index 269b73ba..74449095 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -679,6 +679,10 @@ ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code ) const
 	/* Note that we could have modified children. */
 	lookup.objField->refActive = true;
 
+	/* Whenever we take a reference we have to assume writing and that the
+	 * tree is dirty. */
+	lookup.objField->dirtyTree = true;
+
 	if ( lookup.objField->typeRef->iterDef != 0 ) {
 		code.append( lookup.objField->typeRef->iterDef->inRefFromCur );
 		code.appendHalf( lookup.objField->offset );
@@ -1285,6 +1289,9 @@ void LangVarRef::assignValue( ParseData *pd, CodeVect &code,
 	if ( lookup.objField->isConst )
 		error(loc) << "field \"" << name << "\" is const" << endp;
 
+	/* Writing guarantees the field is dirty. tree is dirty. */
+	lookup.objField->dirtyTree = true;
+
 	/* Check the types of the assignment and possibly cast. */
 	UniqueType *objUT = lookup.objField->typeRef->lookupType( pd );
 	assert( lookup.uniqueType == lookup.objField->typeRef->lookupType( pd ) );
@@ -1717,22 +1724,6 @@ void ParseData::addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList )
 	}
 }
 
-void ParseData::addProdRHSLoads( Definition *prod, long codeInsertPos, CodeVect &code )
-{
-	CodeVect loads;
-	long position = 0;
-	for ( ProdElList::Iter rhsEl = *prod->prodElList; rhsEl.lte(); rhsEl++, position++ ) {
-		if ( rhsEl->type == PdaFactor::ReferenceType ) {
-			if ( rhsEl->objField->beenReferenced ) {
-				loads.append ( IN_INIT_RHS_EL );
-				loads.appendHalf( position );
-				loads.appendHalf( rhsEl->objField->offset );
-			}
-		}
-	}
-	code.insert( codeInsertPos, loads );
-}
-
 void ParseData::addMatchLength( ObjectDef *frame, KlangEl *lel )
 {
 	/* Make the type ref. */
@@ -1931,6 +1922,42 @@ void ParseData::findLocalTrees( CharSet &trees )
 	}
 }
 
+void ParseData::addSaveLHS( Definition *prod, CodeVect &code, long &insertPos )
+{
+	CodeBlock *block = prod->redBlock;
+
+	/* If the lhs tree is dirty then we will need to save off the old lhs
+	 * before it gets modified. We want to avoid this for attribute
+	 * modifications. The computation of dirtyTree should deal with this for
+	 * us. */
+	ObjFieldMapEl *lhsFieldMapEl = block->localFrame->objFieldMap->find("lhs");
+	assert( lhsFieldMapEl != 0 );
+	ObjField *lhsField = lhsFieldMapEl->value;
+
+	if ( lhsField->dirtyTree )
+		code.insert( insertPos, IN_SAVE_LHS );
+}
+
+void ParseData::addProdRHSLoads( Definition *prod, CodeVect &code, long &insertPos )
+{
+	CodeVect loads;
+	long elPos = 0;
+	for ( ProdElList::Iter rhsEl = *prod->prodElList; rhsEl.lte(); rhsEl++, elPos++ ) {
+		if ( rhsEl->type == PdaFactor::ReferenceType ) {
+			if ( rhsEl->objField->beenReferenced ) {
+				loads.append ( IN_INIT_RHS_EL );
+				loads.appendHalf( elPos );
+				loads.appendHalf( rhsEl->objField->offset );
+			}
+		}
+	}
+
+	/* Insert and update the insert position. */
+	code.insert( insertPos, loads );
+	insertPos += loads.length();
+}
+
+
 void ParseData::compileReductionCode( Definition *prod )
 {
 	CodeBlock *block = prod->redBlock;
@@ -1947,7 +1974,7 @@ void ParseData::compileReductionCode( Definition *prod )
 	 * frame size yet. We will fill it in later. */
 	code.append( IN_INIT_LOCALS );
 	code.appendHalf( 0 );
-	long afterAllocFrame = code.length();
+	long afterInit = code.length();
 
 	/* Compile the reduce block. */
 	block->compile( this, code );
@@ -1956,7 +1983,12 @@ void ParseData::compileReductionCode( Definition *prod )
 	long frameSize = curLocalFrame->size();
 	code.setHalf( 1, frameSize );
 
-	addProdRHSLoads( prod, afterAllocFrame, code );
+	/* Might need to preserve the LHS for backtracking. The afterInit 
+	 * var may be updated by this call. */
+	addSaveLHS( prod, code, afterInit );
+
+	/* Might need to load right hand side values. */
+	addProdRHSLoads( prod, code, afterInit );
 
 	code.append( IN_POP_LOCALS );
 	code.appendHalf( block->frameId );
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 4d6cce79..9bf464b4 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -680,11 +680,13 @@ struct ParseData
 	void addMatchText( ObjectDef *frame, KlangEl *lel );
 	void addMatchLength( ObjectDef *frame, KlangEl *lel );
 	void addTransTokVar( ObjectDef *frame, KlangEl *lel );
-	void addProdRHSLoads( Definition *prod, long pos, CodeVect &code );
 	void addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList );
 	void addProdRedObjectVar( ObjectDef *localFrame, KlangEl *langEl );
 	void addProdObjects();
 
+	void addSaveLHS( Definition *prod, CodeVect &code, long &insertPos );
+	void addProdRHSLoads( Definition *prod, CodeVect &code, long &insertPos );
+
 	void prepGrammar();
 
 	void makePatternParsers();
diff --git a/colm/parsetree.h b/colm/parsetree.h
index b25a691c..08773cce 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1187,6 +1187,7 @@ struct ObjField
 		isConst(false), 
 		isLhsEl(false), isRhsEl(false), 
 		refActive(false),
+		dirtyTree(false),
 		inGetR( IN_HALT ),
 		inGetWC( IN_HALT ),
 		inGetWV( IN_HALT ),
@@ -1206,6 +1207,12 @@ struct ObjField
 	bool isLhsEl;
 	bool isRhsEl;
 	bool refActive;
+	
+	/* True if some aspect of the tree has possibly been written to. This does
+	 * not include attributes. This is here so we can optimize the storage of
+	 * old lhs vars. If only a lhs attribute changes we don't need to preserve
+	 * the original for backtracking. */
+	bool dirtyTree;
 
 	Code inGetR;
 	Code inGetWC;
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 1396bc35..4ae6b550 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -159,7 +159,7 @@ void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&rcode, long &caus
 head:
 	/* Commit */
 	#ifdef COLM_LOG_PARSE
-	cerr << "commit visiting: " << 
+	cerr << "commit: visiting " << 
 			parser->prg->rtd->lelInfo[lel->tree->id].name << endl;
 	#endif
 
@@ -444,11 +444,6 @@ again:
 			Execution execution( prg, reverseCode, 
 					this, fi->codeWV, redLel->tree, 0 );
 
-			/* Take a copy of the lhs and store it in alg. May need it during
-			 * reverse parsing. */
-			Tree *parsed = redLel->tree;
-			tree_upref( parsed );
-
 			/* Execute it. */
 			execution.execute( root );
 
@@ -456,21 +451,22 @@ again:
 			 * while in the environment. */
 			redLel->tree = execution.lhs;
 
-			/* If the lhs changed then store the original, otherwise downref
-			 * since we took a copy above. */
-			if ( parsed != redLel->tree ) {
+			/* If the lhs was saved and it changed then we need to restore the
+			 * original upon backtracking, otherwise downref since we took a
+			 * copy above. */
+			if ( execution.parsed != 0 && execution.parsed != redLel->tree ) {
 				#ifdef COLM_LOG_PARSE
 				cerr << "lhs tree was modified, adding a restore instruction" << endl;
 				#endif
 
 				reverseCode.append( IN_RESTORE_LHS );
-				reverseCode.appendWord( (Word)parsed );
+				reverseCode.appendWord( (Word)execution.parsed );
 				reverseCode.append( 5 );
 			}
 			else {
 				/* No change in the the lhs. Just free the parsed copy we
 				 * took. */
-				tree_downref( prg, root, parsed );
+				tree_downref( prg, root, execution.parsed );
 			}
 
 			/* Pull out the reverse code, if any. */
-- 
cgit v1.2.1


From 033085573132f2b64744183316a09d5b75d70a8f Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 13 Nov 2008 04:29:57 +0000
Subject: Warning and error fixes for compiling with g++ 4.3.2.

---
 aapl/astring.h     | 1 +
 colm/bytecode.cpp  | 2 +-
 colm/keyops.h      | 2 +-
 colm/parsedata.cpp | 6 +++---
 colm/redbuild.cpp  | 2 +-
 colm/tree.cpp      | 2 +-
 6 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/aapl/astring.h b/aapl/astring.h
index 251e9139..59343726 100644
--- a/aapl/astring.h
+++ b/aapl/astring.h
@@ -26,6 +26,7 @@
 #include <stdlib.h>
 #include <stdarg.h>
 #include <stdio.h>
+#include <string.h>
 #include <iostream>
 #include <assert.h>
 
diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 1e0fa95b..2d32dac4 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -194,7 +194,7 @@ void downref_local_trees( Program *prg, Tree **sp, Tree **frame, char *trees, lo
 		cerr << "local tree downref: " << (long)trees[i] << endl;
 		#endif
 
-		tree_downref( prg, sp, local(trees[i]) );
+		tree_downref( prg, sp, local((long)trees[i]) );
 	}
 }
 
diff --git a/colm/keyops.h b/colm/keyops.h
index c9828cfd..8fb9b86b 100644
--- a/colm/keyops.h
+++ b/colm/keyops.h
@@ -192,7 +192,7 @@ struct KeyOps
 	HostType *typeSubsumes( bool isSigned, long long maxVal )
 	{
 		for ( int i = 0; i < hostLang->numHostTypes; i++ ) {
-			if ( ( isSigned && hostLang->hostTypes[i].isSigned || !isSigned ) &&
+			if ( ( (isSigned && hostLang->hostTypes[i].isSigned) || !isSigned ) &&
 					maxVal <= hostLang->hostTypes[i].maxVal )
 				return hostLang->hostTypes + i;
 		}
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 96ba9b7d..7b54c7c2 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -79,7 +79,7 @@ Key makeFsmKeyHex( char *str, const InputLoc &loc, ParseData *pd )
 
 	unsigned long ul = strtoul( str, 0, 16 );
 
-	if ( errno == ERANGE || unusedBits && ul >> (size * 8) ) {
+	if ( errno == ERANGE || (unusedBits && ul >> (size * 8)) ) {
 		error(loc) << "literal " << str << " overflows the alphabet type" << endl;
 		ul = 1 << (size * 8);
 	}
@@ -101,12 +101,12 @@ Key makeFsmKeyDec( char *str, const InputLoc &loc, ParseData *pd )
 	long long ll = strtoll( str, 0, 10 );
 
 	/* Check for underflow. */
-	if ( errno == ERANGE && ll < 0 || ll < minVal) {
+	if ( (errno == ERANGE && ll < 0) || ll < minVal) {
 		error(loc) << "literal " << str << " underflows the alphabet type" << endl;
 		ll = minVal;
 	}
 	/* Check for overflow. */
-	else if ( errno == ERANGE && ll > 0 || ll > maxVal ) {
+	else if ( (errno == ERANGE && ll > 0) || ll > maxVal ) {
 		error(loc) << "literal " << str << " overflows the alphabet type" << endl;
 		ll = maxVal;
 	}
diff --git a/colm/redbuild.cpp b/colm/redbuild.cpp
index b1789460..e7be055b 100644
--- a/colm/redbuild.cpp
+++ b/colm/redbuild.cpp
@@ -517,7 +517,7 @@ void RedFsmBuild::makeStateList()
 
 	for ( StateList::Iter st = fsm->stateList; st.lte(); st++ ) {
 		/* Both or neither should be set. */
-		assert( !( st->eofTarget != 0 xor st->eofActionTable.length() > 0 ) );
+		assert( !( (st->eofTarget != 0) xor (st->eofActionTable.length() > 0) ) );
 
 		makeStateActions( st );
 		makeStateConditions( st );
diff --git a/colm/tree.cpp b/colm/tree.cpp
index bb38ed6a..43e2e285 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -356,7 +356,7 @@ bool test_false( Program *prg, Tree *tree )
 	bool flse = ( 
 		tree == 0 ||
 		tree == prg->falseVal ||
-		tree->id == LEL_ID_INT && ((Int*)tree)->value == 0 );
+		( tree->id == LEL_ID_INT && ((Int*)tree)->value == 0 ) );
 	return flse;
 }
 
-- 
cgit v1.2.1


From fa33e4c69e6ef97dfc935d2e407054736ae6b292 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 20 Nov 2008 18:56:25 +0000
Subject: Added some comments for the AF_ flags. Changed AF_GENERATED to
 AF_TERM_DUP to better reflect the flag's meaning. Added a flags variable into
 tree and all the structures that overlay it. Not growing the structure
 though, just shrinking the id field instead.

---
 colm/bytecode.h   |  19 ++++++-
 colm/config.h.in  |   9 ----
 colm/pdabuild.cpp |   2 +-
 colm/pdarun.cpp   |  14 ++---
 colm/pdarun.h     | 155 ++++++++++++++++++++++++++++++------------------------
 5 files changed, 111 insertions(+), 88 deletions(-)

diff --git a/colm/bytecode.h b/colm/bytecode.h
index 9e0d4b73..9b9c5d5b 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -246,11 +246,28 @@ typedef unsigned char uchar;
 #define LEL_ID_STR    4
 #define LEL_ID_STREAM 5
 
-#define AF_GENERATED   0x1
+/*
+ * Flags
+ */
+
+/* A tree that has been generated by a termDup. */
+#define AF_TERM_DUP    0x1
+
+/* Has been processed by the commit function. All children have also been
+ * processed. */
 #define AF_COMMITTED   0x2
+
+/* Created by a token generation action, not made from the input. */
 #define AF_ARTIFICIAL  0x4
+
+/* Named node from a pattern or constructor. */
 #define AF_NAMED       0x8
+
+/* Member of a group of tokens generated by a token generation action. Grouped
+ * tokens must be sent back to the scanner together. */
 #define AF_GROUP_MEM   0x10
+
+/* There is reverse code associated with this tree node. */
 #define AF_HAS_RCODE   0x20
 
 /*
diff --git a/colm/config.h.in b/colm/config.h.in
index 4dc1ce02..98b87759 100644
--- a/colm/config.h.in
+++ b/colm/config.h.in
@@ -22,15 +22,6 @@
 #ifndef _CONFIG_H
 #define _CONFIG_H
 
-/* Programs. */
-#undef GDC
-#undef GOBJC
-#undef CXX
-#undef CC
-#undef JAVAC
-#undef TXL
-#undef RUBY
-
 /* Configuration */
 #undef COLM_LOG
 #undef COLM_LOG_BYTECODE
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index a95399c9..cfe69546 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1429,7 +1429,7 @@ void fillNodes( Program *prg, Bindings &bindings, long &bindId,
 			ignore = ignore->next;
 		}
 
-		node.stop = kid->tree->alg->flags & AF_GENERATED;
+		node.stop = kid->tree->alg->flags & AF_TERM_DUP;
 
 		/* Recurse. */
 		fillNodes( prg, bindings, bindId, nodes, child );
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 4ae6b550..50b8b90f 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -200,7 +200,7 @@ head:
 	 * belonging to a nonterminal that caused previous reductions. */
 	if ( causeReduce > 0 && 
 			tree->id >= parser->tables->rtd->firstNonTermId &&
-			!(alg->flags & AF_GENERATED) )
+			!(alg->flags & AF_TERM_DUP) )
 	{
 		causeReduce -= 1;
 
@@ -225,8 +225,8 @@ head:
 	}
 	alg->flags |= AF_COMMITTED;
 
-	/* Recurse only on non-generated trees. */
-	if ( !(alg->flags & AF_GENERATED) && tree_child( parser->prg, tree ) != 0 ) {
+	/* Do not recures on trees that are terminal dups. */
+	if ( !(alg->flags & AF_TERM_DUP) && tree_child( parser->prg, tree ) != 0 ) {
 		vm_push( (Tree*)lel );
 		lel = tree_child( parser->prg, tree );
 
@@ -345,7 +345,7 @@ again:
 				tables->rtd->lelInfo[lel->tree->id].termDupId > 0 )
 		{
 			lel->tree->id = tables->rtd->lelInfo[lel->tree->id].termDupId;
-			lel->tree->alg->flags |= AF_GENERATED;
+			lel->tree->alg->flags |= AF_TERM_DUP;
 		}
 
 		if ( action[1] == 0 )
@@ -561,7 +561,7 @@ parseError:
 		/* Either we are dealing with a terminal that was
 		 * shifted or a nonterminal that was reduced. */
 		if ( stackTop->tree->id < tables->rtd->firstNonTermId || 
-				(stackTop->tree->alg->flags & AF_GENERATED) )
+				(stackTop->tree->alg->flags & AF_TERM_DUP) )
 		{
 			#ifdef COLM_LOG_PARSE
 			cerr << "backing up over effective terminal: " <<
@@ -572,9 +572,9 @@ parseError:
 			stackTop = stackTop->next;
 
 			/* Undo the translation from termDup. */
-			if ( undoLel->tree->alg->flags & AF_GENERATED ) {
+			if ( undoLel->tree->alg->flags & AF_TERM_DUP ) {
 				undoLel->tree->id = tables->rtd->lelInfo[undoLel->tree->id].termDupId;
-				undoLel->tree->alg->flags &= ~AF_GENERATED;
+				undoLel->tree->alg->flags &= ~AF_TERM_DUP;
 			}
 
 			/* Queue it as next input item. */
diff --git a/colm/pdarun.h b/colm/pdarun.h
index ebb2bf89..fb769c9c 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -36,6 +36,7 @@ struct FsmRun;
 struct KlangEl;
 struct PdaTables;
 struct FsmTables;
+struct InputStream;
 
 struct Alg
 {
@@ -57,10 +58,17 @@ struct Kid
 	Kid *next;
 };
 
+struct Ref
+{
+	Kid *kid;
+	Ref *next;
+};
+
 struct Tree
 {
-	/* First three must be overlaid. */
-	long id;
+	/* First four will be overlaid in other structures. */
+	short id;
+	unsigned short flags;
 	long refs;
 	Kid *child;
 
@@ -68,16 +76,11 @@ struct Tree
 	Alg *alg;
 };
 
-struct Ref
-{
-	Kid *kid;
-	Ref *next;
-};
-
 struct Int
 {
-	/* Must overlay over Tree. */
-	long id;
+	/* Must overlay Tree. */
+	short id;
+	unsigned short flags;
 	long refs;
 	Kid *child;
 
@@ -86,8 +89,9 @@ struct Int
 
 struct Pointer
 {
-	/* Must overlay over Tree. */
-	long id;
+	/* Must overlay Tree. */
+	short id;
+	unsigned short flags;
 	long refs;
 	Kid *child;
 
@@ -96,64 +100,18 @@ struct Pointer
 
 struct Str
 {
-	/* Must overlay over Tree. */
-	long id;
+	/* Must overlay Tree. */
+	short id;
+	unsigned short flags;
 	long refs;
 	Kid *child;
 
 	Head *value;
 };
 
-struct TreeIter
-{
-	TreeIter( const Ref &rootRef, int searchId, Tree **stackRoot ) : 
-		rootRef(rootRef), searchId(searchId), 
-		stackRoot(stackRoot), stackSize(0)
-	{
-		ref.kid = 0;
-		ref.next = 0;
-	}
-	
-	Ref rootRef;
-	Ref ref;
-	long searchId;
-	Tree **stackRoot;
-	long stackSize;
-};
-
-struct FunctionInfo
-{
-	const char *name;
-	long frameId;
-	long argSize;
-	long ntrees;
-	long frameSize;
-};
-
-struct UserIter
-{
-	UserIter( Tree **stackRoot, long argSize, long searchId ) : 
-		stackRoot(stackRoot), 
-		argSize(argSize), stackSize(0),
-		resume(0), frame(0), searchId(searchId)
-	{
-		ref.kid = 0;
-		ref.next = 0;
-	}
-		
-	/* The current item. */
-	Ref ref;
-	Tree **stackRoot;
-	long argSize;
-	long stackSize;
-	Code *resume;
-	Tree **frame;
-	long searchId;
-};
-
 struct ListEl
 {
-	/* Must overlay over kid. */
+	/* Must overlay kid. */
 	Tree *value;
 	ListEl *next;
 	ListEl *prev;
@@ -165,8 +123,9 @@ struct ListEl
 
 struct List
 {
-	/* Must overlay over tree. */
-	long id;
+	/* Must overlay Tree. */
+	short id;
+	unsigned short flags;
 	long refs;
 	ListEl *head;
 
@@ -190,6 +149,7 @@ struct List
 
 struct MapEl
 {
+	/* Must overlay Kid. */
 	Tree *tree;
 	MapEl *next;
 	MapEl *prev;
@@ -204,8 +164,9 @@ struct MapEl
 
 struct Map
 {
-	/* Must overlay over Tree. */
-	long id;
+	/* Must overlay Tree. */
+	short id;
+	unsigned short flags;
 	long refs;
 	MapEl *head;
 
@@ -281,12 +242,11 @@ struct Map
 	void attachRebal( MapEl *element, MapEl *parentEl, MapEl *lastLess );
 };
 
-struct InputStream;
-
 struct Stream
 {
-	/* Must overlay over Tree. */
-	long id;
+	/* Must overlay Tree. */
+	short id;
+	unsigned short flags;
 	long refs;
 	Kid *child;
 
@@ -295,6 +255,61 @@ struct Stream
 	FsmRun *scanner;
 };
 
+/*
+ * Iterators.
+ */
+
+struct TreeIter
+{
+	TreeIter( const Ref &rootRef, int searchId, Tree **stackRoot ) : 
+		rootRef(rootRef), searchId(searchId), 
+		stackRoot(stackRoot), stackSize(0)
+	{
+		ref.kid = 0;
+		ref.next = 0;
+	}
+	
+	Ref rootRef;
+	Ref ref;
+	long searchId;
+	Tree **stackRoot;
+	long stackSize;
+};
+
+struct FunctionInfo
+{
+	const char *name;
+	long frameId;
+	long argSize;
+	long ntrees;
+	long frameSize;
+};
+
+struct UserIter
+{
+	UserIter( Tree **stackRoot, long argSize, long searchId ) : 
+		stackRoot(stackRoot), 
+		argSize(argSize), stackSize(0),
+		resume(0), frame(0), searchId(searchId)
+	{
+		ref.kid = 0;
+		ref.next = 0;
+	}
+		
+	/* The current item. */
+	Ref ref;
+	Tree **stackRoot;
+	long argSize;
+	long stackSize;
+	Code *resume;
+	Tree **frame;
+	long searchId;
+};
+
+/*
+ * Program Data.
+ */
+
 struct PatReplInfo
 {
 	long offset;
-- 
cgit v1.2.1


From 478bc4d7e154e06269d33576432d9e49151131ee Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 21 Nov 2008 16:30:30 +0000
Subject: Start on the movement of algorithm data back to the tree structure.
 Use a flag to indicate that a tree came out of the parser. We can no longer
 rely on the alg pointer being set to determine this.

---
 colm/bytecode.cpp | 11 +++++++----
 colm/bytecode.h   |  4 ++++
 colm/pdarun.h     |  8 ++++++++
 3 files changed, 19 insertions(+), 4 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 2d32dac4..0e05ea97 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -81,10 +81,10 @@ using std::endl;
 
 void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 {
-	/* If the tree already has an alg (it has been parsed) then we need to
-	 * send a copy of it because the parsing that we are about to do requires
-	 * a fresh alg. */
-	if ( tree->alg != 0 ) {
+	/* If the tree was produced by a parsing function then we need to send a
+	 * copy of it because the parsing that we are about to do requires fresh
+	 * parsing algorithm data. */
+	if ( tree->flags & AF_PARSED ) {
 		#ifdef COLM_LOG_BYTECODE
 		cerr << "copying tree in send because alg is set" << endl;
 		#endif
@@ -134,6 +134,9 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 		cv = 0;
 	}
 
+	/* Indicate that this tree came out of a parser. */
+	tree->flags |= AF_PARSED;
+
 	return tree;
 }
 
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 9b9c5d5b..0fe40921 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -270,6 +270,10 @@ typedef unsigned char uchar;
 /* There is reverse code associated with this tree node. */
 #define AF_HAS_RCODE   0x20
 
+/* Tree was produced by a parse routine. This means the data fields for
+ * managing parsing fields will be active. */
+#define AF_PARSED      0x40
+
 /*
  * Call stack.
  */
diff --git a/colm/pdarun.h b/colm/pdarun.h
index fb769c9c..27d15a4a 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -73,7 +73,15 @@ struct Tree
 	Kid *child;
 
 	Head *tokdata;
+
 	Alg *alg;
+
+	/* Parsing algorithm. */
+	long state;
+	long region;
+	char causeReduce;
+	char retry_lower;
+	char retry_upper;
 };
 
 struct Int
-- 
cgit v1.2.1


From 1d941596a7dd116d8b5a2d403da7c3929f3e0254 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 21 Nov 2008 19:26:50 +0000
Subject: Moved the fields from the Alg structure into Tree.

---
 colm/bytecode.cpp |   5 +--
 colm/fsmrun.cpp   |  37 ++++++----------
 colm/pdabuild.cpp |  14 +++---
 colm/pdarun.cpp   | 129 +++++++++++++++++++++++++++++-------------------------
 colm/pdarun.h     |   2 -
 colm/tree.cpp     |  10 ++---
 6 files changed, 95 insertions(+), 102 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 0e05ea97..539a5797 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -93,13 +93,10 @@ void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 		tree_upref( tree );
 	}
 
-	assert( tree->alg == 0 );
-	tree->alg = prg->algPool.allocate();
-
 	if ( tree->id >= prg->rtd->firstNonTermId )
 		tree->id = prg->rtd->lelInfo[tree->id].termDupId;
 
-	tree->alg->flags |= AF_ARTIFICIAL;
+	tree->flags |= AF_ARTIFICIAL;
 
 	/* FIXME: Do we need to remove the ignore tokens 
 	 * at this point? Will it cause a leak? */
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 8c6b3aed..abd77b51 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -189,9 +189,7 @@ void FsmRun::sendBackText( const char *data, long length )
 
 void FsmRun::queueBack( Kid *input )
 {
-	Alg *alg = input->tree->alg;
-
-	if ( alg->flags & AF_GROUP_MEM ) {
+	if ( input->tree->flags & AF_GROUP_MEM ) {
 		#ifdef COLM_LOG_PARSE
 		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
 		cerr << "queuing back: " << lelInfo[input->tree->id].name << endl;
@@ -245,21 +243,19 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 		#endif
 
 		Head *head = ignore->tree->tokdata;
-		bool artificial = ignore->tree->alg != 0 && 
-				ignore->tree->alg->flags & AF_ARTIFICIAL;
+		bool artificial = ignore->tree->flags & AF_ARTIFICIAL;
 
 		if ( head != 0 && !artificial )
 			sendBackText( string_data( head ), head->length );
 
 		/* Check for reverse code. */
-		Alg *alg = ignore->tree->alg;
-		if ( alg != 0 && alg->flags & AF_HAS_RCODE ) {
+		if ( ignore->tree->flags & AF_HAS_RCODE ) {
 			Execution execution( prg, parser->reverseCode, 
 					parser, 0, 0, 0 );
 
 			/* Do the reverse exeuction. */
 			execution.rexecute( parser->root, parser->allReverseCode );
-			alg->flags &= ~AF_HAS_RCODE;
+			ignore->tree->flags &= ~AF_HAS_RCODE;
 		}
 
 		ignore = ignore->next;
@@ -271,13 +267,12 @@ void FsmRun::sendBack( Kid *input )
 	#ifdef COLM_LOG_PARSE
 	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
 	cerr << "sending back: " << lelInfo[input->tree->id].name;
-	if ( input->tree->alg->flags & AF_ARTIFICIAL )
+	if ( input->tree->flags & AF_ARTIFICIAL )
 		cerr << " (artificial)";
 	cerr << endl;
 	#endif
 
-	Alg *alg = input->tree->alg;
-	if ( alg->flags & AF_NAMED ) {
+	if ( input->tree->flags & AF_NAMED ) {
 		/* Send back anything that is in the buffer. */
 		inputStream->pushBack( p, pe-p );
 		p = pe = runBuf->buf;
@@ -287,20 +282,20 @@ void FsmRun::sendBack( Kid *input )
 		inputStream->pushBackNamed();
 	}
 
-	if ( !(alg->flags & AF_ARTIFICIAL) ) {
+	if ( !(input->tree->flags & AF_ARTIFICIAL) ) {
 		/* Push back the token data. */
 		sendBackText( string_data( input->tree->tokdata ), 
 				string_length( input->tree->tokdata ) );
 	}
 
 	/* Check for reverse code. */
-	if ( alg->flags & AF_HAS_RCODE ) {
+	if ( input->tree->flags & AF_HAS_RCODE ) {
 		Execution execution( prg, parser->reverseCode, 
 				parser, 0, 0, 0 );
 
 		/* Do the reverse exeuction. */
 		execution.rexecute( parser->root, parser->allReverseCode );
-		alg->flags &= ~AF_HAS_RCODE;
+		input->tree->flags &= ~AF_HAS_RCODE;
 	}
 
 	/* Always push back the ignore text. */
@@ -355,7 +350,7 @@ void set_AF_GROUP_MEM( PdaRun *parser )
 		/* Only bother with non-ignore tokens. */
 		if ( !lelInfo[queued->tree->id].ignore ) {
 			if ( sendCount > 0 )
-				queued->tree->alg->flags |= AF_GROUP_MEM;
+				queued->tree->flags |= AF_GROUP_MEM;
 			sendCount += 1;
 		}
 		queued = queued->next;
@@ -465,11 +460,8 @@ void execute_generation_action( Program *prg, PdaRun *parser, Code *code, Head *
 	 * token. */
 	Tree *tree = parser->queue->tree;
 	bool hasrcode = make_reverse_code( parser->allReverseCode, parser->reverseCode );
-	if ( hasrcode ) {
-		if ( tree->alg == 0 )
-			tree->alg = prg->algPool.allocate();
-		tree->alg->flags |= AF_HAS_RCODE;
-	}
+	if ( hasrcode )
+		tree->flags |= AF_HAS_RCODE;
 
 	/* Mark generated tokens as belonging to a group. */
 	set_AF_GROUP_MEM( parser );
@@ -510,10 +502,9 @@ Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 	Kid *input = 0;
 	input = prg->kidPool.allocate();
 	input->tree = prg->treePool.allocate();
-	input->tree->alg = prg->algPool.allocate();
 
 	if ( namedLangEl )
-		input->tree->alg->flags |= AF_NAMED;
+		input->tree->flags |= AF_NAMED;
 
 	input->tree->refs = 1;
 	input->tree->id = id;
@@ -694,7 +685,6 @@ void FsmRun::sendEOF( )
 
 	Kid *input = prg->kidPool.allocate();
 	input->tree = prg->treePool.allocate();
-	input->tree->alg = prg->algPool.allocate();
 
 	input->tree->refs = 1;
 	input->tree->id = parser->tables->rtd->eofId;
@@ -770,7 +760,6 @@ long PdaRun::undoParse( Tree *tree, CodeVect *rev )
 
 	assert( stackTop->next == 0 );
 
-	prg->algPool.free( stackTop->tree->alg );
 	prg->treePool.free( stackTop->tree );
 	prg->kidPool.free( stackTop );
 	return 0;
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index cfe69546..58ccb220 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1385,7 +1385,7 @@ void ParseData::makeRuntimeData()
 void mapNodes( Program *prg, int &count, Kid *kid )
 {
 	if ( kid != 0 ) {
-		kid->tree->alg->state = count++;
+		kid->tree->state = count++;
 
 		Kid *ignore = tree_ignore( prg, kid->tree );
 		while ( tree_is_ignore( prg, ignore ) ) {
@@ -1401,15 +1401,15 @@ void fillNodes( Program *prg, Bindings &bindings, long &bindId,
 		PatReplNode *nodes, Kid *kid )
 {
 	if ( kid != 0 ) {
-		long ind = kid->tree->alg->state;
+		long ind = kid->tree->state;
 		PatReplNode &node = nodes[ind++];
 
 		Kid *child = tree_child( prg, kid->tree );
 
 		/* Set up the fields. */
 		node.id = kid->tree->id;
-		node.child = child == 0 ? -1 : child->tree->alg->state;
-		node.next = kid->next == 0 ? -1 : kid->next->tree->alg->state;
+		node.child = child == 0 ? -1 : child->tree->state;
+		node.next = kid->next == 0 ? -1 : kid->next->tree->state;
 		node.length = string_length( kid->tree->tokdata );
 		node.data = string_data( kid->tree->tokdata );
 
@@ -1429,7 +1429,7 @@ void fillNodes( Program *prg, Bindings &bindings, long &bindId,
 			ignore = ignore->next;
 		}
 
-		node.stop = kid->tree->alg->flags & AF_TERM_DUP;
+		node.stop = kid->tree->flags & AF_TERM_DUP;
 
 		/* Recurse. */
 		fillNodes( prg, bindings, bindId, nodes, child );
@@ -1469,7 +1469,7 @@ void ParseData::fillInPatterns( Program *prg )
 
 	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
 		runtimeData->patReplInfo[pat->patRepId].offset = 
-				pat->pdaRun->stackTop->next->tree->alg->state;
+				pat->pdaRun->stackTop->next->tree->state;
 
 		/* BindIds are indexed base one. */
 		runtimeData->patReplInfo[pat->patRepId].numBindings = 
@@ -1483,7 +1483,7 @@ void ParseData::fillInPatterns( Program *prg )
 
 	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
 		runtimeData->patReplInfo[repl->patRepId].offset = 
-				repl->pdaRun->stackTop->next->tree->alg->state;
+				repl->pdaRun->stackTop->next->tree->state;
 
 		/* BindIds are indexed base one. */
 		runtimeData->patReplInfo[repl->patRepId].numBindings = 
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 50b8b90f..71ca612e 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -90,9 +90,8 @@ void PdaRun::init()
 	/* Init the element allocation variables. */
 	stackTop = prg->kidPool.allocate();
 	stackTop->tree = prg->treePool.allocate();
-	stackTop->tree->alg = prg->algPool.allocate();
 
-	stackTop->tree->alg->state = -1;
+	stackTop->tree->state = -1;
 	stackTop->tree->refs = 1;
 	numRetry = 0;
 	errCount = 0;
@@ -109,12 +108,12 @@ void PdaRun::init()
 long PdaRun::stackTopTarget()
 {
 	long state;
-	if ( stackTop->tree->alg->state < 0 )
+	if ( stackTop->tree->state < 0 )
 		state = tables->startState;
 	else {
 		state = tables->targs[(int)tables->indicies[tables->offsets[
-				stackTop->tree->alg->state] + 
-				(stackTop->tree->id - tables->keys[stackTop->tree->alg->state<<1])]];
+				stackTop->tree->state] + 
+				(stackTop->tree->id - tables->keys[stackTop->tree->state<<1])]];
 	}
 	return state;
 }
@@ -135,7 +134,7 @@ long PdaRun::stackTopTarget()
 
 bool been_committed( Kid *kid )
 {
-	return kid->tree->alg->flags & AF_COMMITTED;
+	return kid->tree->flags & AF_COMMITTED;
 }
 
 Code *backup_over_rcode( Code *rcode )
@@ -151,7 +150,6 @@ Code *backup_over_rcode( Code *rcode )
  * linked left-to-right. */
 void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&rcode, long &causeReduce )
 {
-	Alg *alg = 0;
 	Tree *tree = 0;
 	Tree **sp = root;
 	Tree *restore = 0;
@@ -165,21 +163,20 @@ head:
 
 	/* Load up the parsed tree. */
 	tree = lel->tree;
-	alg = tree->alg;
 
 	/* Check for reverse code. */
 	restore = 0;
-	if ( alg->flags & AF_HAS_RCODE ) {
+	if ( tree->flags & AF_HAS_RCODE ) {
 		/* If tree caused some reductions, now is not the right time to backup
 		 * over the reverse code. We need to backup over the reductions first. Store
 		 * the count of the reductions and do it when the count drops to zero. */
-		if ( alg->causeReduce > 0 ) {
+		if ( tree->causeReduce > 0 ) {
 			/* The top reduce block does not correspond to this alg. */
 			#ifdef COLM_LOG_PARSE
 			cerr << "commit: causeReduce found, delaying backup: " << 
-					(long)alg->causeReduce << endl;
+					(long)tree->causeReduce << endl;
 			#endif
-			causeReduce = alg->causeReduce;
+			causeReduce = tree->causeReduce;
 		}
 		else {
 			rcode = backup_over_rcode( rcode );
@@ -193,6 +190,10 @@ head:
 		}
 	}
 
+	/* FIXME: Need to sort out the storage of parse algorithm data. Is it in
+	 * the restored node or the original? This needs to be reconciled with the
+	 * parse and unparse algorithms. */
+
 	if ( restore != 0 )
 		tree = restore;
 
@@ -200,7 +201,7 @@ head:
 	 * belonging to a nonterminal that caused previous reductions. */
 	if ( causeReduce > 0 && 
 			tree->id >= parser->tables->rtd->firstNonTermId &&
-			!(alg->flags & AF_TERM_DUP) )
+			!(tree->flags & AF_TERM_DUP) )
 	{
 		causeReduce -= 1;
 
@@ -215,18 +216,18 @@ head:
 	}
 
 	/* Reset retries. */
-	if ( alg->retry_lower > 0 ) {
+	if ( tree->retry_lower > 0 ) {
 		parser->numRetry -= 1;
-		alg->retry_lower = 0;
+		tree->retry_lower = 0;
 	}
-	if ( alg->retry_upper > 0 ) {
+	if ( tree->retry_upper > 0 ) {
 		parser->numRetry -= 1;
-		alg->retry_upper = 0;
+		tree->retry_upper = 0;
 	}
-	alg->flags |= AF_COMMITTED;
+	tree->flags |= AF_COMMITTED;
 
 	/* Do not recures on trees that are terminal dups. */
-	if ( !(alg->flags & AF_TERM_DUP) && tree_child( parser->prg, tree ) != 0 ) {
+	if ( !(tree->flags & AF_TERM_DUP) && tree_child( parser->prg, tree ) != 0 ) {
 		vm_push( (Tree*)lel );
 		lel = tree_child( parser->prg, tree );
 
@@ -308,9 +309,9 @@ void PdaRun::parseToken( Kid *input )
 	if ( cs < 0 )
 		return;
 
-	input->tree->alg->region = nextRegionInd;
-	input->tree->alg->state = cs;
-	if ( tables->tokenRegions[input->tree->alg->region+1] != 0 )
+	input->tree->region = nextRegionInd;
+	input->tree->state = cs;
+	if ( tables->tokenRegions[input->tree->region+1] != 0 )
 		numRetry += 1;
 
 again:
@@ -328,15 +329,15 @@ again:
 	induceReject = false;
 	targState = tables->targs[pos];
 	action = tables->actions + tables->actInds[pos];
-	if ( lel->tree->alg->retry_lower )
-		action += lel->tree->alg->retry_lower;
+	if ( lel->tree->retry_lower )
+		action += lel->tree->retry_lower;
 
 	if ( *action & act_sb ) {
 		#ifdef COLM_LOG_PARSE
 		cerr << "shifted: " << tables->rtd->lelInfo[lel->tree->id].name;
 		#endif
 		input = input->next;
-		lel->tree->alg->state = cs;
+		lel->tree->state = cs;
 		lel->next = stackTop;
 		stackTop = lel;
 
@@ -345,14 +346,14 @@ again:
 				tables->rtd->lelInfo[lel->tree->id].termDupId > 0 )
 		{
 			lel->tree->id = tables->rtd->lelInfo[lel->tree->id].termDupId;
-			lel->tree->alg->flags |= AF_TERM_DUP;
+			lel->tree->flags |= AF_TERM_DUP;
 		}
 
 		if ( action[1] == 0 )
-			lel->tree->alg->retry_lower = 0;
+			lel->tree->retry_lower = 0;
 		else {
-			lel->tree->alg->retry_lower += 1;
-			assert( lel->tree->alg->retry_upper == 0 );
+			lel->tree->retry_lower += 1;
+			assert( lel->tree->retry_upper == 0 );
 			numRetry += 1; /* FIXME: Has the retry already been counted? */
 			#ifdef COLM_LOG_PARSE
 			cerr << " retry: " << stackTop;
@@ -366,9 +367,8 @@ again:
 	if ( tables->commitLen[pos] != 0 ) {
 		long causeReduce = 0;
 		if ( input != 0 ) { 
-			Alg *alg = input->tree->alg;
-			if ( alg->flags & AF_HAS_RCODE )
-				causeReduce = alg->causeReduce;
+			if ( input->tree->flags & AF_HAS_RCODE )
+				causeReduce = input->tree->causeReduce;
 		}
 		commit_full( this, causeReduce );
 	}
@@ -379,7 +379,7 @@ again:
 		Alg *redAlg;
 
 		if ( input != 0 )
-			input->tree->alg->causeReduce += 1;
+			input->tree->causeReduce += 1;
 
 		redLel = prg->kidPool.allocate();
 		redLel->tree = prg->treePool.allocate();
@@ -391,8 +391,8 @@ again:
 		redLel->next = 0;
 		redAlg->causeReduce = 0;
 		redAlg->retry_lower = 0;
-		redAlg->retry_upper = lel->tree->alg->retry_lower;
-		lel->tree->alg->retry_lower = 0;
+		redAlg->retry_upper = lel->tree->retry_lower;
+		lel->tree->retry_lower = 0;
 
 		/* Allocate the attributes. */
 		objectLength = tables->rtd->lelInfo[redLel->tree->id].objectLength;
@@ -419,7 +419,7 @@ again:
 			redAlg->retry_upper = 0;
 		else {
 			redAlg->retry_upper += 1;
-			assert( lel->tree->alg->retry_lower == 0 );
+			assert( lel->tree->retry_lower == 0 );
 			numRetry += 1;
 			#ifdef COLM_LOG_PARSE
 			cerr << " retry: " << redLel;
@@ -432,7 +432,7 @@ again:
 
 		/* When the production is of zero length we stay in the same state.
 		 * Otherwise we use the state stored in the first child. */
-		targState = rhsLen == 0 ? cs : child->tree->alg->state;
+		targState = rhsLen == 0 ? cs : child->tree->state;
 
 		assert( redLel->tree->refs == 1 );
 
@@ -480,14 +480,21 @@ again:
 		}
 
 		/* Save the algorithm data in the reduced tree. */
-		redLel->tree->alg = redAlg;
+		redLel->tree->state       = redAlg->state;
+		redLel->tree->region      = redAlg->region;
+		redLel->tree->causeReduce = redAlg->causeReduce;
+		redLel->tree->retry_lower = redAlg->retry_lower;
+		redLel->tree->retry_upper = redAlg->retry_upper;
+		redLel->tree->flags       = redAlg->flags;
+
+		prg->algPool.free( redAlg );
 
 		if ( induceReject ) {
 			#ifdef COLM_LOG_PARSE
 			cerr << "error induced during reduction of " <<
 					tables->rtd->lelInfo[redLel->tree->id].name << endl;
 			#endif
-			redLel->tree->alg->state = cs;
+			redLel->tree->state = cs;
 			redLel->next = stackTop;
 			stackTop = redLel;
 			cs = targState;
@@ -513,9 +520,9 @@ parseError:
 
 	while ( 1 ) {
 		if ( input != 0 ) {
-			assert( input->tree->alg->retry_upper == 0 );
+			assert( input->tree->retry_upper == 0 );
 
-			if ( input->tree->alg->retry_lower != 0 ) {
+			if ( input->tree->retry_lower != 0 ) {
 				#ifdef COLM_LOG_PARSE
 				cerr << "found retry targ: " << input << endl;
 				#endif
@@ -524,14 +531,14 @@ parseError:
 				cerr << "found retry: " << input << endl;
 				#endif
 
-				cs = input->tree->alg->state;
+				cs = input->tree->state;
 				goto again;
 			}
 
 			/* If there is no retry and there are no reductions caused by the
 			 * current input token then we are finished with it. Send it back. */
-			if ( input->tree->alg->causeReduce == 0 ) {
-				int next = input->tree->alg->region + 1;
+			if ( input->tree->causeReduce == 0 ) {
+				int next = input->tree->region + 1;
 
 				fsmRun->queueBack( input );
 				input = 0;
@@ -561,7 +568,7 @@ parseError:
 		/* Either we are dealing with a terminal that was
 		 * shifted or a nonterminal that was reduced. */
 		if ( stackTop->tree->id < tables->rtd->firstNonTermId || 
-				(stackTop->tree->alg->flags & AF_TERM_DUP) )
+				(stackTop->tree->flags & AF_TERM_DUP) )
 		{
 			#ifdef COLM_LOG_PARSE
 			cerr << "backing up over effective terminal: " <<
@@ -572,9 +579,9 @@ parseError:
 			stackTop = stackTop->next;
 
 			/* Undo the translation from termDup. */
-			if ( undoLel->tree->alg->flags & AF_TERM_DUP ) {
+			if ( undoLel->tree->flags & AF_TERM_DUP ) {
 				undoLel->tree->id = tables->rtd->lelInfo[undoLel->tree->id].termDupId;
-				undoLel->tree->alg->flags &= ~AF_TERM_DUP;
+				undoLel->tree->flags &= ~AF_TERM_DUP;
 			}
 
 			/* Queue it as next input item. */
@@ -587,18 +594,20 @@ parseError:
 					tables->rtd->lelInfo[stackTop->tree->id].name << endl;
 			#endif
 
+			/* FIXME: Need to reconcile the storage of alg data here. */
+
 			/* Take the alg out of undoLel. */
-			Alg *alg = undoLel->tree->alg;
-			assert( alg != 0 );
-			undoLel->tree->alg = 0;
+			//Alg *alg = undoLel->tree->alg;
+			//assert( alg != 0 );
+			//undoLel->tree->alg = 0;
 
 			/* Check for an execution environment. */
-			if ( alg->flags & AF_HAS_RCODE ) {
+			if ( undoLel->tree->flags & AF_HAS_RCODE ) {
 				Execution execution( prg, reverseCode, this, 0, 0, 0 );
 
 				/* Do the reverse exeuction. */
 				execution.rexecute( root, allReverseCode );
-				alg->flags &= ~AF_HAS_RCODE;
+				undoLel->tree->flags &= ~AF_HAS_RCODE;
 
 				if ( execution.lhs != 0 ) {
 					/* Get the lhs, it may have been reverted. */
@@ -632,26 +641,26 @@ parseError:
 			/* If there is an input queued, this is one less reduction it has
 			 * caused. */
 			if ( input != 0 )
-				input->tree->alg->causeReduce -= 1;
+				input->tree->causeReduce -= 1;
 
-			if ( alg->retry_upper != 0 ) {
+			if ( undoLel->tree->retry_upper != 0 ) {
 				/* There is always an input item here because reduce
 				 * conflicts only happen on a lookahead character. */
 				assert( input != undoLel );
 				assert( input != 0 );
-				assert( alg->retry_lower == 0 );
-				assert( input->tree->alg->retry_upper == 0 );
+				assert( undoLel->tree->retry_lower == 0 );
+				assert( input->tree->retry_upper == 0 );
 
 				/* Transfer the retry from undoLel to input. */
-				input->tree->alg->retry_lower = alg->retry_upper;
-				input->tree->alg->retry_upper = 0;
-				input->tree->alg->state = stackTopTarget();
+				input->tree->retry_lower = undoLel->tree->retry_upper;
+				input->tree->retry_upper = 0;
+				input->tree->state = stackTopTarget();
 			}
 
 			/* Free the reduced item. */
 			tree_downref( prg, root, undoLel->tree );
 			prg->kidPool.free( undoLel );
-			prg->algPool.free( alg );
+			//prg->algPool.free( alg );
 		}
 	}
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 27d15a4a..ec0c13ad 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -74,8 +74,6 @@ struct Tree
 
 	Head *tokdata;
 
-	Alg *alg;
-
 	/* Parsing algorithm. */
 	long state;
 	long region;
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 43e2e285..0d25aaa9 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -861,11 +861,11 @@ free_tree:
 		else if ( tree->id == LEL_ID_STREAM )
 			stream_free( prg, (Stream*) tree );
 		else { 
-			if ( tree->alg != 0 ) {
-				//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
-				//vm_push( tree->alg->parsed );
-				prg->algPool.free( tree->alg );
-			}
+			//if ( tree->alg != 0 ) {
+			//	//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
+			//	//vm_push( tree->alg->parsed );
+			//	prg->algPool.free( tree->alg );
+			//}
 			string_free( prg, tree->tokdata );
 
 			Kid *child = tree->child;
-- 
cgit v1.2.1


From bcf2cbccbedea1b8379998f0ddbcf19b02154525 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 21 Nov 2008 20:52:11 +0000
Subject: Removed the Alg data structure from the program. Sorted out some
 issues with replacing lhs and storing the parsing algorithm data.

---
 colm/bytecode.cpp |  5 -----
 colm/bytecode.h   |  2 --
 colm/pdarun.cpp   | 47 +++++++++++++++++------------------------------
 colm/pdarun.h     | 11 -----------
 4 files changed, 17 insertions(+), 48 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 539a5797..63336af0 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -318,10 +318,6 @@ void Program::clear( Tree **vm_stack, Tree **sp )
 	if ( treeLost )
 		cerr << "warning lost trees: " << treeLost << endl;
 
-	long algLost = algPool.numlost();
-	if ( algLost )
-		cerr << "warning lost algs: " << algLost << endl;
-
 	long listLost = listElPool.numlost();
 	if ( listLost )
 		cerr << "warning lost listEls: " << listLost << endl;
@@ -332,7 +328,6 @@ void Program::clear( Tree **vm_stack, Tree **sp )
 
 	kidPool.clear();
 	treePool.clear();
-	algPool.clear();
 	listElPool.clear();
 	mapElPool.clear();
 
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 0fe40921..abed61a1 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -317,7 +317,6 @@ typedef unsigned char uchar;
 
 struct Kid;
 struct Tree;
-struct Alg;
 struct ListEl;
 struct MapEl;
 struct PdaTables;
@@ -653,7 +652,6 @@ struct Program
 
 	PoolAlloc<Kid> kidPool;
 	PoolAlloc<Tree> treePool;
-	PoolAlloc<Alg> algPool;
 	PoolAlloc<ListEl> listElPool;
 	PoolAlloc<MapEl> mapElPool;
 
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 71ca612e..6c7940bb 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -190,13 +190,13 @@ head:
 		}
 	}
 
-	/* FIXME: Need to sort out the storage of parse algorithm data. Is it in
-	 * the restored node or the original? This needs to be reconciled with the
-	 * parse and unparse algorithms. */
-
 	if ( restore != 0 )
 		tree = restore;
 
+	/* All the parse algorithm data except for the RCODE flag is in the
+	 * original. That is why we restore first, then we can clear the retry
+	 * values. */
+
 	/* Check causeReduce, might be time to backup over the reverse code
 	 * belonging to a nonterminal that caused previous reductions. */
 	if ( causeReduce > 0 && 
@@ -376,22 +376,19 @@ again:
 	if ( *action & act_rb ) {
 		int objectLength, reduction = *action >> 2;
 		Kid *last, *redLel, *child, *attrs;
-		Alg *redAlg;
 
 		if ( input != 0 )
 			input->tree->causeReduce += 1;
 
 		redLel = prg->kidPool.allocate();
 		redLel->tree = prg->treePool.allocate();
-		redAlg = prg->algPool.allocate();
-
 		redLel->tree->refs = 1;
 		redLel->tree->id = tables->rtd->prodInfo[reduction].lhsId;
 
 		redLel->next = 0;
-		redAlg->causeReduce = 0;
-		redAlg->retry_lower = 0;
-		redAlg->retry_upper = lel->tree->retry_lower;
+		redLel->tree->causeReduce = 0;
+		redLel->tree->retry_lower = 0;
+		redLel->tree->retry_upper = lel->tree->retry_lower;
 		lel->tree->retry_lower = 0;
 
 		/* Allocate the attributes. */
@@ -416,9 +413,9 @@ again:
 				<< " rhsLen: " << rhsLen;
 		#endif
 		if ( action[1] == 0 )
-			redAlg->retry_upper = 0;
+			redLel->tree->retry_upper = 0;
 		else {
-			redAlg->retry_upper += 1;
+			redLel->tree->retry_upper += 1;
 			assert( lel->tree->retry_lower == 0 );
 			numRetry += 1;
 			#ifdef COLM_LOG_PARSE
@@ -472,22 +469,17 @@ again:
 			/* Pull out the reverse code, if any. */
 			bool hasrcode = make_reverse_code( allReverseCode, reverseCode );
 			if ( hasrcode )
-				redAlg->flags |= AF_HAS_RCODE;
+				redLel->tree->flags |= AF_HAS_RCODE;
 
 			/* Perhaps the execution environment is telling us we need to
 			 * reject the reduction. */
 			induceReject = execution.reject;
 		}
 
-		/* Save the algorithm data in the reduced tree. */
-		redLel->tree->state       = redAlg->state;
-		redLel->tree->region      = redAlg->region;
-		redLel->tree->causeReduce = redAlg->causeReduce;
-		redLel->tree->retry_lower = redAlg->retry_lower;
-		redLel->tree->retry_upper = redAlg->retry_upper;
-		redLel->tree->flags       = redAlg->flags;
-
-		prg->algPool.free( redAlg );
+		/* If the left hand side was replaced then the only parse algorithm
+		 * data that is contained in it will be the AF_HAS_RCODE flag. Everything
+		 * else will be in the original. This requires that we restore first
+		 * when going backwards and when doing a commit. */
 
 		if ( induceReject ) {
 			#ifdef COLM_LOG_PARSE
@@ -594,13 +586,6 @@ parseError:
 					tables->rtd->lelInfo[stackTop->tree->id].name << endl;
 			#endif
 
-			/* FIXME: Need to reconcile the storage of alg data here. */
-
-			/* Take the alg out of undoLel. */
-			//Alg *alg = undoLel->tree->alg;
-			//assert( alg != 0 );
-			//undoLel->tree->alg = 0;
-
 			/* Check for an execution environment. */
 			if ( undoLel->tree->flags & AF_HAS_RCODE ) {
 				Execution execution( prg, reverseCode, this, 0, 0, 0 );
@@ -616,6 +601,9 @@ parseError:
 				}
 			}
 
+			/* Only the RCODE flag was in the replaced lhs. All the rest is in
+			 * the original. We read it after restoring. */
+
 			/* Warm fuzzies ... */
 			assert( undoLel == stackTop );
 
@@ -660,7 +648,6 @@ parseError:
 			/* Free the reduced item. */
 			tree_downref( prg, root, undoLel->tree );
 			prg->kidPool.free( undoLel );
-			//prg->algPool.free( alg );
 		}
 	}
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index ec0c13ad..ad21b941 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -38,17 +38,6 @@ struct PdaTables;
 struct FsmTables;
 struct InputStream;
 
-struct Alg
-{
-	/* Parsing algorithm. */
-	long state;
-	long region;
-	char causeReduce;
-	char retry_lower;
-	char retry_upper;
-	char flags;
-};
-
 struct Kid
 {
 	/* The tree needs to be first since pointers to kids are used to reference
-- 
cgit v1.2.1


From 57d2741adc977acf0d8e266e6bb403bc660df9b9 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 22 Nov 2008 17:58:32 +0000
Subject: Start differentiating between trees and parse trees.

---
 colm/bytecode.cpp |  5 +++++
 colm/bytecode.h   |  5 +++++
 colm/fsmrun.cpp   | 12 ++++++++----
 colm/pdabuild.cpp |  2 ++
 colm/pdarun.cpp   |  7 +++++--
 colm/pdarun.h     | 19 +++++++++++++++++++
 colm/tree.cpp     | 10 ++++------
 7 files changed, 48 insertions(+), 12 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 63336af0..ea5c7cb7 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -318,6 +318,10 @@ void Program::clear( Tree **vm_stack, Tree **sp )
 	if ( treeLost )
 		cerr << "warning lost trees: " << treeLost << endl;
 
+	long parseTreeLost = parseTreePool.numlost();
+	if ( parseTreeLost )
+		cerr << "warning lost parse trees: " << parseTreeLost << endl;
+
 	long listLost = listElPool.numlost();
 	if ( listLost )
 		cerr << "warning lost listEls: " << listLost << endl;
@@ -328,6 +332,7 @@ void Program::clear( Tree **vm_stack, Tree **sp )
 
 	kidPool.clear();
 	treePool.clear();
+	parseTreePool.clear();
 	listElPool.clear();
 	mapElPool.clear();
 
diff --git a/colm/bytecode.h b/colm/bytecode.h
index abed61a1..5a849da5 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -274,6 +274,9 @@ typedef unsigned char uchar;
  * managing parsing fields will be active. */
 #define AF_PARSED      0x40
 
+/* Tree was allocated as a ParseTree. */
+#define AF_PARSE_TREE  0x80
+
 /*
  * Call stack.
  */
@@ -317,6 +320,7 @@ typedef unsigned char uchar;
 
 struct Kid;
 struct Tree;
+struct ParseTree;
 struct ListEl;
 struct MapEl;
 struct PdaTables;
@@ -652,6 +656,7 @@ struct Program
 
 	PoolAlloc<Kid> kidPool;
 	PoolAlloc<Tree> treePool;
+	PoolAlloc<ParseTree> parseTreePool;
 	PoolAlloc<ListEl> listElPool;
 	PoolAlloc<MapEl> mapElPool;
 
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index abd77b51..e26d7541 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -327,7 +327,8 @@ void add_notoken( Program *prg, PdaRun *parser )
 		cerr << "found reverse code but no token, sending _notoken" << endl;
 		#endif
 
-		Tree *tree = prg->treePool.allocate();
+		Tree *tree = (Tree*)prg->parseTreePool.allocate();
+		tree->flags |= AF_PARSE_TREE;
 		tree->refs = 1;
 		tree->id = prg->rtd->noTokenId;
 		tree->tokdata = 0;
@@ -501,7 +502,8 @@ Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 
 	Kid *input = 0;
 	input = prg->kidPool.allocate();
-	input->tree = prg->treePool.allocate();
+	input->tree = (Tree*)prg->parseTreePool.allocate();
+	input->tree->flags |= AF_PARSE_TREE;
 
 	if ( namedLangEl )
 		input->tree->flags |= AF_NAMED;
@@ -622,7 +624,8 @@ void FsmRun::sendIgnore( long id )
 	update_position( this, tokstart, length );
 	tokstart = 0;
 	
-	Tree *tree = prg->treePool.allocate();
+	Tree *tree = (Tree*)prg->parseTreePool.allocate();
+	tree->flags |= AF_PARSE_TREE;
 	tree->refs = 1;
 	tree->id = id;
 	tree->tokdata = ignoreStr;
@@ -684,7 +687,8 @@ void FsmRun::sendEOF( )
 	#endif
 
 	Kid *input = prg->kidPool.allocate();
-	input->tree = prg->treePool.allocate();
+	input->tree = (Tree*)prg->parseTreePool.allocate();
+	input->tree->flags |= AF_PARSE_TREE;
 
 	input->tree->refs = 1;
 	input->tree->id = parser->tables->rtd->eofId;
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 58ccb220..5af8cae1 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -37,6 +37,8 @@
 /* Dumping the fsm. */
 #include "mergesort.h"
 
+#define pt(var) ((ParseTree*)(var))
+
 using namespace std;
 
 char startDefName[] = "start";
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 6c7940bb..22876c01 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -39,6 +39,7 @@ using std::endl;
 #define lower 0x0000ffff
 #define upper 0xffff0000
 #define reject() induceReject = 1
+#define pt(var) ((ParseTree*)(var))
 
 #define read_word_p( i, p ) do { \
 	i = ((Word)  p[0]); \
@@ -89,7 +90,8 @@ void PdaRun::init()
 
 	/* Init the element allocation variables. */
 	stackTop = prg->kidPool.allocate();
-	stackTop->tree = prg->treePool.allocate();
+	stackTop->tree = (Tree*)prg->parseTreePool.allocate();
+	stackTop->tree->flags |= AF_PARSE_TREE;
 
 	stackTop->tree->state = -1;
 	stackTop->tree->refs = 1;
@@ -381,7 +383,8 @@ again:
 			input->tree->causeReduce += 1;
 
 		redLel = prg->kidPool.allocate();
-		redLel->tree = prg->treePool.allocate();
+		redLel->tree = (Tree*)prg->parseTreePool.allocate();
+		redLel->tree->flags |= AF_PARSE_TREE;
 		redLel->tree->refs = 1;
 		redLel->tree->id = tables->rtd->prodInfo[reduction].lhsId;
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index ad21b941..93fc80a6 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -71,6 +71,25 @@ struct Tree
 	char retry_upper;
 };
 
+struct ParseTree
+{
+	/* Entire structure must overlay Tree. */
+	short id;
+	unsigned short flags;
+	long refs;
+	Kid *child;
+
+	Head *tokdata;
+
+	/* Parsing algorithm. */
+	long state;
+	long region;
+	char causeReduce;
+	char retry_lower;
+	char retry_upper;
+};
+
+
 struct Int
 {
 	/* Must overlay Tree. */
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 0d25aaa9..4ff9bf13 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -861,11 +861,6 @@ free_tree:
 		else if ( tree->id == LEL_ID_STREAM )
 			stream_free( prg, (Stream*) tree );
 		else { 
-			//if ( tree->alg != 0 ) {
-			//	//assert( ! (tree->alg->flags & AF_HAS_RCODE) );
-			//	//vm_push( tree->alg->parsed );
-			//	prg->algPool.free( tree->alg );
-			//}
 			string_free( prg, tree->tokdata );
 
 			Kid *child = tree->child;
@@ -876,7 +871,10 @@ free_tree:
 				child = next;
 			}
 
-			prg->treePool.free( tree );
+			if ( tree->flags & AF_PARSE_TREE )
+				prg->parseTreePool.free( (ParseTree*)tree );
+			else
+				prg->treePool.free( tree );
 		}
 	}
 
-- 
cgit v1.2.1


From 0960b48b7404eefc4d4bb1e14a38572aa095b43e Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 22 Nov 2008 18:46:43 +0000
Subject: More on the distinction between parse trees and simple trees, though
 they are still identical in structure at this point. They need to be
 separated more in the code.

---
 colm/pdabuild.cpp | 12 ++++----
 colm/pdarun.cpp   | 88 +++++++++++++++++++++++++++----------------------------
 colm/tree.cpp     |  9 ++++--
 3 files changed, 56 insertions(+), 53 deletions(-)

diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 5af8cae1..1e21335a 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1387,7 +1387,7 @@ void ParseData::makeRuntimeData()
 void mapNodes( Program *prg, int &count, Kid *kid )
 {
 	if ( kid != 0 ) {
-		kid->tree->state = count++;
+		pt(kid->tree)->state = count++;
 
 		Kid *ignore = tree_ignore( prg, kid->tree );
 		while ( tree_is_ignore( prg, ignore ) ) {
@@ -1403,15 +1403,15 @@ void fillNodes( Program *prg, Bindings &bindings, long &bindId,
 		PatReplNode *nodes, Kid *kid )
 {
 	if ( kid != 0 ) {
-		long ind = kid->tree->state;
+		long ind = pt(kid->tree)->state;
 		PatReplNode &node = nodes[ind++];
 
 		Kid *child = tree_child( prg, kid->tree );
 
 		/* Set up the fields. */
 		node.id = kid->tree->id;
-		node.child = child == 0 ? -1 : child->tree->state;
-		node.next = kid->next == 0 ? -1 : kid->next->tree->state;
+		node.child = child == 0 ? -1 : pt(child->tree)->state;
+		node.next = kid->next == 0 ? -1 : pt(kid->next->tree)->state;
 		node.length = string_length( kid->tree->tokdata );
 		node.data = string_data( kid->tree->tokdata );
 
@@ -1471,7 +1471,7 @@ void ParseData::fillInPatterns( Program *prg )
 
 	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
 		runtimeData->patReplInfo[pat->patRepId].offset = 
-				pat->pdaRun->stackTop->next->tree->state;
+				pt(pat->pdaRun->stackTop->next->tree)->state;
 
 		/* BindIds are indexed base one. */
 		runtimeData->patReplInfo[pat->patRepId].numBindings = 
@@ -1485,7 +1485,7 @@ void ParseData::fillInPatterns( Program *prg )
 
 	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
 		runtimeData->patReplInfo[repl->patRepId].offset = 
-				repl->pdaRun->stackTop->next->tree->state;
+				pt(repl->pdaRun->stackTop->next->tree)->state;
 
 		/* BindIds are indexed base one. */
 		runtimeData->patReplInfo[repl->patRepId].numBindings = 
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 22876c01..450d962c 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -93,7 +93,7 @@ void PdaRun::init()
 	stackTop->tree = (Tree*)prg->parseTreePool.allocate();
 	stackTop->tree->flags |= AF_PARSE_TREE;
 
-	stackTop->tree->state = -1;
+	pt(stackTop->tree)->state = -1;
 	stackTop->tree->refs = 1;
 	numRetry = 0;
 	errCount = 0;
@@ -110,12 +110,12 @@ void PdaRun::init()
 long PdaRun::stackTopTarget()
 {
 	long state;
-	if ( stackTop->tree->state < 0 )
+	if ( pt(stackTop->tree)->state < 0 )
 		state = tables->startState;
 	else {
 		state = tables->targs[(int)tables->indicies[tables->offsets[
-				stackTop->tree->state] + 
-				(stackTop->tree->id - tables->keys[stackTop->tree->state<<1])]];
+				pt(stackTop->tree)->state] + 
+				(stackTop->tree->id - tables->keys[pt(stackTop->tree)->state<<1])]];
 	}
 	return state;
 }
@@ -172,13 +172,13 @@ head:
 		/* If tree caused some reductions, now is not the right time to backup
 		 * over the reverse code. We need to backup over the reductions first. Store
 		 * the count of the reductions and do it when the count drops to zero. */
-		if ( tree->causeReduce > 0 ) {
+		if ( pt(tree)->causeReduce > 0 ) {
 			/* The top reduce block does not correspond to this alg. */
 			#ifdef COLM_LOG_PARSE
 			cerr << "commit: causeReduce found, delaying backup: " << 
-					(long)tree->causeReduce << endl;
+					(long)pt(tree)->causeReduce << endl;
 			#endif
-			causeReduce = tree->causeReduce;
+			causeReduce = pt(tree)->causeReduce;
 		}
 		else {
 			rcode = backup_over_rcode( rcode );
@@ -218,13 +218,13 @@ head:
 	}
 
 	/* Reset retries. */
-	if ( tree->retry_lower > 0 ) {
+	if ( pt(tree)->retry_lower > 0 ) {
 		parser->numRetry -= 1;
-		tree->retry_lower = 0;
+		pt(tree)->retry_lower = 0;
 	}
-	if ( tree->retry_upper > 0 ) {
+	if ( pt(tree)->retry_upper > 0 ) {
 		parser->numRetry -= 1;
-		tree->retry_upper = 0;
+		pt(tree)->retry_upper = 0;
 	}
 	tree->flags |= AF_COMMITTED;
 
@@ -311,9 +311,9 @@ void PdaRun::parseToken( Kid *input )
 	if ( cs < 0 )
 		return;
 
-	input->tree->region = nextRegionInd;
-	input->tree->state = cs;
-	if ( tables->tokenRegions[input->tree->region+1] != 0 )
+	pt(input->tree)->region = nextRegionInd;
+	pt(input->tree)->state = cs;
+	if ( tables->tokenRegions[pt(input->tree)->region+1] != 0 )
 		numRetry += 1;
 
 again:
@@ -331,15 +331,15 @@ again:
 	induceReject = false;
 	targState = tables->targs[pos];
 	action = tables->actions + tables->actInds[pos];
-	if ( lel->tree->retry_lower )
-		action += lel->tree->retry_lower;
+	if ( pt(lel->tree)->retry_lower )
+		action += pt(lel->tree)->retry_lower;
 
 	if ( *action & act_sb ) {
 		#ifdef COLM_LOG_PARSE
-		cerr << "shifted: " << tables->rtd->lelInfo[lel->tree->id].name;
+		cerr << "shifted: " << tables->rtd->lelInfo[pt(lel->tree)->id].name;
 		#endif
 		input = input->next;
-		lel->tree->state = cs;
+		pt(lel->tree)->state = cs;
 		lel->next = stackTop;
 		stackTop = lel;
 
@@ -352,10 +352,10 @@ again:
 		}
 
 		if ( action[1] == 0 )
-			lel->tree->retry_lower = 0;
+			pt(lel->tree)->retry_lower = 0;
 		else {
-			lel->tree->retry_lower += 1;
-			assert( lel->tree->retry_upper == 0 );
+			pt(lel->tree)->retry_lower += 1;
+			assert( pt(lel->tree)->retry_upper == 0 );
 			numRetry += 1; /* FIXME: Has the retry already been counted? */
 			#ifdef COLM_LOG_PARSE
 			cerr << " retry: " << stackTop;
@@ -370,7 +370,7 @@ again:
 		long causeReduce = 0;
 		if ( input != 0 ) { 
 			if ( input->tree->flags & AF_HAS_RCODE )
-				causeReduce = input->tree->causeReduce;
+				causeReduce = pt(input->tree)->causeReduce;
 		}
 		commit_full( this, causeReduce );
 	}
@@ -380,7 +380,7 @@ again:
 		Kid *last, *redLel, *child, *attrs;
 
 		if ( input != 0 )
-			input->tree->causeReduce += 1;
+			pt(input->tree)->causeReduce += 1;
 
 		redLel = prg->kidPool.allocate();
 		redLel->tree = (Tree*)prg->parseTreePool.allocate();
@@ -389,10 +389,10 @@ again:
 		redLel->tree->id = tables->rtd->prodInfo[reduction].lhsId;
 
 		redLel->next = 0;
-		redLel->tree->causeReduce = 0;
-		redLel->tree->retry_lower = 0;
-		redLel->tree->retry_upper = lel->tree->retry_lower;
-		lel->tree->retry_lower = 0;
+		pt(redLel->tree)->causeReduce = 0;
+		pt(redLel->tree)->retry_lower = 0;
+		pt(redLel->tree)->retry_upper = pt(lel->tree)->retry_lower;
+		pt(lel->tree)->retry_lower = 0;
 
 		/* Allocate the attributes. */
 		objectLength = tables->rtd->lelInfo[redLel->tree->id].objectLength;
@@ -416,10 +416,10 @@ again:
 				<< " rhsLen: " << rhsLen;
 		#endif
 		if ( action[1] == 0 )
-			redLel->tree->retry_upper = 0;
+			pt(redLel->tree)->retry_upper = 0;
 		else {
-			redLel->tree->retry_upper += 1;
-			assert( lel->tree->retry_lower == 0 );
+			pt(redLel->tree)->retry_upper += 1;
+			assert( pt(lel->tree)->retry_lower == 0 );
 			numRetry += 1;
 			#ifdef COLM_LOG_PARSE
 			cerr << " retry: " << redLel;
@@ -432,7 +432,7 @@ again:
 
 		/* When the production is of zero length we stay in the same state.
 		 * Otherwise we use the state stored in the first child. */
-		targState = rhsLen == 0 ? cs : child->tree->state;
+		targState = rhsLen == 0 ? cs : pt(child->tree)->state;
 
 		assert( redLel->tree->refs == 1 );
 
@@ -489,7 +489,7 @@ again:
 			cerr << "error induced during reduction of " <<
 					tables->rtd->lelInfo[redLel->tree->id].name << endl;
 			#endif
-			redLel->tree->state = cs;
+			pt(redLel->tree)->state = cs;
 			redLel->next = stackTop;
 			stackTop = redLel;
 			cs = targState;
@@ -515,9 +515,9 @@ parseError:
 
 	while ( 1 ) {
 		if ( input != 0 ) {
-			assert( input->tree->retry_upper == 0 );
+			assert( pt(input->tree)->retry_upper == 0 );
 
-			if ( input->tree->retry_lower != 0 ) {
+			if ( pt(input->tree)->retry_lower != 0 ) {
 				#ifdef COLM_LOG_PARSE
 				cerr << "found retry targ: " << input << endl;
 				#endif
@@ -526,14 +526,14 @@ parseError:
 				cerr << "found retry: " << input << endl;
 				#endif
 
-				cs = input->tree->state;
+				cs = pt(input->tree)->state;
 				goto again;
 			}
 
 			/* If there is no retry and there are no reductions caused by the
 			 * current input token then we are finished with it. Send it back. */
-			if ( input->tree->causeReduce == 0 ) {
-				int next = input->tree->region + 1;
+			if ( pt(input->tree)->causeReduce == 0 ) {
+				int next = pt(input->tree)->region + 1;
 
 				fsmRun->queueBack( input );
 				input = 0;
@@ -632,20 +632,20 @@ parseError:
 			/* If there is an input queued, this is one less reduction it has
 			 * caused. */
 			if ( input != 0 )
-				input->tree->causeReduce -= 1;
+				pt(input->tree)->causeReduce -= 1;
 
-			if ( undoLel->tree->retry_upper != 0 ) {
+			if ( pt(undoLel->tree)->retry_upper != 0 ) {
 				/* There is always an input item here because reduce
 				 * conflicts only happen on a lookahead character. */
 				assert( input != undoLel );
 				assert( input != 0 );
-				assert( undoLel->tree->retry_lower == 0 );
-				assert( input->tree->retry_upper == 0 );
+				assert( pt(undoLel->tree)->retry_lower == 0 );
+				assert( pt(input->tree)->retry_upper == 0 );
 
 				/* Transfer the retry from undoLel to input. */
-				input->tree->retry_lower = undoLel->tree->retry_upper;
-				input->tree->retry_upper = 0;
-				input->tree->state = stackTopTarget();
+				pt(input->tree)->retry_lower = pt(undoLel->tree)->retry_upper;
+				pt(input->tree)->retry_upper = 0;
+				pt(input->tree)->state = stackTopTarget();
 			}
 
 			/* Free the reduced item. */
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 4ff9bf13..7c624e2a 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -290,7 +290,8 @@ Tree *make_token( Tree **root, Program *prg, long nargs )
 	Tree *tree;
 
 	if ( lelInfo[id].ignore ) {
-		tree = prg->treePool.allocate();
+		tree = (Tree*)prg->parseTreePool.allocate();
+		tree->flags |= AF_PARSE_TREE;
 		tree->refs = 1;
 		tree->id = id;
 		tree->tokdata = tokdata;
@@ -299,7 +300,8 @@ Tree *make_token( Tree **root, Program *prg, long nargs )
 		long objectLength = lelInfo[id].objectLength;
 		Kid *attrs = alloc_attrs( prg, objectLength );
 
-		tree = prg->treePool.allocate();
+		tree = (Tree*)prg->parseTreePool.allocate();
+		tree->flags |= AF_PARSE_TREE;
 		tree->id = id;
 		tree->refs = 1;
 		tree->tokdata = tokdata;
@@ -325,7 +327,8 @@ Tree *make_tree( Tree **root, Program *prg, long nargs )
 	long id = idInt->value;
 	LangElInfo *lelInfo = prg->rtd->lelInfo;
 
-	Tree *tree = prg->treePool.allocate();
+	Tree *tree = (Tree*)prg->parseTreePool.allocate();
+	tree->flags |= AF_PARSE_TREE;
 	tree->id = id;
 	tree->refs = 1;
 
-- 
cgit v1.2.1


From 9913736da5dbcd240f0f605ee1b73833e01bd5f8 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 22 Nov 2008 22:41:46 +0000
Subject: Removed the parse algorithm data from the Tree structure. Not sending
 ignore tokens as parse trees. After a reduction action make sure the lhs is a
 full parse tree, as must be done in the send function. All entry points into
 the parsing algorithm must be protected in this way.

---
 colm/bytecode.cpp | 16 ++++++++++------
 colm/bytecode.h   |  3 ++-
 colm/fsmrun.cpp   |  3 +--
 colm/pdarun.cpp   |  1 +
 colm/pdarun.h     | 10 +++++-----
 colm/tree.cpp     | 21 +++++++++++++++------
 6 files changed, 34 insertions(+), 20 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index ea5c7cb7..28766f39 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -77,21 +77,25 @@ using std::endl;
 	i |= ((Word) *instr++) << 8; \
 } while(0)
 
-/* Type conversions. */
-
-void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
+Tree *prep_parse_tree( Program *prg, Tree *tree )
 {
 	/* If the tree was produced by a parsing function then we need to send a
 	 * copy of it because the parsing that we are about to do requires fresh
 	 * parsing algorithm data. */
-	if ( tree->flags & AF_PARSED ) {
+	if ( !(tree->flags & AF_PARSE_TREE) || tree->flags & AF_PARSED ) {
 		#ifdef COLM_LOG_BYTECODE
-		cerr << "copying tree in send because alg is set" << endl;
+		cerr << "copying tree in send function" << endl;
 		#endif
 		Kid *unused = 0;
-		tree = copy_real_tree( prg, tree, 0, unused );
+		tree = copy_real_tree( prg, tree, 0, unused, true );
 		tree_upref( tree );
 	}
+	return  tree;
+}
+
+void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
+{
+	tree = prep_parse_tree( prg, tree );
 
 	if ( tree->id >= prg->rtd->firstNonTermId )
 		tree->id = prg->rtd->lelInfo[tree->id].termDupId;
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 5a849da5..51bc9f5e 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -475,9 +475,10 @@ void ignore_data( Tree *tree, char *dest );
 long ignore_length( Tree *tree );
 Tree *split_tree( Program *prg, Tree *t );
 Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
-Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown );
+Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown, bool parsed );
 Tree *make_tree( Tree **root, Program *prg, long nargs );
 Tree *make_token( Tree **root, Program *prg, long nargs );
+Tree *prep_parse_tree( Program *prg, Tree *tree );
 
 void print_tree( Tree **&sp, Program *prg, Tree *tree );
 void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index e26d7541..10ae7dc0 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -624,8 +624,7 @@ void FsmRun::sendIgnore( long id )
 	update_position( this, tokstart, length );
 	tokstart = 0;
 	
-	Tree *tree = (Tree*)prg->parseTreePool.allocate();
-	tree->flags |= AF_PARSE_TREE;
+	Tree *tree = prg->treePool.allocate();
 	tree->refs = 1;
 	tree->id = id;
 	tree->tokdata = ignoreStr;
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 450d962c..6d25883e 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -450,6 +450,7 @@ again:
 			/* Transfer the lhs from the environment to redLel. It is uprefed
 			 * while in the environment. */
 			redLel->tree = execution.lhs;
+			redLel->tree = prep_parse_tree( prg, redLel->tree );
 
 			/* If the lhs was saved and it changed then we need to restore the
 			 * original upon backtracking, otherwise downref since we took a
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 93fc80a6..f1a0b64a 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -64,11 +64,11 @@ struct Tree
 	Head *tokdata;
 
 	/* Parsing algorithm. */
-	long state;
-	long region;
-	char causeReduce;
-	char retry_lower;
-	char retry_upper;
+//	long state;
+//	long region;
+//	char causeReduce;
+//	char retry_lower;
+//	char retry_upper;
 };
 
 struct ParseTree
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 7c624e2a..c9625fb5 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -621,13 +621,19 @@ void stream_free( Program *prg, Stream *s )
 	prg->mapElPool.free( (MapEl*)s );
 }
 
-Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
+Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, 
+		Kid *&newNextDown, bool parseTree )
 {
-	assert( tree->refs >= 2 );
-
 	/* Need to keep a lookout for next down. If 
 	 * copying it, return the copy. */
-	Tree *newTree = prg->treePool.allocate();
+	Tree *newTree;
+	if ( parseTree ) {
+		newTree = (Tree*) prg->parseTreePool.allocate();
+		newTree->flags |= AF_PARSE_TREE;
+	}
+	else {
+		newTree = prg->treePool.allocate();
+	}
 
 	newTree->id = tree->id;
 	newTree->tokdata = string_copy( prg, tree->tokdata );
@@ -735,6 +741,8 @@ Map *copy_map( Program *prg, Map *map, Kid *oldNextDown, Kid *&newNextDown )
 
 Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
 {
+	assert( tree->refs >= 2 );
+
 	LangElInfo *lelInfo = prg->rtd->lelInfo;
 	long genericId = lelInfo[tree->id].genericId;
 	if ( genericId > 0 ) {
@@ -754,8 +762,9 @@ Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
 		assert(false);
 	else if ( tree->id == LEL_ID_STR )
 		assert(false);
-	else
-		tree = copy_real_tree( prg, tree, oldNextDown, newNextDown );
+	else {
+		tree = copy_real_tree( prg, tree, oldNextDown, newNextDown, false );
+	}
 
 	assert( tree->refs == 0 );
 	return tree;
-- 
cgit v1.2.1


From 444d03d11a7fca334e382b4038bf96f6ba50c4bf Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 23 Nov 2008 17:14:12 +0000
Subject: The make_tree and make_token functions now produce normal non-parse
 trees. The copy functions no longer downref the source, they just do a pure
 copy. Removed the check on the refcount from copy_list and copy_map. These
 functions should just always produce a copy since they are needed outside of
 the split functions.

---
 colm/bytecode.cpp |  12 ++++--
 colm/bytecode.h   |   2 +-
 colm/fsmrun.cpp   |   2 +-
 colm/pdarun.cpp   |   2 +-
 colm/pdarun.h     |   7 ----
 colm/tree.cpp     | 116 +++++++++++++++++++++++++-----------------------------
 6 files changed, 65 insertions(+), 76 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 28766f39..965e1251 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -77,7 +77,7 @@ using std::endl;
 	i |= ((Word) *instr++) << 8; \
 } while(0)
 
-Tree *prep_parse_tree( Program *prg, Tree *tree )
+Tree *prep_parse_tree( Program *prg, Tree **sp, Tree *tree )
 {
 	/* If the tree was produced by a parsing function then we need to send a
 	 * copy of it because the parsing that we are about to do requires fresh
@@ -87,15 +87,19 @@ Tree *prep_parse_tree( Program *prg, Tree *tree )
 		cerr << "copying tree in send function" << endl;
 		#endif
 		Kid *unused = 0;
-		tree = copy_real_tree( prg, tree, 0, unused, true );
-		tree_upref( tree );
+		Tree *newTree = copy_real_tree( prg, tree, 0, unused, true );
+		tree_upref( newTree );
+
+		tree_downref( prg, sp, tree );
+
+		tree = newTree;
 	}
 	return  tree;
 }
 
 void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 {
-	tree = prep_parse_tree( prg, tree );
+	tree = prep_parse_tree( prg, root, tree );
 
 	if ( tree->id >= prg->rtd->firstNonTermId )
 		tree->id = prg->rtd->lelInfo[tree->id].termDupId;
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 51bc9f5e..6fce4b19 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -478,7 +478,7 @@ Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
 Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown, bool parsed );
 Tree *make_tree( Tree **root, Program *prg, long nargs );
 Tree *make_token( Tree **root, Program *prg, long nargs );
-Tree *prep_parse_tree( Program *prg, Tree *tree );
+Tree *prep_parse_tree( Program *prg, Tree **sp, Tree *tree );
 
 void print_tree( Tree **&sp, Program *prg, Tree *tree );
 void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 10ae7dc0..183762ec 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -763,7 +763,7 @@ long PdaRun::undoParse( Tree *tree, CodeVect *rev )
 
 	assert( stackTop->next == 0 );
 
-	prg->treePool.free( stackTop->tree );
+	tree_downref( prg, root, stackTop->tree );
 	prg->kidPool.free( stackTop );
 	return 0;
 }
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 6d25883e..766910c2 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -450,7 +450,7 @@ again:
 			/* Transfer the lhs from the environment to redLel. It is uprefed
 			 * while in the environment. */
 			redLel->tree = execution.lhs;
-			redLel->tree = prep_parse_tree( prg, redLel->tree );
+			redLel->tree = prep_parse_tree( prg, root, redLel->tree );
 
 			/* If the lhs was saved and it changed then we need to restore the
 			 * original upon backtracking, otherwise downref since we took a
diff --git a/colm/pdarun.h b/colm/pdarun.h
index f1a0b64a..9634b20c 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -62,13 +62,6 @@ struct Tree
 	Kid *child;
 
 	Head *tokdata;
-
-	/* Parsing algorithm. */
-//	long state;
-//	long region;
-//	char causeReduce;
-//	char retry_lower;
-//	char retry_upper;
 };
 
 struct ParseTree
diff --git a/colm/tree.cpp b/colm/tree.cpp
index c9625fb5..45ac50a6 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -290,8 +290,7 @@ Tree *make_token( Tree **root, Program *prg, long nargs )
 	Tree *tree;
 
 	if ( lelInfo[id].ignore ) {
-		tree = (Tree*)prg->parseTreePool.allocate();
-		tree->flags |= AF_PARSE_TREE;
+		tree = prg->treePool.allocate();
 		tree->refs = 1;
 		tree->id = id;
 		tree->tokdata = tokdata;
@@ -300,8 +299,7 @@ Tree *make_token( Tree **root, Program *prg, long nargs )
 		long objectLength = lelInfo[id].objectLength;
 		Kid *attrs = alloc_attrs( prg, objectLength );
 
-		tree = (Tree*)prg->parseTreePool.allocate();
-		tree->flags |= AF_PARSE_TREE;
+		tree = prg->treePool.allocate();
 		tree->id = id;
 		tree->refs = 1;
 		tree->tokdata = tokdata;
@@ -327,8 +325,7 @@ Tree *make_tree( Tree **root, Program *prg, long nargs )
 	long id = idInt->value;
 	LangElInfo *lelInfo = prg->rtd->lelInfo;
 
-	Tree *tree = (Tree*)prg->parseTreePool.allocate();
-	tree->flags |= AF_PARSE_TREE;
+	Tree *tree = prg->treePool.allocate();
 	tree->id = id;
 	tree->refs = 1;
 
@@ -638,8 +635,6 @@ Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown,
 	newTree->id = tree->id;
 	newTree->tokdata = string_copy( prg, tree->tokdata );
 
-	tree->refs -= 1;
-
 	/* Copy the child list, will handle attributes, ignores 
 	 * and the children. */
 	Kid *child = tree->child, *last = 0;
@@ -673,76 +668,63 @@ Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown,
 
 List *copy_list( Program *prg, List *list, Kid *oldNextDown, Kid *&newNextDown )
 {
-	if ( list->refs > 1 ) {
-		#ifdef COLM_LOG_BYTECODE
-		cerr << "splitting list: " << list << " refs: " << 
-				list->refs << endl;
-		#endif
-
-		/* Not a need copy. */
-		List *newList = (List*)prg->mapElPool.allocate();
-		newList->id = list->genericInfo->langElId;
-		newList->genericInfo = list->genericInfo;
-
-		list->refs -= 1;
+	#ifdef COLM_LOG_BYTECODE
+	cerr << "splitting list: " << list << " refs: " << 
+			list->refs << endl;
+	#endif
 
-		ListEl *src = list->head;
-		while( src != 0 ) {
-			ListEl *newEl = prg->listElPool.allocate();
-			newEl->value = src->value;
-			tree_upref( newEl->value );
+	/* Not a need copy. */
+	List *newList = (List*)prg->mapElPool.allocate();
+	newList->id = list->genericInfo->langElId;
+	newList->genericInfo = list->genericInfo;
 
-			newList->append( newEl );
+	ListEl *src = list->head;
+	while( src != 0 ) {
+		ListEl *newEl = prg->listElPool.allocate();
+		newEl->value = src->value;
+		tree_upref( newEl->value );
 
-			/* Watch out for next down. */
-			if ( (Kid*)src == oldNextDown )
-				newNextDown = (Kid*)newEl;
+		newList->append( newEl );
 
-			src = src->next;
-		}
+		/* Watch out for next down. */
+		if ( (Kid*)src == oldNextDown )
+			newNextDown = (Kid*)newEl;
 
-		list = newList;
+		src = src->next;
 	}
-	return list;
-}
 
+	return newList;
+}
 	
 Map *copy_map( Program *prg, Map *map, Kid *oldNextDown, Kid *&newNextDown )
 {
-	if ( map->refs > 1 ) {
-		#ifdef COLM_LOG_BYTECODE
-		cerr << "splitting map: " << map << " refs: " << 
-				map->refs << endl;
-		#endif
-
-		Map *newMap = (Map*)prg->mapElPool.allocate();
-		newMap->id = map->genericInfo->langElId;
-		newMap->genericInfo = map->genericInfo;
-		newMap->treeSize = map->treeSize;
-		newMap->root = 0;
-
-		/* If there is a root, copy the tree. */
-		if ( map->root != 0 ) {
-			newMap->root = newMap->copyBranch( prg, map->root, 
-					oldNextDown, newNextDown );
-		}
+	#ifdef COLM_LOG_BYTECODE
+	cerr << "splitting map: " << map << " refs: " << 
+			map->refs << endl;
+	#endif
 
-		map->refs -= 1;
+	Map *newMap = (Map*)prg->mapElPool.allocate();
+	newMap->id = map->genericInfo->langElId;
+	newMap->genericInfo = map->genericInfo;
+	newMap->treeSize = map->treeSize;
+	newMap->root = 0;
 
-		for ( MapEl *el = newMap->head; el != 0; el = el->next ) {
-			assert( map->genericInfo->typeArg == TYPE_TREE );
-			tree_upref( el->tree );
-		}
+	/* If there is a root, copy the tree. */
+	if ( map->root != 0 ) {
+		newMap->root = newMap->copyBranch( prg, map->root, 
+				oldNextDown, newNextDown );
+	}
 
-		map = newMap;
+	for ( MapEl *el = newMap->head; el != 0; el = el->next ) {
+		assert( map->genericInfo->typeArg == TYPE_TREE );
+		tree_upref( el->tree );
 	}
-	return map;
+
+	return newMap;
 }
 
 Tree *copy_tree( Program *prg, Tree *tree, Kid *oldNextDown, Kid *&newNextDown )
 {
-	assert( tree->refs >= 2 );
-
 	LangElInfo *lelInfo = prg->rtd->lelInfo;
 	long genericId = lelInfo[tree->id].genericId;
 	if ( genericId > 0 ) {
@@ -782,8 +764,14 @@ Tree *split_tree( Program *prg, Tree *tree )
 			#endif
 
 			Kid *oldNextDown = 0, *newNextDown = 0;
-			tree = copy_tree( prg, tree, oldNextDown, newNextDown );
-			tree_upref( tree );
+			Tree *newTree = copy_tree( prg, tree, oldNextDown, newNextDown );
+			tree_upref( newTree );
+
+			/* Downref the original. Don't need to consider freeing because
+			 * refs were > 1. */
+			tree->refs -= 1;
+
+			tree = newTree;
 		}
 
 		assert( tree->refs == 1 );
@@ -1401,6 +1389,10 @@ void split_ref( Tree **&sp, Program *prg, Ref *fromRef )
 			Tree *newTree = copy_tree( prg, ref->kid->tree, 
 					oldNextKidDown, newNextKidDown );
 			tree_upref( newTree );
+			
+			/* Downref the original. Don't need to consider freeing because
+			 * refs were > 1. */
+			ref->kid->tree->refs -= 1;
 
 			while ( ref != 0 && ref != nextDown ) {
 				next = ref->next;
-- 
cgit v1.2.1


From 50cbcf057612a9ee77e8dd88e30730a14e9776b6 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Tue, 9 Dec 2008 21:14:20 +0000
Subject: Modified the example in the thesis. Copied it here.

---
 test/til.lm | 98 ++++++++++++++++++++++++++++++++++++++++++++-----------------
 1 file changed, 71 insertions(+), 27 deletions(-)

diff --git a/test/til.lm b/test/til.lm
index 346fc50f..24acd4e3 100644
--- a/test/til.lm
+++ b/test/til.lm
@@ -89,36 +89,80 @@ def goto_statement
 
 program P = parse program(stdin)
 
-for S:statement* in P
+#for S:statement* in P
+#{
+#	if match S [L0: id ':' 
+#			First: statement 
+#			Rest: statement*]
+#	{
+#		for Check: statement* in Rest
+#		{
+#			if match Check 
+#				['if' E: expression 'then' 
+#					'goto' Targ: id ';'
+#				'end'
+#				T: statement*]
+#			{
+#				# This truncates Rest
+#				Check = construct statement* []
+#
+#				# Replace the labeled statement through to the goto with a
+#				# do ... while.
+#				S = construct statement*
+#					['do'
+#						First
+#						Rest
+#					'while' E ';'
+#					T]
+#				break
+#			}
+#		}
+#	}
+#}
+
+for S: statement* in P
 {
-	if match S [L0: id ':' 
-			First: statement 
-			Rest: statement*]
-	{
-		for Check: statement* in Rest
+    if match S [Label: id ':' 
+            First: statement 
+            Rest: statement*]
+    {
+		expression Expr
+		statement* Following
+
+		# Look though the remaining statements for a goto back to the label.
+		# The repeat iterator yields only top-level statement lists. It
+		# restricts our search to the same nesting depth as the label.
+        for Check: statement* in Rest
+        {
+            if match Check 
+                ['if' E: expression 'then' 
+                    'goto' L:id ';'
+                'end'
+                SL: statement*]
+            {
+				Expr = E
+				Following = SL
+
+				# Check iterates over tails of Rest. Assigning an empty list
+				# to check truncates the Rest list. What we cut off is saved in
+				# Following (excluding the if statement).
+                Check = construct statement* []
+            }
+        }
+
+		# If a goto was found, then perform the rewrite.
+		if ( Expr )
 		{
-			if match Check 
-				['if' E: expression 'then' 
-					'goto' Targ: id ';'
-				'end'
-				T: statement*] &&
-				Targ == L0
-			{
-				# This truncates Rest
-				Check = construct statement* []
-
-				# Replace the labeled statement through to the goto with a
-				# do ... while.
-				S = construct statement*
-					['do'
-						First
-						Rest
-					'while' E ';'
-					T]
-				break
-			}
+            # Replace the labelled statement through to the goto 
+			# with a do ... while.
+            S = construct statement*
+                ['do'
+                    First
+                    Rest
+                'while' Expr ';'
+                Following]
 		}
-	}
+    }
 }
 
 print(P, '\n')
-- 
cgit v1.2.1


From 34f8eabcf0a11adefc1ab924f29d96ff99cf7d2d Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 6 Feb 2009 01:33:50 +0000
Subject: Fixed a broken reference to flags (from alg) that was wrapped in an
 ifdef COLM_LOG_PARSE and didn't surface until logging was turned on.

---
 colm/fsmrun.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 183762ec..df4b26d7 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -237,7 +237,7 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 		#ifdef COLM_LOG_PARSE
 		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
 		cerr << "sending back: " << lelInfo[ignore->tree->id].name;
-		if ( ignore->tree->alg != 0 && ignore->tree->alg->flags & AF_ARTIFICIAL )
+		if ( ignore->tree->flags & AF_ARTIFICIAL )
 			cerr << " (artificial)";
 		cerr << endl;
 		#endif
-- 
cgit v1.2.1


From 687a4b9503616a7ed872b7eab08e69d7709cc7fa Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 6 Feb 2009 02:08:57 +0000
Subject: Started on producing references from qualified items. Working on
 calling functions with reference parameters. On return they need to be
 popped, this is not done yet.

---
 colm/bytecode.cpp |  13 ++++++
 colm/bytecode.h   |   1 +
 colm/compile.cpp  | 136 +++++++++++++++++++++++++++++++++++++++++++++++++-----
 colm/parsetree.h  |   5 +-
 colm/tree.cpp     |   2 +-
 5 files changed, 144 insertions(+), 13 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 965e1251..985fc16e 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -2029,6 +2029,19 @@ again:
 			push( (SW)ref->kid );
 			break;
 		}
+		case IN_REF_FROM_QUAL_REF: {
+			short int field;
+			read_half( field );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_REF_FROM_QUAL_REF " << field << endl;
+			#endif
+
+			Ref *ref = (Ref*)plocal(field);
+			push( (SW)ref );
+			push( (SW)ref->kid );
+			break;
+		}
 		case IN_TRITER_REF_FROM_CUR: {
 			short int field;
 			read_half( field );
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 6fce4b19..743b5221 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -141,6 +141,7 @@ typedef unsigned char uchar;
 
 #define IN_REF_FROM_LOCAL        0x62
 #define IN_REF_FROM_REF          0x97
+#define IN_REF_FROM_QUAL_REF     0xa5
 #define IN_TRITER_REF_FROM_CUR   0x63
 #define IN_UITER_REF_FROM_CUR    0x64
                                 
diff --git a/colm/compile.cpp b/colm/compile.cpp
index 74449095..d9ef83f0 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -353,6 +353,51 @@ ObjectDef *objDefFromUT( ParseData *pd, UniqueType *ut )
 	return objDef;
 }
 
+/* The qualification must start at a local frame. There cannot be any pointer. */
+long LangVarRef::loadQualificationRefs( ParseData *pd, CodeVect &code ) const
+{
+	long count = 0;
+	ObjectDef *rootObj = pd->curLocalFrame;
+
+	/* Start the search from the root object. */
+	ObjectDef *searchObjDef = rootObj;
+
+	for ( QualItemVect::Iter qi = *qual; qi.lte(); qi++ ) {
+		/* Lookup the field in the current qualification. */
+		ObjFieldMapEl *objDefMapEl = searchObjDef->objFieldMap->find( qi->data );
+		if ( objDefMapEl == 0 )
+			error(qi->loc) << "cannot resolve qualification " << qi->data << endp;
+		ObjField *el = objDefMapEl->value;
+
+		if ( qi.pos() > 0 ) {
+			code.append( IN_REF_FROM_QUAL_REF );
+			code.appendHalf( 0 );
+		}
+		else if ( el->typeRef->iterDef != 0 ) {
+			code.append( el->typeRef->iterDef->inRefFromCur );
+			code.appendHalf( el->offset );
+		}
+		else if ( el->typeRef->isRef ) {
+			code.append( IN_REF_FROM_REF );
+			code.appendHalf( el->offset );
+		}
+		else {
+			code.append( IN_REF_FROM_LOCAL );
+			code.appendHalf( el->offset );
+		}
+
+		UniqueType *elUT = el->typeRef->lookupType( pd );
+		if ( elUT->typeId == TYPE_ITER )
+			elUT = el->typeRef->searchTypeRef->lookupType( pd );
+		
+		assert( qi->type == QualItem::Dot );
+
+		searchObjDef = objDefFromUT( pd, elUT );
+		count += 1;
+	}
+	return count;
+}
+
 void LangVarRef::loadQualification( ParseData *pd, CodeVect &code, 
 		ObjectDef *rootObj, int lastPtrInQual, bool forWriting, bool revert ) const
 {
@@ -661,29 +706,63 @@ UniqueType *LangVarRef::evaluate( ParseData *pd, CodeVect &code, bool forWriting
 	return ut;
 }
 
+void LangVarRef::canTakeRef( ParseData *pd, VarRefLookup &lookup ) const
+{
+	bool canTake = false;
+
+	/* If the var is not a local, it must be an attribute accessed
+	 * via a local and attributes. */
+	if ( lookup.inObject->type == ObjectDef::FrameType )
+		canTake = true;
+	else if ( isLocalRef(pd) && lookup.lastPtrInQual < 0 && lookup.uniqueType->typeId != TYPE_PTR ) 
+		canTake = true;
+
+	if ( !canTake ) {
+		error(loc) << "can only take references of locals or "
+				"attributes accessed via a local" << endp;
+	}
+
+	if ( lookup.objField->refActive )
+		error(loc) << "reference currently active, cannot take another" << endp;
+}
+
 /* Return the field referenced. */
-ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code ) const
+ObjField *LangVarRef::preEvaluateRef( ParseData *pd, CodeVect &code ) const
 {
 	/* Lookup the loadObj. */
 	VarRefLookup lookup = lookupField( pd );
 
-	if ( lookup.inObject->type != ObjectDef::FrameType )
-		error(loc) << "can only take references of local variables" << endl;
-	
-	if ( lookup.objField->refActive )
-		error(loc) << "reference current active, cannot take another" << endl;
+	canTakeRef( pd, lookup );
+
+	loadQualificationRefs( pd, code );
+
+	return lookup.objField;
+}
+
+/* Return the field referenced. */
+ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code, long pushCount ) const
+{
+	/* Lookup the loadObj. */
+	VarRefLookup lookup = lookupField( pd );
+
+	canTakeRef( pd, lookup );
 
 	/* Ensure that the field is referenced. */
 	lookup.inObject->referenceField( pd, lookup.objField );
 
 	/* Note that we could have modified children. */
-	lookup.objField->refActive = true;
+	if ( qual->length() == 0 )
+		lookup.objField->refActive = true;
 
 	/* Whenever we take a reference we have to assume writing and that the
 	 * tree is dirty. */
 	lookup.objField->dirtyTree = true;
 
-	if ( lookup.objField->typeRef->iterDef != 0 ) {
+	if ( qual->length() > 0 ) {
+		code.append( IN_REF_FROM_QUAL_REF );
+		code.appendHalf( pushCount );
+	}
+	else if ( lookup.objField->typeRef->iterDef != 0 ) {
 		code.append( lookup.objField->typeRef->iterDef->inRefFromCur );
 		code.appendHalf( lookup.objField->offset );
 	}
@@ -717,16 +796,45 @@ ObjField **LangVarRef::evaluateArgs( ParseData *pd, CodeVect &code,
 
 	/* Evaluate and push the args. */
 	if ( args != 0 ) {
-		/* If we have the parameter list, initialize an iterator. */
+		/* We use this only if there is a paramter list. */
 		ParameterList::Iter p;
+		long pushCount = 0;
+
+		/* First pass we need to push object loads for reference parameters. */
 		paramList != 0 && ( p = *paramList );
+		for ( ExprVect::Iter pe = *args; pe.lte(); pe++ ) {
+			/* Get the expression and the UT for the arg. */
+			LangExpr *expression = *pe;
+			UniqueType *paramUT = lookup.objMethod->paramUTs[pe.pos()];
 
+			if ( paramUT->typeId == TYPE_REF ) {
+				/* Make sure we are dealing with a variable reference. */
+				if ( expression->type != LangExpr::TermType )
+					error(loc) << "not a term: argument must be a local variable" << endp;
+				if ( expression->term->type != LangTerm::VarRefType )
+					error(loc) << "not a variable: argument must be a local variable" << endp;
+
+				/* Lookup the field. */
+				LangVarRef *varRef = expression->term->varRef;
+
+				ObjField *refOf = varRef->preEvaluateRef( pd, code );
+				paramRefs[pe.pos()] = refOf;
+
+				pushCount += varRef->qual->length() * 2;
+			}
+
+			/* Advance the parameter list iterator if we have it. */
+			paramList != 0 && p.increment();
+		}
+
+		paramList != 0 && ( p = *paramList );
 		for ( ExprVect::Iter pe = *args; pe.lte(); pe++ ) {
 			/* Get the expression and the UT for the arg. */
 			LangExpr *expression = *pe;
 			UniqueType *paramUT = lookup.objMethod->paramUTs[pe.pos()];
 
 			if ( paramUT->typeId == TYPE_REF ) {
+				
 				/* Make sure we are dealing with a variable reference. */
 				if ( expression->type != LangExpr::TermType )
 					error(loc) << "not a term: argument must be a local variable" << endp;
@@ -736,14 +844,20 @@ ObjField **LangVarRef::evaluateArgs( ParseData *pd, CodeVect &code,
 				/* Lookup the field. */
 				LangVarRef *varRef = expression->term->varRef;
 
-				ObjField *refOf = varRef->evaluateRef( pd, code );
+				pushCount -= varRef->qual->length() * 2;
+
+				ObjField *refOf = varRef->evaluateRef( pd, code, pushCount );
 				paramRefs[pe.pos()] = refOf;
+
+				pushCount += 2;
 			}
 			else {
 				UniqueType *exprUT = expression->evaluate( pd, code );
 
 				if ( !castAssignment( pd, code, paramUT, 0, exprUT ) )
 					error(loc) << "arg " << pe.pos()+1 << " is of the wrong type" << endp;
+
+				pushCount += 1;
 			}
 
 			/* Advance the parameter list iterator if we have it. */
@@ -1667,7 +1781,7 @@ void LangStmt::compile( ParseData *pd, CodeVect &code ) const
 		}
 		case YieldType: {
 			/* take a reference and yield it. Immediately reset the referece. */
-			ObjField *objField = varRef->evaluateRef( pd, code );
+			ObjField *objField = varRef->evaluateRef( pd, code, 0 );
 			objField->refActive = false;
 			code.append( IN_YIELD );
 			break;
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 08773cce..c34ed104 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1343,6 +1343,7 @@ struct LangVarRef
 	void loadGlobalObj( ParseData *pd, CodeVect &code, 
 			int lastPtrInQual, bool forWriting ) const;
 	void loadObj( ParseData *pd, CodeVect &code, int lastPtrInQual, bool forWriting ) const;
+	void canTakeRef( ParseData *pd, VarRefLookup &lookup ) const;
 
 	void setFieldIter( ParseData *pd, CodeVect &code, 
 			ObjectDef *inObject, UniqueType *objUT, UniqueType *exprType, bool revert ) const;
@@ -1357,8 +1358,10 @@ struct LangVarRef
 	void callOperation( ParseData *pd, CodeVect &code, VarRefLookup &lookup ) const;
 	UniqueType *evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args ) const;
 	UniqueType *evaluate( ParseData *pd, CodeVect &code, bool forWriting = false ) const;
-	ObjField *evaluateRef( ParseData *pd, CodeVect &code ) const;
+	ObjField *evaluateRef( ParseData *pd, CodeVect &code, long pushCount ) const;
+	ObjField *preEvaluateRef( ParseData *pd, CodeVect &code ) const;
 	void resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs ) const;
+	long loadQualificationRefs( ParseData *pd, CodeVect &code ) const;
 
 	InputLoc loc;
 	QualItemVect *qual;
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 45ac50a6..476585ce 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -525,7 +525,7 @@ rec_call:
 		if ( vm_ptop() != root ) {
 			objectLength = lelInfo[((Kid*)vm_top())->tree->id].objectLength;
 			if ( kidNum < objectLength )
-				cout << " attr=" << kidNum;
+				cout << " an=\"" << kidNum << '"';
 		}
 
 		objectLength = lelInfo[kid->tree->id].objectLength;
-- 
cgit v1.2.1


From f889618be5404ca0a33feeec6812a8a48795d4b3 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 7 Feb 2009 04:58:41 +0000
Subject: REF_FROM_QUAL_REF needs to fetch the field. After a call with
 reference args that have qualifications returns, we need to pop the
 qualification references.

---
 colm/bytecode.cpp | 23 ++++++++++++++++++++---
 colm/bytecode.h   |  5 +++++
 colm/compile.cpp  | 32 +++++++++++++++++++++++++++++++-
 colm/parsetree.h  |  2 ++
 colm/tree.cpp     | 13 +++++++++++++
 5 files changed, 71 insertions(+), 4 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 985fc16e..283a3b9b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -1200,6 +1200,17 @@ again:
 			tree_downref( prg, sp, val );
 			break;
 		}
+		case IN_POP_N_WORDS: {
+			short n;
+			read_half( n );
+
+			#ifdef COLM_LOG_BYTECODE
+			cerr << "IN_POP_N_WORDS " << n << endl;
+			#endif
+
+			popn( n );
+			break;
+		}
 		case IN_STR_ATOI: {
 			#ifdef COLM_LOG_BYTECODE
 			cerr << "IN_STR_ATOI" << endl;
@@ -2030,16 +2041,22 @@ again:
 			break;
 		}
 		case IN_REF_FROM_QUAL_REF: {
+			short int back;
 			short int field;
+			read_half( back );
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_REF_FROM_QUAL_REF " << field << endl;
+			cerr << "IN_REF_FROM_QUAL_REF " << back << " " << field << endl;
 			#endif
 
-			Ref *ref = (Ref*)plocal(field);
+			Ref *ref = (Ref*)(sp + back);
+
+			Tree *obj = ref->kid->tree;
+			Kid *attr_kid = get_field_kid( obj, field );
+
 			push( (SW)ref );
-			push( (SW)ref->kid );
+			push( (SW)attr_kid );
 			break;
 		}
 		case IN_TRITER_REF_FROM_CUR: {
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 743b5221..52e4d216 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -72,6 +72,7 @@ typedef unsigned char uchar;
 #define IN_INIT_LOCALS           0x18
 #define IN_POP_LOCALS            0xb0
 #define IN_POP                   0x19
+#define IN_POP_N_WORDS           0xa2
 #define IN_DUP_TOP               0x1a
 #define IN_REJECT                0x1b
 #define IN_MATCH                 0x1c
@@ -350,6 +351,7 @@ Kid *alloc_attrs( Program *prg, long length );
 void free_attrs( Program *prg, Kid *attrs );
 void set_attr( Tree *tree, long pos, Tree *val );
 Tree *get_attr( Tree *tree, long pos );
+Kid *get_attr_kid( Tree *tree, long pos );
 
 /* Return the size of a type in words. */
 template<class T> int sizeof_in_words()
@@ -510,6 +512,9 @@ Tree *get_field_split( Program *prg, Tree *tree, Word field );
 Tree *get_rhs_el( Program *prg, Tree *lhs, long position );
 void set_field( Program *prg, Tree *tree, long field, Tree *value );
 
+/* For making references of attributes. */
+Kid *get_field_kid( Tree *tree, Word field );
+
 Tree *tree_iter_advance( Program *prg, Tree **&sp, TreeIter *iter );
 Tree *tree_iter_next_child( Program *prg, Tree **&sp, TreeIter *iter );
 Tree *tree_iter_prev_child( Program *prg, Tree **&sp, TreeIter *iter );
diff --git a/colm/compile.cpp b/colm/compile.cpp
index d9ef83f0..393b5814 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -372,6 +372,7 @@ long LangVarRef::loadQualificationRefs( ParseData *pd, CodeVect &code ) const
 		if ( qi.pos() > 0 ) {
 			code.append( IN_REF_FROM_QUAL_REF );
 			code.appendHalf( 0 );
+			code.appendHalf( el->offset );
 		}
 		else if ( el->typeRef->iterDef != 0 ) {
 			code.append( el->typeRef->iterDef->inRefFromCur );
@@ -761,6 +762,7 @@ ObjField *LangVarRef::evaluateRef( ParseData *pd, CodeVect &code, long pushCount
 	if ( qual->length() > 0 ) {
 		code.append( IN_REF_FROM_QUAL_REF );
 		code.appendHalf( pushCount );
+		code.appendHalf( lookup.objField->offset );
 	}
 	else if ( lookup.objField->typeRef->iterDef != 0 ) {
 		code.append( lookup.objField->typeRef->iterDef->inRefFromCur );
@@ -904,6 +906,32 @@ void LangVarRef::callOperation( ParseData *pd, CodeVect &code, VarRefLookup &loo
 		code.appendHalf( lookup.objMethod->funcId );
 }
 
+void LangVarRef::popPrePush( ParseData *pd, CodeVect &code, 
+		VarRefLookup &lookup, ExprVect *args ) const
+{
+	long popCount = 0;
+
+	/* Evaluate and push the args. */
+	if ( args != 0 ) {
+		/* We use this only if there is a paramter list. */
+		for ( ExprVect::Iter pe = *args; pe.lte(); pe++ ) {
+			/* Get the expression and the UT for the arg. */
+			LangExpr *expression = *pe;
+			UniqueType *paramUT = lookup.objMethod->paramUTs[pe.pos()];
+
+			if ( paramUT->typeId == TYPE_REF ) {
+				/* Lookup the field. */
+				LangVarRef *varRef = expression->term->varRef;
+				popCount += varRef->qual->length() * 2;
+			}
+		}
+		if ( popCount > 0 ) {
+			code.append( IN_POP_N_WORDS );
+			code.appendHalf( (short)popCount );
+		}
+	}
+}
+
 UniqueType *LangVarRef::evaluateCall( ParseData *pd, CodeVect &code, ExprVect *args ) const
 {
 	/* Evaluate the object. */
@@ -915,7 +943,9 @@ UniqueType *LangVarRef::evaluateCall( ParseData *pd, CodeVect &code, ExprVect *a
 	/* Write the call opcode. */
 	callOperation( pd, code, lookup );
 
-	resetActiveRefs( pd, lookup, paramRefs );
+	popPrePush( pd, code, lookup, args );
+
+	resetActiveRefs( pd, lookup, paramRefs);
 	delete[] paramRefs;
 
 	/* Return the type to the expression. */
diff --git a/colm/parsetree.h b/colm/parsetree.h
index c34ed104..db38462b 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1362,6 +1362,8 @@ struct LangVarRef
 	ObjField *preEvaluateRef( ParseData *pd, CodeVect &code ) const;
 	void resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs ) const;
 	long loadQualificationRefs( ParseData *pd, CodeVect &code ) const;
+	void popPrePush( ParseData *pd, CodeVect &code, 
+			VarRefLookup &lookup, ExprVect *args ) const;
 
 	InputLoc loc;
 	QualItemVect *qual;
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 476585ce..e79e569d 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -68,6 +68,14 @@ Tree *get_attr( Tree *tree, long pos )
 	return cur->tree;
 }
 
+Kid *get_attr_kid( Tree *tree, long pos )
+{
+	Kid *cur = tree->child;
+	for ( long i = 0; i < pos; i++ )
+		cur = cur->next;
+	return cur;
+}
+
 Kid *copy_obj_data( Program *prg, long length, Kid *src )
 {
 	Kid *cur = 0;
@@ -1010,6 +1018,11 @@ Tree *get_field( Tree *tree, Word field )
 	return get_attr( tree, field );
 }
 
+Kid *get_field_kid( Tree *tree, Word field )
+{
+	return get_attr_kid( tree, field );
+}
+
 Tree *get_field_split( Program *prg, Tree *tree, Word field )
 {
 	Tree *val = get_attr( tree, field );
-- 
cgit v1.2.1


From 9b628d70a28e51fad7cfff853e14b8a442895e21 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 7 Feb 2009 14:44:20 +0000
Subject: Need to pop the reference param qualifications after destroying the
 iterator context.

---
 colm/compile.cpp | 8 ++++++--
 colm/parsetree.h | 2 +-
 2 files changed, 7 insertions(+), 3 deletions(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index 393b5814..c61e9faf 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -906,7 +906,7 @@ void LangVarRef::callOperation( ParseData *pd, CodeVect &code, VarRefLookup &loo
 		code.appendHalf( lookup.objMethod->funcId );
 }
 
-void LangVarRef::popPrePush( ParseData *pd, CodeVect &code, 
+void LangVarRef::popRefQuals( ParseData *pd, CodeVect &code, 
 		VarRefLookup &lookup, ExprVect *args ) const
 {
 	long popCount = 0;
@@ -943,7 +943,7 @@ UniqueType *LangVarRef::evaluateCall( ParseData *pd, CodeVect &code, ExprVect *a
 	/* Write the call opcode. */
 	callOperation( pd, code, lookup );
 
-	popPrePush( pd, code, lookup, args );
+	popRefQuals( pd, code, lookup, args );
 
 	resetActiveRefs( pd, lookup, paramRefs);
 	delete[] paramRefs;
@@ -1565,6 +1565,8 @@ void LangStmt::compileForIterBody( ParseData *pd,
 	/* Destroy the iterator. */
 	code.append( iterUT->iterDef->inDestroy );
 	code.appendHalf( objField->offset );
+
+	/* Clean up any prepush args. */
 }
 
 LangTerm *LangStmt::chooseDefaultIter( ParseData *pd, LangTerm *fromVarRef ) const
@@ -1655,6 +1657,8 @@ void LangStmt::compileForIter( ParseData *pd, CodeVect &code ) const
 
 	compileForIterBody( pd, code, iterUT );
 
+	iterCallTerm->varRef->popRefQuals( pd, code, lookup, iterCallTerm->args );
+
 	iterCallTerm->varRef->resetActiveRefs( pd, lookup, paramRefs );
 	delete[] paramRefs;
 }
diff --git a/colm/parsetree.h b/colm/parsetree.h
index db38462b..96449c43 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1362,7 +1362,7 @@ struct LangVarRef
 	ObjField *preEvaluateRef( ParseData *pd, CodeVect &code ) const;
 	void resetActiveRefs( ParseData *pd, VarRefLookup &lookup, ObjField **paramRefs ) const;
 	long loadQualificationRefs( ParseData *pd, CodeVect &code ) const;
-	void popPrePush( ParseData *pd, CodeVect &code, 
+	void popRefQuals( ParseData *pd, CodeVect &code, 
 			VarRefLookup &lookup, ExprVect *args ) const;
 
 	InputLoc loc;
-- 
cgit v1.2.1


From 8f244d290f3df474ac8da7289d0f184e860f9c69 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 7 Feb 2009 15:03:09 +0000
Subject: Can use qualifications in yield statements.

---
 colm/compile.cpp | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index c61e9faf..aab44efc 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1815,9 +1815,16 @@ void LangStmt::compile( ParseData *pd, CodeVect &code ) const
 		}
 		case YieldType: {
 			/* take a reference and yield it. Immediately reset the referece. */
+			varRef->preEvaluateRef( pd, code );
 			ObjField *objField = varRef->evaluateRef( pd, code, 0 );
-			objField->refActive = false;
 			code.append( IN_YIELD );
+
+			if ( varRef->qual->length() > 0 ) {
+				code.append( IN_POP_N_WORDS );
+				code.appendHalf( (short)(varRef->qual->length()*2) );
+			}
+
+			objField->refActive = false;
 			break;
 		}
 	}
-- 
cgit v1.2.1


From 3f21e5c2e1a425e164bfd368a410faabf3a62680 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 7 Feb 2009 16:00:17 +0000
Subject: Reorganized the src variables. All sources are now a combination of
 RUNTIME and COLM. Prep for making production and debug runtime libs.

---
 colm/Makefile.in | 34 +++++++++++++++++++---------------
 1 file changed, 19 insertions(+), 15 deletions(-)

diff --git a/colm/Makefile.in b/colm/Makefile.in
index 11616d65..435dd3eb 100644
--- a/colm/Makefile.in
+++ b/colm/Makefile.in
@@ -18,6 +18,13 @@
 #   along with Colm; if not, write to the Free Software
 #   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 
+
+# Logging:
+# colm: rt on/off
+# rt_prd: off
+# rt_db: on
+# rt_clm: rt on/off
+
 INCS += -I../aapl
 DEFS +=
 
@@ -25,13 +32,8 @@ CFLAGS += -g -Wall -Wwrite-strings
 LDFLAGS +=
 
 # Frequently changed ones first.
-CC_SRCS = \
+COLM_SRC = \
 	compile.cpp \
-	bytecode.cpp \
-	tree.cpp \
-	fsmrun.cpp \
-	pdarun.cpp \
-	input.cpp \
 	lmparse.cpp \
 	lmscan.cpp \
 	parsetree.cpp \
@@ -48,9 +50,6 @@ CC_SRCS = \
 	redfsm.cpp \
 	fsmexec.cpp \
 	main.cpp \
-	list.cpp \
-	map.cpp \
-	string.cpp \
 	redbuild.cpp \
 	closure.cpp \
 	fsmap.cpp \
@@ -59,6 +58,10 @@ CC_SRCS = \
 
 RUNTIME_SRC = fsmrun.cpp pdarun.cpp bytecode.cpp list.cpp \
 	map.cpp string.cpp input.cpp tree.cpp
+
+ALL_SRC = $(COLM_SRC) $(RUNTIME_SRC)
+
+# Files in ALL_SRC that are generated.
 GEN_SRC = version.h lmscan.cpp lmparse.h lmparse.cpp 
 
 RUNTIME = runtime.a
@@ -78,18 +81,19 @@ BUILD_PARSERS = @BUILD_PARSERS@
 CXX = @CXX@
 
 # Get objects and dependencies from sources.
-OBJS = $(CC_SRCS:%.cpp=%.o)
+COLM_OBJ = $(COLM_SRC:%.cpp=%.o)
+RUNTIME_OBJ = $(RUNTIME_SRC:%.cpp=%.o)
+
 DEPS = $(CC_SRCS:%.cpp=.%.d)
-RUNTIME_OBJS = $(RUNTIME_SRC:%.cpp=%.o)
 
 # Rules.
 all: colm $(RUNTIME)
 
-colm: $(GEN_SRC) $(OBJS) $(LIBS)
-	$(CXX) $(LDFLAGS) -o $@ $(OBJS) $(LIBS)
+colm: $(GEN_SRC) $(COLM_OBJ) $(RUNTIME_OBJ) $(LIBS)
+	$(CXX) $(LDFLAGS) -o $@ $(COLM_OBJ) $(RUNTIME_OBJ) $(LIBS)
 
-$(RUNTIME): $(RUNTIME_OBJS)
-	ar -cr $@ $(RUNTIME_OBJS)
+$(RUNTIME): $(RUNTIME_OBJ)
+	ar -cr $@ $(RUNTIME_OBJ)
 
 version.h: ../version.mk
 	echo '#define VERSION "$(VERSION)"' > version.h
-- 
cgit v1.2.1


From fa95840873220d4d1b5f80bb6cb8d06e8e3cea59 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 7 Feb 2009 17:11:53 +0000
Subject: In the colm-only code guard log statements with a runtime flag. In
 the runtime code guard it with an ifdef and a runtime flag.

---
 colm/bytecode.cpp  | 634 ++++++++++++++++++++++++++++++++++++++++-------------
 colm/config.h.in   |   6 +
 colm/fsmap.cpp     |  13 +-
 colm/fsmgraph.cpp  |  20 +-
 colm/fsmrun.cpp    | 124 +++++++----
 colm/lmparse.kl    |   6 +-
 colm/main.cpp      |  12 +-
 colm/parsedata.cpp |  24 +-
 colm/pdabuild.cpp  |  14 +-
 colm/pdarun.cpp    |  86 +++++---
 colm/tree.cpp      |  36 ++-
 11 files changed, 703 insertions(+), 272 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 283a3b9b..25d4d38b 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -77,6 +77,12 @@ using std::endl;
 	i |= ((Word) *instr++) << 8; \
 } while(0)
 
+int colm_log_bytecode = 1;
+int colm_log_parse = 1;
+int colm_log_match = 1;
+int colm_log_compile = 1;
+int colm_log_conds = 1;
+
 Tree *prep_parse_tree( Program *prg, Tree **sp, Tree *tree )
 {
 	/* If the tree was produced by a parsing function then we need to send a
@@ -84,7 +90,9 @@ Tree *prep_parse_tree( Program *prg, Tree **sp, Tree *tree )
 	 * parsing algorithm data. */
 	if ( !(tree->flags & AF_PARSE_TREE) || tree->flags & AF_PARSED ) {
 		#ifdef COLM_LOG_BYTECODE
-		cerr << "copying tree in send function" << endl;
+		if ( colm_log_bytecode ) {
+			cerr << "copying tree in send function" << endl;
+		}
 		#endif
 		Kid *unused = 0;
 		Tree *newTree = copy_real_tree( prg, tree, 0, unused, true );
@@ -199,7 +207,9 @@ void downref_local_trees( Program *prg, Tree **sp, Tree **frame, char *trees, lo
 {
 	for ( long i = 0; i < treesLen; i++ ) {
 		#ifdef COLM_LOG_BYTECODE
-		cerr << "local tree downref: " << (long)trees[i] << endl;
+		if ( colm_log_bytecode ) {
+			cerr << "local tree downref: " << (long)trees[i] << endl;
+		}
 		#endif
 
 		tree_downref( prg, sp, local((long)trees[i]) );
@@ -295,7 +305,9 @@ void Program::clearGlobal( Tree **sp )
 void Program::clear( Tree **vm_stack, Tree **sp )
 {
 	#ifdef COLM_LOG_BYTECODE
-	cerr << "clearing the prg" << endl;
+	if ( colm_log_bytecode ) {
+		cerr << "clearing the prg" << endl;
+	}
 	#endif
 
 	clearGlobal( sp );
@@ -395,7 +407,9 @@ void Program::run()
 
 		/* Pull out the reverse code and free it. */
 		#ifdef COLM_LOG_BYTECODE
-		cerr << "freeing the root reverse code" << endl;
+		if ( colm_log_bytecode ) {
+			cerr << "freeing the root reverse code" << endl;
+		}
 		#endif
 
 		/* The root code should all be commit code and reverseCode
@@ -454,7 +468,9 @@ again:
 			Tree *lhs;
 			read_tree( lhs );
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_RESTORE_LHS" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_RESTORE_LHS" << endl;
+			}
 			#endif
 			tree_downref( prg, sp, lhs );
 			break;
@@ -469,7 +485,9 @@ again:
 			read_word( wrev );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PARSE_BKT " << parserId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PARSE_BKT " << parserId << endl;
+			}
 			#endif
 
 			rcode_downref_all( prg, sp, (CodeVect*)wrev );
@@ -484,7 +502,9 @@ again:
 			read_tree( str );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STREAM_PULL_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STREAM_PULL_BKT" << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, stream );
@@ -498,7 +518,9 @@ again:
 			read_word( len );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STREAM_PUSH_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STREAM_PUSH_BKT" << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, stream );
@@ -506,7 +528,9 @@ again:
 		}
 		case IN_LOAD_GLOBAL_BKT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_GLOBAL_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_GLOBAL_BKT" << endl;
+			}
 			#endif
 			break;
 		}
@@ -515,7 +539,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_FIELD_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_FIELD_BKT " << field << endl;
+			}
 			#endif
 			break;
 		}
@@ -526,7 +552,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_FIELD_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_FIELD_BKT " << field << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, val );
@@ -537,7 +565,9 @@ again:
 			read_tree( ptr );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PTR_DEREF_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PTR_DEREF_BKT" << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, ptr );
@@ -548,7 +578,9 @@ again:
 			read_word( oldval );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_TOKEN_DATA_BKT " << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_TOKEN_DATA_BKT " << endl;
+			}
 			#endif
 
 			Head *head = (Head*)oldval;
@@ -557,7 +589,9 @@ again:
 		}
 		case IN_LIST_APPEND_BKT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_APPEND_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_APPEND_BKT" << endl;
+			}
 			#endif
 			break;
 		}
@@ -566,7 +600,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_REMOVE_END_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_REMOVE_END_BKT" << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, val );
@@ -577,7 +613,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LIST_MEM_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LIST_MEM_BKT " << field << endl;
+			}
 			#endif
 			break;
 		}
@@ -588,7 +626,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_LIST_MEM_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_LIST_MEM_BKT " << field << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, val );
@@ -601,7 +641,9 @@ again:
 			read_tree( key );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_INSERT_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_INSERT_BKT" << endl;
+			}
 			#endif
 			
 			tree_downref( prg, sp, key );
@@ -613,7 +655,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_STORE_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_STORE_BKT" << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, key );
@@ -626,7 +670,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_REMOVE_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_REMOVE_BKT" << endl;
+			}
 			#endif
 
 			tree_downref( prg, sp, key );
@@ -722,7 +768,9 @@ again:
 	switch ( *instr++ ) {
 		case IN_SAVE_LHS: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SAVE_LHS" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SAVE_LHS" << endl;
+			}
 			#endif
 
 			assert( lhs != 0 );
@@ -740,7 +788,9 @@ again:
 			read_tree( restore );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_RESTORE_LHS" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_RESTORE_LHS" << endl;
+			}
 			#endif
 			assert( lhs == 0 );
 			lhs = restore;
@@ -748,7 +798,9 @@ again:
 		}
 		case IN_LOAD_NIL: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_NIL" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_NIL" << endl;
+			}
 			#endif
 
 			push( 0 );
@@ -756,7 +808,9 @@ again:
 		}
 		case IN_LOAD_TRUE: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_TRUE" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_TRUE" << endl;
+			}
 			#endif
 
 			tree_upref( prg->trueVal );
@@ -765,7 +819,9 @@ again:
 		}
 		case IN_LOAD_FALSE: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_FALSE" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_FALSE" << endl;
+			}
 			#endif
 
 			tree_upref( prg->falseVal );
@@ -777,7 +833,9 @@ again:
 			read_word( i );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_INT " << i << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_INT " << i << endl;
+			}
 			#endif
 
 			Tree *tree = construct_integer( prg, i );
@@ -790,7 +848,9 @@ again:
 			read_word( offset );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_STR " << offset << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_STR " << offset << endl;
+			}
 			#endif
 
 			Head *lit = make_literal( prg, offset );
@@ -801,7 +861,9 @@ again:
 		}
 		case IN_PRINT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PRINT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PRINT" << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -811,7 +873,9 @@ again:
 		}
 		case IN_PRINT_XML: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PRINT_XML" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PRINT_XML" << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -821,7 +885,9 @@ again:
 		}
 		case IN_LOAD_GLOBAL_R: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_GLOBAL_R" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_GLOBAL_R" << endl;
+			}
 			#endif
 
 			tree_upref( prg->global );
@@ -830,7 +896,9 @@ again:
 		}
 		case IN_LOAD_GLOBAL_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_GLOBAL_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_GLOBAL_WV" << endl;
+			}
 			#endif
 
 			tree_upref( prg->global );
@@ -843,7 +911,9 @@ again:
 		}
 		case IN_LOAD_GLOBAL_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_GLOBAL_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_GLOBAL_WC" << endl;
+			}
 			#endif
 
 			/* This is identical to the _R version, but using it for writing
@@ -854,7 +924,9 @@ again:
 		}
 		case IN_LOAD_GLOBAL_BKT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LOAD_GLOBAL_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LOAD_GLOBAL_BKT" << endl;
+			}
 			#endif
 
 			tree_upref( prg->global );
@@ -868,7 +940,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_INIT_RHS_EL " << position << " " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_INIT_RHS_EL " << position << " " << field << endl;
+			}
 			#endif
 
 			Tree *val = get_rhs_el( prg, lhs, position );
@@ -881,7 +955,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_ADVANCE " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_ADVANCE " << field << endl;
+			}
 			#endif
 
 			/* Get the iterator. */
@@ -903,7 +979,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_GET_CUR_R " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_GET_CUR_R " << field << endl;
+			}
 			#endif
 
 			UserIter *uiter = (UserIter*) local(field);
@@ -917,7 +995,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_GET_CUR_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_GET_CUR_WC " << field << endl;
+			}
 			#endif
 
 			UserIter *uiter = (UserIter*) local(field);
@@ -932,7 +1012,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_SET_CUR_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_SET_CUR_WC " << field << endl;
+			}
 			#endif
 
 			Tree *t = pop();
@@ -948,7 +1030,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LOCAL_R " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LOCAL_R " << field << endl;
+			}
 			#endif
 
 			Tree *val = local(field);
@@ -961,7 +1045,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LOCAL_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LOCAL_WC " << field << endl;
+			}
 			#endif
 
 			Tree *split = get_local_split( prg, frame, field );
@@ -974,7 +1060,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_LOCAL_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_LOCAL_WC " << field << endl;
+			}
 			#endif
 
 			Tree *val = pop();
@@ -984,7 +1072,9 @@ again:
 		}
 		case IN_SAVE_RET: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SAVE_RET " << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SAVE_RET " << endl;
+			}
 			#endif
 
 			Tree *val = pop();
@@ -996,7 +1086,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LOCAL_REF_R " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LOCAL_REF_R " << field << endl;
+			}
 			#endif
 
 			Ref *ref = (Ref*) plocal(field);
@@ -1010,7 +1102,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LOCAL_REF_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LOCAL_REF_WC " << field << endl;
+			}
 			#endif
 
 			Ref *ref = (Ref*) plocal(field);
@@ -1025,7 +1119,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_LOCAL_REF_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_LOCAL_REF_WC " << field << endl;
+			}
 			#endif
 
 			Tree *val = pop();
@@ -1039,7 +1135,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_FIELD_R " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_FIELD_R " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -1055,7 +1153,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_FIELD_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_FIELD_WC " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -1071,7 +1171,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_FIELD_WV " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_FIELD_WV " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -1092,7 +1194,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_FIELD_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_FIELD_BKT " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -1108,7 +1212,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_FIELD_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_FIELD_WC " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -1127,7 +1233,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_FIELD_WV " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_FIELD_WV " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -1154,7 +1262,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_FIELD_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_FIELD_BKT " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -1172,7 +1282,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_FIELD_LEAVE_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_FIELD_LEAVE_WC " << field << endl;
+			}
 			#endif
 
 			/* Note that we don't downref the object here because we are
@@ -1193,7 +1305,9 @@ again:
 		}
 		case IN_POP: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_POP" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_POP" << endl;
+			}
 			#endif
 
 			Tree *val = pop();
@@ -1205,7 +1319,9 @@ again:
 			read_half( n );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_POP_N_WORDS " << n << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_POP_N_WORDS " << n << endl;
+			}
 			#endif
 
 			popn( n );
@@ -1213,7 +1329,9 @@ again:
 		}
 		case IN_STR_ATOI: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STR_ATOI" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STR_ATOI" << endl;
+			}
 			#endif
 
 			Str *str = (Str*)pop();
@@ -1226,7 +1344,9 @@ again:
 		}
 		case IN_INT_TO_STR: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_INT_TO_STR" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_INT_TO_STR" << endl;
+			}
 			#endif
 
 			Int *i = (Int*)pop();
@@ -1239,7 +1359,9 @@ again:
 		}
 		case IN_CONCAT_STR: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CONCAT_STR" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_CONCAT_STR" << endl;
+			}
 			#endif
 
 			Str *s2 = (Str*)pop();
@@ -1254,7 +1376,9 @@ again:
 		}
 		case IN_STR_UORD8: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STR_UORD8" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STR_UORD8" << endl;
+			}
 			#endif
 
 			Str *str = (Str*)pop();
@@ -1267,7 +1391,9 @@ again:
 		}
 		case IN_STR_UORD16: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STR_UORD16" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STR_UORD16" << endl;
+			}
 			#endif
 
 			Str *str = (Str*)pop();
@@ -1281,7 +1407,9 @@ again:
 
 		case IN_STR_LENGTH: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STR_LENGTH" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STR_LENGTH" << endl;
+			}
 			#endif
 
 			Str *str = (Str*)pop();
@@ -1297,7 +1425,9 @@ again:
 			read_half( dist );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_JMP_FALSE " << dist << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_JMP_FALSE " << dist << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1311,7 +1441,9 @@ again:
 			read_half( dist );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_JMP_TRUE " << dist << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_JMP_TRUE " << dist << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1325,7 +1457,9 @@ again:
 			read_half( dist );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_JMP " << dist << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_JMP " << dist << endl;
+			}
 			#endif
 
 			instr += dist;
@@ -1333,7 +1467,9 @@ again:
 		}
 		case IN_REJECT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_REJECT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_REJECT" << endl;
+			}
 			#endif
 			reject = true;
 			break;
@@ -1344,7 +1480,9 @@ again:
 		 */
 		case IN_TST_EQL: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_EQL" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_EQL" << endl;
+			}
 			#endif
 
 			Tree *o2 = pop();
@@ -1359,7 +1497,9 @@ again:
 		}
 		case IN_TST_NOT_EQL: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_NOT_EQL" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_NOT_EQL" << endl;
+			}
 			#endif
 
 			Tree *o2 = pop();
@@ -1374,7 +1514,9 @@ again:
 		}
 		case IN_TST_LESS: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_LESS" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_LESS" << endl;
+			}
 			#endif
 
 			Tree *o2 = pop();
@@ -1389,7 +1531,9 @@ again:
 		}
 		case IN_TST_LESS_EQL: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_LESS_EQL" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_LESS_EQL" << endl;
+			}
 			#endif
 
 			Tree *o2 = pop();
@@ -1403,7 +1547,9 @@ again:
 		}
 		case IN_TST_GRTR: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_GRTR" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_GRTR" << endl;
+			}
 			#endif
 
 			Tree *o2 = pop();
@@ -1418,7 +1564,9 @@ again:
 		}
 		case IN_TST_GRTR_EQL: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_GRTR_EQL" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_GRTR_EQL" << endl;
+			}
 			#endif
 
 			Tree *o2 = (Tree*)pop();
@@ -1433,7 +1581,9 @@ again:
 		}
 		case IN_TST_LOGICAL_AND: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_LOGICAL_AND" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_LOGICAL_AND" << endl;
+			}
 			#endif
 
 			Tree *o2 = pop();
@@ -1450,7 +1600,9 @@ again:
 		}
 		case IN_TST_LOGICAL_OR: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TST_LOGICAL_OR" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TST_LOGICAL_OR" << endl;
+			}
 			#endif
 
 			Tree *o2 = pop();
@@ -1467,7 +1619,9 @@ again:
 		}
 		case IN_NOT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_NOT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_NOT" << endl;
+			}
 			#endif
 
 			Tree *tree = (Tree*)pop();
@@ -1481,7 +1635,9 @@ again:
 
 		case IN_ADD_INT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_ADD_INT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_ADD_INT" << endl;
+			}
 			#endif
 
 			Int *o2 = (Int*)pop();
@@ -1496,7 +1652,9 @@ again:
 		}
 		case IN_MULT_INT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MULT_INT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MULT_INT" << endl;
+			}
 			#endif
 
 			Int *o2 = (Int*)pop();
@@ -1511,7 +1669,9 @@ again:
 		}
 		case IN_SUB_INT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SUB_INT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SUB_INT" << endl;
+			}
 			#endif
 
 			Int *o2 = (Int*)pop();
@@ -1526,7 +1686,9 @@ again:
 		}
 		case IN_DUP_TOP: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_DUP_TOP" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_DUP_TOP" << endl;
+			}
 			#endif
 
 			Tree *val = top();
@@ -1541,7 +1703,9 @@ again:
 			read_half( searchTypeId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_FROM_REF " << field << " " << searchTypeId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_FROM_REF " << field << " " << searchTypeId << endl;
+			}
 			#endif
 
 			Ref rootRef;
@@ -1556,7 +1720,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_DESTROY " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_DESTROY " << field << endl;
+			}
 			#endif
 
 			TreeIter *iter = (TreeIter*) plocal(field);
@@ -1568,7 +1734,9 @@ again:
 			read_word( id );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TREE_SEARCH " << id << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TREE_SEARCH " << id << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1583,7 +1751,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_ADVANCE " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_ADVANCE " << field << endl;
+			}
 			#endif
 
 			TreeIter *iter = (TreeIter*) plocal(field);
@@ -1597,7 +1767,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_NEXT_CHILD " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_NEXT_CHILD " << field << endl;
+			}
 			#endif
 
 			TreeIter *iter = (TreeIter*) plocal(field);
@@ -1611,7 +1783,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_PREV_CHILD " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_PREV_CHILD " << field << endl;
+			}
 			#endif
 
 			TreeIter *iter = (TreeIter*) plocal(field);
@@ -1625,7 +1799,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_GET_CUR_R " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_GET_CUR_R " << field << endl;
+			}
 			#endif
 			
 			TreeIter *iter = (TreeIter*) plocal(field);
@@ -1639,7 +1815,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_GET_CUR_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_GET_CUR_WC " << field << endl;
+			}
 			#endif
 			
 			TreeIter *iter = (TreeIter*) plocal(field);
@@ -1654,7 +1832,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_SET_CUR_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_SET_CUR_WC " << field << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1670,7 +1850,9 @@ again:
 			read_half( patternId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MATCH " << patternId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MATCH " << patternId << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1698,7 +1880,9 @@ again:
 			}
 
 			#ifdef COLM_LOG_MATCH
-			cerr << "match result: " << matched << endl;
+			if ( colm_log_match ) {
+				cerr << "match result: " << matched << endl;
+			}
 			#endif
 
 			Tree *result = matched ? tree : 0;
@@ -1718,7 +1902,9 @@ again:
 			read_half( stopId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PARSE_WV " << parserId << " " << stopId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PARSE_WV " << parserId << " " << stopId << endl;
+			}
 			#endif
 
 			/* Comes back from parse upreffed. */
@@ -1743,7 +1929,9 @@ again:
 			read_half( stopId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PARSE_WC " << parserId << " " << stopId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PARSE_WC " << parserId << " " << stopId << endl;
+			}
 			#endif
 
 			/* Comes back from parse upreffed. */
@@ -1757,7 +1945,9 @@ again:
 		}
 		case IN_STREAM_PULL: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STREAM_PULL" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STREAM_PULL" << endl;
+			}
 			#endif
 			Tree *len = pop();
 			Tree *stream = pop();
@@ -1781,7 +1971,9 @@ again:
 			read_tree( string );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STREAM_PULL_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STREAM_PULL_BKT" << endl;
+			}
 			#endif
 
 			undo_pull( prg, (Stream*)stream, string );
@@ -1793,7 +1985,9 @@ again:
 			/* FIXME: Need to check the refcounting here. */
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STREAM_PUSH" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STREAM_PUSH" << endl;
+			}
 			#endif
 			Tree *tree = pop();
 			Tree *stream = pop();
@@ -1817,7 +2011,9 @@ again:
 			read_word( len );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STREAM_PUSH_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STREAM_PUSH_BKT" << endl;
+			}
 			#endif
 
 			undo_stream_push( sp, prg, (Stream*)stream, len );
@@ -1834,7 +2030,9 @@ again:
 			read_word( wrev );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PARSE_BKT " << parserId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PARSE_BKT " << parserId << endl;
+			}
 			#endif
 
 			undo_parse( sp, prg, (Stream*)stream, parserId, tree, (CodeVect*)wrev );
@@ -1847,7 +2045,9 @@ again:
 			read_half( patternId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CONSTRUCT " << patternId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_CONSTRUCT " << patternId << endl;
+			}
 			#endif
 
 			int rootNode = prg->rtd->patReplInfo[patternId].offset;
@@ -1882,7 +2082,9 @@ again:
 			read_half( tokenId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CONSTRUCT_TERM " << tokenId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_CONSTRUCT_TERM " << tokenId << endl;
+			}
 			#endif
 
 			/* Pop the string we are constructing the token from. */
@@ -1897,7 +2099,9 @@ again:
 			read_byte( nargs );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAKE_TOKEN " << (ulong) nargs << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAKE_TOKEN " << (ulong) nargs << endl;
+			}
 			#endif
 
 			Tree *result = make_token( sp, prg, nargs );
@@ -1911,7 +2115,9 @@ again:
 			read_byte( nargs );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAKE_TREE " << (ulong) nargs << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAKE_TREE " << (ulong) nargs << endl;
+			}
 			#endif
 
 			Tree *result = make_tree( sp, prg, nargs );
@@ -1922,7 +2128,9 @@ again:
 		}
 		case IN_SEND: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SEND" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SEND" << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1932,7 +2140,9 @@ again:
 		}
 		case IN_IGNORE: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_IGNORE" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_IGNORE" << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1942,7 +2152,9 @@ again:
 		}
 		case IN_TREE_NEW: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TREE_NEW " << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TREE_NEW " << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -1953,7 +2165,9 @@ again:
 		}
 		case IN_PTR_DEREF_R: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PTR_DEREF_R" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PTR_DEREF_R" << endl;
+			}
 			#endif
 
 			Pointer *ptr = (Pointer*)pop();
@@ -1966,7 +2180,9 @@ again:
 		}
 		case IN_PTR_DEREF_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PTR_DEREF_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PTR_DEREF_WC" << endl;
+			}
 			#endif
 
 			Pointer *ptr = (Pointer*)pop();
@@ -1979,7 +2195,9 @@ again:
 		}
 		case IN_PTR_DEREF_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PTR_DEREF_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PTR_DEREF_WV" << endl;
+			}
 			#endif
 
 			Pointer *ptr = (Pointer*)pop();
@@ -2001,7 +2219,9 @@ again:
 			read_word( p );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_PTR_DEREF_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PTR_DEREF_BKT" << endl;
+			}
 			#endif
 
 			Pointer *ptr = (Pointer*)p;
@@ -2018,7 +2238,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_REF_FROM_LOCAL " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_REF_FROM_LOCAL " << field << endl;
+			}
 			#endif
 
 			/* First push the null next pointer, then the kid pointer. */
@@ -2032,7 +2254,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_REF_FROM_REF " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_REF_FROM_REF " << field << endl;
+			}
 			#endif
 
 			Ref *ref = (Ref*)plocal(field);
@@ -2047,7 +2271,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_REF_FROM_QUAL_REF " << back << " " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_REF_FROM_QUAL_REF " << back << " " << field << endl;
+			}
 			#endif
 
 			Ref *ref = (Ref*)(sp + back);
@@ -2064,7 +2290,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_TRITER_REF_FROM_CUR " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_TRITER_REF_FROM_CUR " << field << endl;
+			}
 			#endif
 
 			/* Push the next pointer first, then the kid. */
@@ -2078,7 +2306,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_REF_FROM_CUR " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_REF_FROM_CUR " << field << endl;
+			}
 			#endif
 
 			/* Push the next pointer first, then the kid. */
@@ -2089,7 +2319,9 @@ again:
 		}
 		case IN_GET_TOKEN_DATA_R: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_TOKEN_DATA_R" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_TOKEN_DATA_R" << endl;
+			}
 			#endif
 
 			Tree *tree = (Tree*) pop();
@@ -2102,7 +2334,9 @@ again:
 		}
 		case IN_SET_TOKEN_DATA_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_TOKEN_DATA_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_TOKEN_DATA_WC" << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -2117,7 +2351,9 @@ again:
 		}
 		case IN_SET_TOKEN_DATA_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_TOKEN_DATA_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_TOKEN_DATA_WV" << endl;
+			}
 			#endif
 
 			Tree *tree = pop();
@@ -2139,7 +2375,9 @@ again:
 		}
 		case IN_SET_TOKEN_DATA_BKT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_TOKEN_DATA_BKT " << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_TOKEN_DATA_BKT " << endl;
+			}
 			#endif
 
 			Word oldval;
@@ -2154,7 +2392,9 @@ again:
 		}
 		case IN_GET_TOKEN_POS_R: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_TOKEN_POS_R" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_TOKEN_POS_R" << endl;
+			}
 			#endif
 
 			Tree *tree = (Tree*) pop();
@@ -2169,7 +2409,9 @@ again:
 		}
 		case IN_GET_MATCH_LENGTH_R: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_MATCH_LENGTH_R" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_MATCH_LENGTH_R" << endl;
+			}
 			#endif
 			Tree *integer = construct_integer( prg, string_length(matchText) );
 			tree_upref( integer );
@@ -2178,7 +2420,9 @@ again:
 		}
 		case IN_GET_MATCH_TEXT_R: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_MATCH_TEXT_R" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_MATCH_TEXT_R" << endl;
+			}
 			#endif
 			Head *s = string_copy( prg, matchText );
 			Tree *tree = construct_string( prg, s );
@@ -2188,7 +2432,9 @@ again:
 		}
 		case IN_LIST_LENGTH: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_LENGTH" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_LENGTH" << endl;
+			}
 			#endif
 
 			List *list = (List*) pop();
@@ -2200,7 +2446,9 @@ again:
 		}
 		case IN_LIST_APPEND_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_APPEND_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_APPEND_WV" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2221,7 +2469,9 @@ again:
 		}
 		case IN_LIST_APPEND_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_APPEND_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_APPEND_WC" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2236,7 +2486,9 @@ again:
 		}
 		case IN_LIST_APPEND_BKT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_APPEND_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_APPEND_BKT" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2248,7 +2500,9 @@ again:
 		}
 		case IN_LIST_REMOVE_END_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_REMOVE_END_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_REMOVE_END_WC" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2260,7 +2514,9 @@ again:
 		}
 		case IN_LIST_REMOVE_END_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_REMOVE_END_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_REMOVE_END_WV" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2281,7 +2537,9 @@ again:
 		}
 		case IN_LIST_REMOVE_END_BKT: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_LIST_REMOVE_END_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_LIST_REMOVE_END_BKT" << endl;
+			}
 			#endif
 
 			Tree *val;
@@ -2298,7 +2556,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LIST_MEM_R " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LIST_MEM_R " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2314,7 +2574,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LIST_MEM_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LIST_MEM_WC " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2330,7 +2592,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LIST_MEM_WV " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LIST_MEM_WV " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2351,7 +2615,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_LIST_MEM_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_LIST_MEM_BKT " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2367,7 +2633,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_LIST_MEM_WC " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_LIST_MEM_WC " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2383,7 +2651,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_LIST_MEM_WV " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_LIST_MEM_WV " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2408,7 +2678,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_SET_LIST_MEM_BKT " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_SET_LIST_MEM_BKT " << field << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2420,7 +2692,9 @@ again:
 		}
 		case IN_MAP_INSERT_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_INSERT_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_INSERT_WV" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2454,7 +2728,9 @@ again:
 		}
 		case IN_MAP_INSERT_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_INSERT_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_INSERT_WC" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2481,7 +2757,9 @@ again:
 			read_tree( key );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_INSERT_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_INSERT_BKT" << endl;
+			}
 			#endif
 			
 			Tree *obj = pop();
@@ -2497,7 +2775,9 @@ again:
 		}
 		case IN_MAP_STORE_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_STORE_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_STORE_WC" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2518,7 +2798,9 @@ again:
 		}
 		case IN_MAP_STORE_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_STORE_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_STORE_WV" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2553,7 +2835,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_STORE_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_STORE_BKT" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2569,7 +2853,9 @@ again:
 		}
 		case IN_MAP_REMOVE_WC: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_REMOVE_WC" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_REMOVE_WC" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2585,7 +2871,9 @@ again:
 		}
 		case IN_MAP_REMOVE_WV: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_REMOVE_WV" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_REMOVE_WV" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2612,7 +2900,9 @@ again:
 			read_tree( val );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_REMOVE_BKT" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_REMOVE_BKT" << endl;
+			}
 			#endif
 
 			/* Either both or neither. */
@@ -2627,7 +2917,9 @@ again:
 		}
 		case IN_MAP_LENGTH: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_LENGTH" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_LENGTH" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2641,7 +2933,9 @@ again:
 		}
 		case IN_MAP_FIND: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_MAP_FIND" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_MAP_FIND" << endl;
+			}
 			#endif
 
 			Tree *obj = pop();
@@ -2659,7 +2953,9 @@ again:
 			read_half( size );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_INIT_LOCALS " << size << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_INIT_LOCALS " << size << endl;
+			}
 			#endif
 
 			frame = ptop();
@@ -2673,7 +2969,9 @@ again:
 			read_half( size );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_POP_LOCALS " << frameId << " " << size << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_POP_LOCALS " << frameId << " " << size << endl;
+			}
 			#endif
 
 			FrameInfo *fi = &prg->rtd->frameInfo[frameId];
@@ -2688,7 +2986,9 @@ again:
 			FunctionInfo *fi = &prg->rtd->functionInfo[funcId];
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CALL_WV " << fi->name << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_CALL_WV " << fi->name << endl;
+			}
 			#endif
 
 			push( 0 ); /* Return value. */
@@ -2706,7 +3006,9 @@ again:
 			FunctionInfo *fi = &prg->rtd->functionInfo[funcId];
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_CALL_WC " << fi->name << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_CALL_WC " << fi->name << endl;
+			}
 			#endif
 
 			push( 0 ); /* Return value. */
@@ -2719,7 +3021,9 @@ again:
 		}
 		case IN_YIELD: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_YIELD" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_YIELD" << endl;
+			}
 			#endif
 
 			Kid *kid = (Kid*)pop();
@@ -2757,8 +3061,10 @@ again:
 			read_half( searchId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_CREATE_WV " << field << " " << 
-					funcId << " " << searchId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_CREATE_WV " << field << " " << 
+						funcId << " " << searchId << endl;
+			}
 			#endif
 
 			FunctionInfo *fi = prg->rtd->functionInfo + funcId;
@@ -2785,8 +3091,10 @@ again:
 			read_half( searchId );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_CREATE_WC " << field << " " << 
-					funcId << " " << searchId << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_CREATE_WC " << field << " " << 
+						funcId << " " << searchId << endl;
+			}
 			#endif
 
 			FunctionInfo *fi = prg->rtd->functionInfo + funcId;
@@ -2810,7 +3118,9 @@ again:
 			read_half( field );
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_UITER_DESTROY " << field << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_UITER_DESTROY " << field << endl;
+			}
 			#endif
 
 			UserIter *uiter = (UserIter*) local(field);
@@ -2824,7 +3134,9 @@ again:
 			FunctionInfo *fui = &prg->rtd->functionInfo[funcId];
 
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_RET " << fui->name << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_RET " << fui->name << endl;
+			}
 			#endif
 
 			FrameInfo *fi = &prg->rtd->frameInfo[fui->frameId];
@@ -2840,7 +3152,9 @@ again:
 		}
 		case IN_OPEN_FILE: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_OPEN_FILE" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_OPEN_FILE" << endl;
+			}
 			#endif
 
 			Tree *name = pop();
@@ -2852,7 +3166,9 @@ again:
 		}
 		case IN_GET_STDIN: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_GET_STDIN" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_GET_STDIN" << endl;
+			}
 			#endif
 
 			/* Pop the root object. */
@@ -2868,7 +3184,9 @@ again:
 		}
 		case IN_STOP: {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "IN_STOP" << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "IN_STOP" << endl;
+			}
 			#endif
 
 			cout.flush();
diff --git a/colm/config.h.in b/colm/config.h.in
index 98b87759..f9da39b1 100644
--- a/colm/config.h.in
+++ b/colm/config.h.in
@@ -37,5 +37,11 @@
 #define COLM_LOG_COMPILE 1
 #endif
 
+extern int colm_log_bytecode;
+extern int colm_log_parse;
+extern int colm_log_match;
+extern int colm_log_compile;
+extern int colm_log_conds;
+
 
 #endif /* _CONFIG_H */
diff --git a/colm/fsmap.cpp b/colm/fsmap.cpp
index bf190888..45e02f3e 100644
--- a/colm/fsmap.cpp
+++ b/colm/fsmap.cpp
@@ -808,7 +808,6 @@ bool FsmGraph::hasOutData( FsmState *state )
  * Setting Conditions.
  */
 
-
 void logNewExpansion( Expansion *exp );
 void logCondSpace( CondSpace *condSpace );
 
@@ -824,11 +823,13 @@ CondSpace *FsmGraph::addCondSpace( const CondSet &condSet )
 		condData->condSpaceMap.insert( condSpace );
 
 		#ifdef COLM_LOG_CONDS
-		cerr << "adding new condition space" << endl;
-		cerr << "  condition set: ";
-		logCondSpace( condSpace );
-		cerr << endl;
-		cerr << "  baseKey: " << baseKey.getVal() << endl;
+		if ( colm_log_conds ) {
+			cerr << "adding new condition space" << endl;
+			cerr << "  condition set: ";
+			logCondSpace( condSpace );
+			cerr << endl;
+			cerr << "  baseKey: " << baseKey.getVal() << endl;
+		}
 		#endif
 	}
 	return condSpace;
diff --git a/colm/fsmgraph.cpp b/colm/fsmgraph.cpp
index 9ea082f0..af643721 100644
--- a/colm/fsmgraph.cpp
+++ b/colm/fsmgraph.cpp
@@ -890,7 +890,7 @@ void FsmGraph::isolateStartState( )
 	setMisfitAccounting( false );
 }
 
-#ifdef COLM_LOG_CONDS
+#if COLM_LOG_CONDS
 void logCondSpace( CondSpace *condSpace )
 {
 	if ( condSpace == 0 )
@@ -948,7 +948,9 @@ void FsmGraph::findTransExpansions( ExpansionList &expansionList,
 				expansion->toValsList.append( targVals );
 
 			#ifdef COLM_LOG_CONDS
-			logNewExpansion( expansion );
+			if ( colm_log_conds ) {
+				logNewExpansion( expansion );
+			}
 			#endif
 			expansionList.append( expansion );
 		}
@@ -980,7 +982,9 @@ void FsmGraph::findCondExpInTrans( ExpansionList &expansionList, FsmState *state
 
 			expansionList.append( expansion );
 			#ifdef COLM_LOG_CONDS
-			logNewExpansion( expansion );
+			if ( colm_log_conds ) {
+				logNewExpansion( expansion );
+			}
 			#endif
 		}
 	}
@@ -1006,8 +1010,10 @@ void FsmGraph::findCondExpansions( ExpansionList &expansionList,
 
 			if ( srcOnlyCS.length() > 0 ) {
 				#ifdef COLM_LOG_CONDS
-				cerr << "there are " << srcOnlyCS.length() << " item(s) that are "
-							"only in the srcCS" << endl;
+				if ( colm_log_conds ) {
+					cerr << "there are " << srcOnlyCS.length() << " item(s) that are "
+								"only in the srcCS" << endl;
+				}
 				#endif
 
 				CondSet mergedCS = destCS;
@@ -1311,7 +1317,9 @@ void FsmGraph::findEmbedExpansions( ExpansionList &expansionList,
 					expansion->toCondSpace = newStateCond->condSpace;
 					expansion->toValsList.append( 1 );
 					#ifdef COLM_LOG_CONDS
-					logNewExpansion( expansion );
+					if ( colm_log_conds ) {
+						logNewExpansion( expansion );
+					}
 					#endif
 					expansionList.append( expansion );
 				}
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index df4b26d7..f7602d2f 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -71,7 +71,9 @@ void FsmRun::undoStreamPush( long length )
 void FsmRun::streamPush( const char *data, long length )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "readying fake push" << endl;
+	if ( colm_log_parse ) {
+		cerr << "readying fake push" << endl;
+	}
 	#endif
 
 	if ( p == runBuf->buf ) {
@@ -142,7 +144,9 @@ void undo_position( FsmRun *fsmRun, const char *data, long length )
 void FsmRun::sendBackText( const char *data, long length )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "push back of " << length << " characters" << endl;
+	if ( colm_log_parse ) {
+		cerr << "push back of " << length << " characters" << endl;
+	}
 	#endif
 
 	if ( length == 0 )
@@ -150,7 +154,9 @@ void FsmRun::sendBackText( const char *data, long length )
 
 	if ( p == runBuf->buf ) {
 		#ifdef COLM_LOG_PARSE
-		cerr << "pushing back runbuf" << endl;
+		if ( colm_log_parse ) {
+			cerr << "pushing back runbuf" << endl;
+		}
 		#endif
 
 		/* Move to the next run buffer. */
@@ -175,8 +181,10 @@ void FsmRun::sendBackText( const char *data, long length )
 	p -= length;
 
 	#ifdef COLM_LOG_PARSE
-	if ( memcmp( data, p, length ) != 0 )
-		cerr << "mismatch of pushed back text" << endl;
+	if ( colm_log_parse ) {
+		if ( memcmp( data, p, length ) != 0 )
+			cerr << "mismatch of pushed back text" << endl;
+	}
 	#endif
 
 	assert( memcmp( data, p, length ) == 0 );
@@ -191,8 +199,10 @@ void FsmRun::queueBack( Kid *input )
 {
 	if ( input->tree->flags & AF_GROUP_MEM ) {
 		#ifdef COLM_LOG_PARSE
-		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-		cerr << "queuing back: " << lelInfo[input->tree->id].name << endl;
+		if ( colm_log_parse ) {
+			LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+			cerr << "queuing back: " << lelInfo[input->tree->id].name << endl;
+		}
 		#endif
 
 		if ( parser->queue == 0 )
@@ -235,11 +245,13 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 	/* Ignore tokens are queued in reverse order. */
 	while ( tree_is_ignore( prg, ignore ) ) {
 		#ifdef COLM_LOG_PARSE
-		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-		cerr << "sending back: " << lelInfo[ignore->tree->id].name;
-		if ( ignore->tree->flags & AF_ARTIFICIAL )
-			cerr << " (artificial)";
-		cerr << endl;
+		if ( colm_log_parse ) {
+			LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+			cerr << "sending back: " << lelInfo[ignore->tree->id].name;
+			if ( ignore->tree->flags & AF_ARTIFICIAL )
+				cerr << " (artificial)";
+			cerr << endl;
+		}
 		#endif
 
 		Head *head = ignore->tree->tokdata;
@@ -265,11 +277,13 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 void FsmRun::sendBack( Kid *input )
 {
 	#ifdef COLM_LOG_PARSE
-	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-	cerr << "sending back: " << lelInfo[input->tree->id].name;
-	if ( input->tree->flags & AF_ARTIFICIAL )
-		cerr << " (artificial)";
-	cerr << endl;
+	if ( colm_log_parse ) {
+		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+		cerr << "sending back: " << lelInfo[input->tree->id].name;
+		if ( input->tree->flags & AF_ARTIFICIAL )
+			cerr << " (artificial)";
+		cerr << endl;
+	}
 	#endif
 
 	if ( input->tree->flags & AF_NAMED ) {
@@ -324,7 +338,9 @@ void add_notoken( Program *prg, PdaRun *parser )
 	/* Check if there was anything generated. */
 	if ( parser->queue == 0 && parser->reverseCode.length() > 0 ) {
 		#ifdef COLM_LOG_PARSE
-		cerr << "found reverse code but no token, sending _notoken" << endl;
+		if ( colm_log_parse ) {
+			cerr << "found reverse code but no token, sending _notoken" << endl;
+		}
 		#endif
 
 		Tree *tree = (Tree*)prg->parseTreePool.allocate();
@@ -371,8 +387,10 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 		send->next = 0;
 		if ( lelInfo[send->tree->id].ignore ) {
 			#ifdef COLM_LOG_PARSE
-			cerr << "ignoring queued item: " << 
-					parser->tables->rtd->lelInfo[send->tree->id].name << endl;
+			if ( colm_log_parse ) {
+				cerr << "ignoring queued item: " << 
+						parser->tables->rtd->lelInfo[send->tree->id].name << endl;
+			}
 			#endif
 			
 			parser->ignore( send->tree );
@@ -380,8 +398,10 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 		}
 		else {
 			#ifdef COLM_LOG_PARSE
-			cerr << "sending queue item: " << 
-					parser->tables->rtd->lelInfo[send->tree->id].name << endl;
+			if ( colm_log_parse ) {
+				cerr << "sending queue item: " << 
+						parser->tables->rtd->lelInfo[send->tree->id].name << endl;
+			}
 			#endif
 
 			send_handle_error( fsmRun, parser, send );
@@ -392,7 +412,9 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 void FsmRun::sendToken( long id )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "token: " << parser->tables->rtd->lelInfo[id].name << endl;
+	if ( colm_log_parse ) {
+		cerr << "token: " << parser->tables->rtd->lelInfo[id].name << endl;
+	}
 	#endif
 
 	bool ctxDepParsing = prg->ctxDepParsing;
@@ -435,7 +457,9 @@ void FsmRun::sendNamedLangEl()
 		klangEl = klangEl->termDup;
 	
 	#ifdef COLM_LOG_PARSE
-	cerr << "named langEl: " << parser->tables->rtd->lelInfo[klangEl->id].name << endl;
+	if ( colm_log_parse ) {
+		cerr << "named langEl: " << parser->tables->rtd->lelInfo[klangEl->id].name << endl;
+	}
 	#endif
 
 	/* Copy the token data. */
@@ -476,8 +500,10 @@ void execute_generation_action( Program *prg, PdaRun *parser, Code *code, Head *
 void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bindId )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "generation action: " << 
-			parser->tables->rtd->lelInfo[id].name << endl;
+	if ( colm_log_parse ) {
+		cerr << "generation action: " << 
+				parser->tables->rtd->lelInfo[id].name << endl;
+	}
 	#endif
 
 	/* Find the code. */
@@ -588,7 +614,9 @@ void send_handle_error( FsmRun *fsmRun, PdaRun *parser, Kid *input )
 
 		if ( parser->isParserStopFinished() ) {
 			#ifdef COLM_LOG_PARSE
-			cerr << "stopping the parse" << endl;
+			if ( colm_log_parse ) {
+				cerr << "stopping the parse" << endl;
+			}
 			#endif
 			fsmRun->cs = fsmRun->tables->errorState;
 			parser->stopParsing = true;
@@ -596,8 +624,10 @@ void send_handle_error( FsmRun *fsmRun, PdaRun *parser, Kid *input )
 	}
 
 	#ifdef COLM_LOG_PARSE
-	cerr << "new token region: " << 
-			parser->tables->rtd->regionInfo[fsmRun->region].name << endl;
+	if ( colm_log_parse ) {
+		cerr << "new token region: " << 
+				parser->tables->rtd->regionInfo[fsmRun->region].name << endl;
+	}
 	#endif
 }
 
@@ -615,7 +645,9 @@ void PdaRun::ignore( Tree *tree )
 void FsmRun::sendIgnore( long id )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "ignoring: " << parser->tables->rtd->lelInfo[id].name << endl;
+	if ( colm_log_parse ) {
+		cerr << "ignoring: " << parser->tables->rtd->lelInfo[id].name << endl;
+	}
 	#endif
 
 	/* Make the ignore string. */
@@ -682,7 +714,9 @@ Head *FsmRun::extractToken( long length )
 void FsmRun::sendEOF( )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "token: _EOF" << endl;
+	if ( colm_log_parse ) {
+		cerr << "token: _EOF" << endl;
+	}
 	#endif
 
 	Kid *input = prg->kidPool.allocate();
@@ -696,7 +730,9 @@ void FsmRun::sendEOF( )
 	long frameId = parser->tables->rtd->regionInfo[region].eofFrameId;
 	if ( ctxDepParsing && frameId >= 0 ) {
 		#ifdef COLM_LOG_PARSE
-		cerr << "HAVE PRE_EOF BLOCK" << endl;
+		if ( colm_log_parse ) {
+			cerr << "HAVE PRE_EOF BLOCK" << endl;
+		}
 		#endif
 
 		/* Get the code for the pre-eof block. */
@@ -826,7 +862,9 @@ long FsmRun::run( PdaRun *destParser )
 
 		if ( cs == tables->errorState && parser->stopParsing ) {
 			#ifdef COLM_LOG_PARSE
-			cerr << "scanner has been stopped" << endl;
+			if ( colm_log_parse ) {
+				cerr << "scanner has been stopped" << endl;
+			}
 			#endif
 			goto done;
 		}
@@ -848,7 +886,9 @@ long FsmRun::run( PdaRun *destParser )
 
 			if ( parser->getNextRegion( 1 ) != 0 ) {
 				#ifdef COLM_LOG_PARSE
-				cerr << "scanner failed, trying next region" << endl;
+				if ( colm_log_parse ) {
+					cerr << "scanner failed, trying next region" << endl;
+				}
 				#endif
 
 				/* May have accumulated ignore tokens from a previous region.
@@ -860,8 +900,10 @@ long FsmRun::run( PdaRun *destParser )
 				region = parser->getNextRegion();
 				cs = tables->entryByRegion[region];
 				#ifdef COLM_LOG_PARSE
-				cerr << "new token region: " << 
-						parser->tables->rtd->regionInfo[region].name << endl;
+				if ( colm_log_parse ) {
+					cerr << "new token region: " << 
+							parser->tables->rtd->regionInfo[region].name << endl;
+				}
 				#endif
 				continue;
 			}
@@ -869,7 +911,9 @@ long FsmRun::run( PdaRun *destParser )
 			if ( parser->numRetry > 0 ) {
 				/* Invoke the parser's error handling. */
 				#ifdef COLM_LOG_PARSE
-				cerr << "invoking parse error from the scanner" << endl;
+				if ( colm_log_parse ) {
+					cerr << "invoking parse error from the scanner" << endl;
+				}
 				#endif
 
 				parser->sendBackIgnore();
@@ -883,8 +927,10 @@ long FsmRun::run( PdaRun *destParser )
 					region = parser->getNextRegion();
 					cs = tables->entryByRegion[region];
 					#ifdef COLM_LOG_PARSE
-					cerr << "new token region: " << 
-							parser->tables->rtd->regionInfo[region].name << endl;
+					if ( colm_log_parse ) {
+						cerr << "new token region: " << 
+								parser->tables->rtd->regionInfo[region].name << endl;
+					}
 					#endif
 					continue;
 				}
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 728bdd76..ef34d20f 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -40,9 +40,9 @@ include "lmparse.kh";
 
 start: root_item_list
 	final {
-		#ifdef COLM_LOG_COMPILE
-		cerr << "parsing complete" << endl;
-		#endif
+		if ( colm_log_compile ) {
+			cerr << "parsing complete" << endl;
+		}
 
 		pd->rootCodeBlock = new CodeBlock( $1->stmtList );
 	};
diff --git a/colm/main.cpp b/colm/main.cpp
index 8b8ac853..3c50e882 100644
--- a/colm/main.cpp
+++ b/colm/main.cpp
@@ -232,9 +232,9 @@ void openOutput( )
 		}
 	}
 
-	#ifdef COLM_LOG_COMPILE
-	cerr << "opening output file: " << outputFileName << endl;
-	#endif
+	if ( colm_log_compile ) {
+		cerr << "opening output file: " << outputFileName << endl;
+	}
 
 	/* Make sure we are not writing to the same file as the input file. */
 	if ( outputFileName != 0 && strcmp( inputFileName, outputFileName  ) == 0 ) {
@@ -291,9 +291,9 @@ void compileOutput( const char *argv0 )
 		" %s"
 		" %s/../colm/runtime.a",
 		location, location, location, exec, outputFileName, location );
-	#ifdef COLM_LOG_COMPILE
-	cout << "compiling: " << outputFileName << endl;
-	#endif
+	if ( colm_log_compile ) {
+		cout << "compiling: " << outputFileName << endl;
+	}
 	int res = system( command );
 	if ( res != 0 )
 		cout << "there was a problem compiling the output" << endl;
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 7b54c7c2..1ed0403d 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1642,9 +1642,11 @@ void ParseData::parsePatterns()
 				repl->langEl->pdaTables, &fsmRun, 0, false );
 		repl->pdaRun->run();
 
-		//#ifdef COLM_LOG_COMPILE
-		//xml_print_list( runtimeData, repl->pdaRun->stackTop, 0 );
-		//#endif
+			//#ifdef COLM_LOG_COMPILE
+			//if ( colm_log_compile ) {
+			//xml_print_list( runtimeData, repl->pdaRun->stackTop, 0 );
+			//}
+			//#endif
 	}
 
 	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
@@ -1656,9 +1658,11 @@ void ParseData::parsePatterns()
 				pat->langEl->pdaTables, &fsmRun, 0, false );
 		pat->pdaRun->run();
 
-		//#ifdef COLM_LOG_COMPILE
-		//xml_print_list( runtimeData, pat->pdaRun->stackTop, 0 );
-		//#endif
+			//#ifdef COLM_LOG_COMPILE
+			//if ( colm_log_compile ) {
+			//xml_print_list( runtimeData, pat->pdaRun->stackTop, 0 );
+			//}
+			//#endif
 	}
 
 	fillInPatterns( &program );
@@ -1731,10 +1735,10 @@ void ParseData::semanticAnalysis()
 
 	FsmGraph *fsmGraph = makeScanner();
 
-	#ifdef COLM_LOG_COMPILE
-	printNameTree( fsmGraph->rootName );
-	printNameIndex( fsmGraph->nameIndex );
-	#endif
+	if ( colm_log_compile ) {
+		printNameTree( fsmGraph->rootName );
+		printNameIndex( fsmGraph->nameIndex );
+	}
 
 	prepGrammar();
 
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 1e21335a..2c370644 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -657,15 +657,15 @@ void ParseData::pdaActionOrder( PdaGraph *pdaGraph, KlangEl *rootEl )
 		}
 	}
 
-	#ifdef COLM_LOG_COMPILE
-	/* Warn about states with empty token region lists. */
-	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
-		if ( state->regions.length() == 0 ) {
-			warning() << "state has an empty token region, state: " << 
-				state->stateNum << endl;
+	if ( colm_log_compile ) {
+		/* Warn about states with empty token region lists. */
+		for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+			if ( state->regions.length() == 0 ) {
+				warning() << "state has an empty token region, state: " << 
+					state->stateNum << endl;
+			}
 		}
 	}
-	#endif
 
 	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
 		assert( CmpDotSet::compare( state->dotSet, state->dotSet2 ) == 0 );
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 766910c2..fd52668b 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -159,8 +159,10 @@ void commit_kid( PdaRun *parser, Tree **root, Kid *lel, Code *&rcode, long &caus
 head:
 	/* Commit */
 	#ifdef COLM_LOG_PARSE
-	cerr << "commit: visiting " << 
-			parser->prg->rtd->lelInfo[lel->tree->id].name << endl;
+	if ( colm_log_parse ) {
+		cerr << "commit: visiting " << 
+				parser->prg->rtd->lelInfo[lel->tree->id].name << endl;
+	}
 	#endif
 
 	/* Load up the parsed tree. */
@@ -175,8 +177,10 @@ head:
 		if ( pt(tree)->causeReduce > 0 ) {
 			/* The top reduce block does not correspond to this alg. */
 			#ifdef COLM_LOG_PARSE
-			cerr << "commit: causeReduce found, delaying backup: " << 
-					(long)pt(tree)->causeReduce << endl;
+			if ( colm_log_parse ) {
+				cerr << "commit: causeReduce found, delaying backup: " << 
+						(long)pt(tree)->causeReduce << endl;
+			}
 			#endif
 			causeReduce = pt(tree)->causeReduce;
 		}
@@ -209,7 +213,9 @@ head:
 
 		if ( causeReduce == 0 ) {
 			#ifdef COLM_LOG_PARSE
-			cerr << "commit: causeReduce dropped to zero, backing up over rcode" << endl;
+			if ( colm_log_parse ) {
+				cerr << "commit: causeReduce dropped to zero, backing up over rcode" << endl;
+			}
 			#endif
 
 			/* Cause reduce just dropped down to zero. */
@@ -266,7 +272,9 @@ backup:
 void commit_full( PdaRun *parser, long causeReduce )
 {
 	#ifdef COLM_LOG_PARSE
-	cerr << "running full commit" << endl;
+	if ( colm_log_parse ) {
+		cerr << "running full commit" << endl;
+	}
 	#endif
 	
 	Tree **sp = parser->root;
@@ -336,7 +344,9 @@ again:
 
 	if ( *action & act_sb ) {
 		#ifdef COLM_LOG_PARSE
-		cerr << "shifted: " << tables->rtd->lelInfo[pt(lel->tree)->id].name;
+		if ( colm_log_parse ) {
+			cerr << "shifted: " << tables->rtd->lelInfo[pt(lel->tree)->id].name;
+		}
 		#endif
 		input = input->next;
 		pt(lel->tree)->state = cs;
@@ -358,11 +368,15 @@ again:
 			assert( pt(lel->tree)->retry_upper == 0 );
 			numRetry += 1; /* FIXME: Has the retry already been counted? */
 			#ifdef COLM_LOG_PARSE
-			cerr << " retry: " << stackTop;
+			if ( colm_log_parse ) {
+				cerr << " retry: " << stackTop;
+			}
 			#endif
 		}
 		#ifdef COLM_LOG_PARSE
-		cerr << endl;
+		if ( colm_log_parse ) {
+			cerr << endl;
+		}
 		#endif
 	}
 
@@ -411,9 +425,11 @@ again:
 		redLel->tree->child = kid_list_concat( attrs, child );
 
 		#ifdef COLM_LOG_PARSE
-		cerr << "reduced: "
-				<< tables->rtd->prodInfo[reduction].name
-				<< " rhsLen: " << rhsLen;
+		if ( colm_log_parse ) {
+			cerr << "reduced: "
+					<< tables->rtd->prodInfo[reduction].name
+					<< " rhsLen: " << rhsLen;
+		}
 		#endif
 		if ( action[1] == 0 )
 			pt(redLel->tree)->retry_upper = 0;
@@ -422,12 +438,16 @@ again:
 			assert( pt(lel->tree)->retry_lower == 0 );
 			numRetry += 1;
 			#ifdef COLM_LOG_PARSE
-			cerr << " retry: " << redLel;
+			if ( colm_log_parse ) {
+				cerr << " retry: " << redLel;
+			}
 			#endif
 		}
 
 		#ifdef COLM_LOG_PARSE
-		cerr << endl;
+		if ( colm_log_parse ) {
+			cerr << endl;
+		}
 		#endif
 
 		/* When the production is of zero length we stay in the same state.
@@ -457,7 +477,9 @@ again:
 			 * copy above. */
 			if ( execution.parsed != 0 && execution.parsed != redLel->tree ) {
 				#ifdef COLM_LOG_PARSE
-				cerr << "lhs tree was modified, adding a restore instruction" << endl;
+				if ( colm_log_parse ) {
+					cerr << "lhs tree was modified, adding a restore instruction" << endl;
+				}
 				#endif
 
 				reverseCode.append( IN_RESTORE_LHS );
@@ -487,8 +509,10 @@ again:
 
 		if ( induceReject ) {
 			#ifdef COLM_LOG_PARSE
-			cerr << "error induced during reduction of " <<
-					tables->rtd->lelInfo[redLel->tree->id].name << endl;
+			if ( colm_log_parse ) {
+				cerr << "error induced during reduction of " <<
+						tables->rtd->lelInfo[redLel->tree->id].name << endl;
+			}
 			#endif
 			pt(redLel->tree)->state = cs;
 			redLel->next = stackTop;
@@ -508,7 +532,9 @@ again:
 
 parseError:
 	#ifdef COLM_LOG_PARSE
-	cerr << "hit error, backtracking" << endl;
+	if ( colm_log_parse ) {
+		cerr << "hit error, backtracking" << endl;
+	}
 	#endif
 
 	if ( numRetry == 0 )
@@ -520,11 +546,15 @@ parseError:
 
 			if ( pt(input->tree)->retry_lower != 0 ) {
 				#ifdef COLM_LOG_PARSE
-				cerr << "found retry targ: " << input << endl;
+				if ( colm_log_parse ) {
+					cerr << "found retry targ: " << input << endl;
+				}
 				#endif
 				numRetry -= 1;
 				#ifdef COLM_LOG_PARSE
-				cerr << "found retry: " << input << endl;
+				if ( colm_log_parse ) {
+					cerr << "found retry: " << input << endl;
+				}
 				#endif
 
 				cs = pt(input->tree)->state;
@@ -540,7 +570,9 @@ parseError:
 				input = 0;
 				if ( tables->tokenRegions[next] != 0 ) {
 					#ifdef COLM_LOG_PARSE
-					cerr << "found a new region" << endl;
+					if ( colm_log_parse ) {
+						cerr << "found a new region" << endl;
+					}
 					#endif
 					numRetry -= 1;
 					cs = stackTopTarget();
@@ -567,8 +599,10 @@ parseError:
 				(stackTop->tree->flags & AF_TERM_DUP) )
 		{
 			#ifdef COLM_LOG_PARSE
-			cerr << "backing up over effective terminal: " <<
-					tables->rtd->lelInfo[stackTop->tree->id].name << endl;
+			if ( colm_log_parse ) {
+				cerr << "backing up over effective terminal: " <<
+						tables->rtd->lelInfo[stackTop->tree->id].name << endl;
+			}
 			#endif
 
 			/* Pop the item from the stack. */
@@ -586,8 +620,10 @@ parseError:
 		}
 		else {
 			#ifdef COLM_LOG_PARSE
-			cerr << "backing up over non-terminal: " <<
-					tables->rtd->lelInfo[stackTop->tree->id].name << endl;
+			if ( colm_log_parse ) {
+				cerr << "backing up over non-terminal: " <<
+						tables->rtd->lelInfo[stackTop->tree->id].name << endl;
+			}
 			#endif
 
 			/* Check for an execution environment. */
diff --git a/colm/tree.cpp b/colm/tree.cpp
index e79e569d..d41b4fbf 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -677,8 +677,10 @@ Tree *copy_real_tree( Program *prg, Tree *tree, Kid *oldNextDown,
 List *copy_list( Program *prg, List *list, Kid *oldNextDown, Kid *&newNextDown )
 {
 	#ifdef COLM_LOG_BYTECODE
-	cerr << "splitting list: " << list << " refs: " << 
-			list->refs << endl;
+	if ( colm_log_bytecode ) {
+		cerr << "splitting list: " << list << " refs: " << 
+				list->refs << endl;
+	}
 	#endif
 
 	/* Not a need copy. */
@@ -707,8 +709,10 @@ List *copy_list( Program *prg, List *list, Kid *oldNextDown, Kid *&newNextDown )
 Map *copy_map( Program *prg, Map *map, Kid *oldNextDown, Kid *&newNextDown )
 {
 	#ifdef COLM_LOG_BYTECODE
-	cerr << "splitting map: " << map << " refs: " << 
-			map->refs << endl;
+	if ( colm_log_bytecode ) {
+		cerr << "splitting map: " << map << " refs: " << 
+				map->refs << endl;
+	}
 	#endif
 
 	Map *newMap = (Map*)prg->mapElPool.allocate();
@@ -767,8 +771,10 @@ Tree *split_tree( Program *prg, Tree *tree )
 
 		if ( tree->refs > 1 ) {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "splitting tree: " << tree << " refs: " << 
-					tree->refs << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "splitting tree: " << tree << " refs: " << 
+						tree->refs << endl;
+			}
 			#endif
 
 			Kid *oldNextDown = 0, *newNextDown = 0;
@@ -1388,8 +1394,10 @@ void split_ref( Tree **&sp, Program *prg, Ref *fromRef )
 	while ( ref != 0 ) {
 		if ( ref->kid->tree->refs > 1 ) {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "splitting tree: " << ref->kid << " refs: " << 
-					ref->kid->tree->refs << endl;
+			if ( colm_log_bytecode ) {
+				cerr << "splitting tree: " << ref->kid << " refs: " << 
+						ref->kid->tree->refs << endl;
+			}
 			#endif
 
 			Ref *nextDown = ref->next;
@@ -1509,9 +1517,11 @@ bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool chec
 	PatReplNode *nodes = prg->rtd->patReplNodes;
 
 	#ifdef COLM_LOG_MATCH
-	LangElInfo *lelInfo = prg->rtd->lelInfo;
-	cerr << "match_pattern " << ( pat == -1 ? "NULL" : lelInfo[nodes[pat].id].name ) <<
-			" vs " << ( kid == 0 ? "NULL" : lelInfo[kid->tree->id].name ) << endl;
+	if ( colm_log_match ) {
+		LangElInfo *lelInfo = prg->rtd->lelInfo;
+		cerr << "match_pattern " << ( pat == -1 ? "NULL" : lelInfo[nodes[pat].id].name ) <<
+				" vs " << ( kid == 0 ? "NULL" : lelInfo[kid->tree->id].name ) << endl;
+	}
 	#endif
 
 	/* match node, recurse on children. */
@@ -1533,7 +1543,9 @@ bool match_pattern( Tree **bindings, Program *prg, long pat, Kid *kid, bool chec
 			/* No failure, all okay. */
 			if ( nodes[pat].bindId > 0 ) {
 				#ifdef COLM_LOG_MATCH
-				cerr << "bindId: " << nodes[pat].bindId << endl;
+				if ( colm_log_match ) {
+					cerr << "bindId: " << nodes[pat].bindId << endl;
+				}
 				#endif
 				bindings[nodes[pat].bindId] = kid->tree;
 			}
-- 
cgit v1.2.1


From bf06f1c0f5b3d0fd0e039d36b610272965dc4c60 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 7 Feb 2009 19:12:35 +0000
Subject: Colm logging and target logging are now turned on with -v and -l. No
 need to reconfigure and recompile colm.

---
 colm/Makefile.in    | 43 +++++++++++++++++++++++++++++-------------
 colm/bytecode.cpp   | 10 +++++-----
 colm/bytecode.h     |  3 ++-
 colm/colm.h         |  1 +
 colm/fsmcodegen.cpp |  7 +++++++
 colm/main.cpp       | 30 +++++++++++++++++++++--------
 configure           | 54 +++++------------------------------------------------
 configure.in        | 14 +++++---------
 8 files changed, 77 insertions(+), 85 deletions(-)

diff --git a/colm/Makefile.in b/colm/Makefile.in
index 435dd3eb..131bd771 100644
--- a/colm/Makefile.in
+++ b/colm/Makefile.in
@@ -26,7 +26,10 @@
 # rt_clm: rt on/off
 
 INCS += -I../aapl
-DEFS +=
+
+DEFS_COLM += -DCOLM_LOG
+DEFS_RT_P +=
+DEFS_RT_D += -DCOLM_LOG
 
 CFLAGS += -g -Wall -Wwrite-strings
 LDFLAGS +=
@@ -64,7 +67,8 @@ ALL_SRC = $(COLM_SRC) $(RUNTIME_SRC)
 # Files in ALL_SRC that are generated.
 GEN_SRC = version.h lmscan.cpp lmparse.h lmparse.cpp 
 
-RUNTIME = runtime.a
+RUNTIME_P = runtime_p.a
+RUNTIME_D = runtime_d.a
 
 LIBS = 
 
@@ -82,18 +86,22 @@ CXX = @CXX@
 
 # Get objects and dependencies from sources.
 COLM_OBJ = $(COLM_SRC:%.cpp=%.o)
-RUNTIME_OBJ = $(RUNTIME_SRC:%.cpp=%.o)
+RUNTIME_OBJ_P = $(RUNTIME_SRC:%.cpp=%_p.o)
+RUNTIME_OBJ_D = $(RUNTIME_SRC:%.cpp=%_d.o)
 
-DEPS = $(CC_SRCS:%.cpp=.%.d)
+DEPS = $(COLM_SRC:%.cpp=.%.d) $(RUNTIME_SRC:%.cpp=.%_p.d) $(RUNTIME_SRC:%.cpp=.%_d.d)
 
 # Rules.
-all: colm $(RUNTIME)
+all: colm $(RUNTIME_P) $(RUNTIME_D)
+
+colm: $(GEN_SRC) $(COLM_OBJ) $(RUNTIME_OBJ_D) $(LIBS)
+	$(CXX) $(LDFLAGS) -o $@ $(COLM_OBJ) $(RUNTIME_OBJ_D) $(LIBS)
 
-colm: $(GEN_SRC) $(COLM_OBJ) $(RUNTIME_OBJ) $(LIBS)
-	$(CXX) $(LDFLAGS) -o $@ $(COLM_OBJ) $(RUNTIME_OBJ) $(LIBS)
+$(RUNTIME_P): $(RUNTIME_OBJ_P)
+	ar -cr $@ $^
 
-$(RUNTIME): $(RUNTIME_OBJ)
-	ar -cr $@ $(RUNTIME_OBJ)
+$(RUNTIME_D): $(RUNTIME_OBJ_D)
+	ar -cr $@ $^
 
 version.h: ../version.mk
 	echo '#define VERSION "$(VERSION)"' > version.h
@@ -114,9 +122,18 @@ lmscan.cpp: lmscan.rl
 
 endif
 
-%.o: %.cpp
-	@$(CXX) -M $(DEFS) $(INCS) $< > .$*.d
-	$(CXX) -c $(CFLAGS) $(DEFS) $(INCS) -o $@ $<
+$(COLM_OBJ): %.o: %.cpp
+	@$(CXX) -M $(DEFS_COLM) $(INCS) $< > .$*.d
+	$(CXX) -c $(CFLAGS) $(DEFS_COLM) $(INCS) -o $@ $<
+
+$(RUNTIME_OBJ_P): %_p.o: %.cpp
+	@$(CXX) -M -MT $@ $(DEFS_RT_P) $(INCS) $< > .$*_p.d
+	$(CXX) -c $(CFLAGS) $(DEFS_RT_P) $(INCS) -o $@ $<
+
+$(RUNTIME_OBJ_D): %_d.o: %.cpp
+	@$(CXX) -M -MT $@ $(DEFS_RT_D) $(INCS) $< > .$*_d.d
+	$(CXX) -c $(CFLAGS) $(DEFS_RT_D) $(INCS) -o $@ $<
+
 
 distclean: clean
 	rm -f Makefile config.h
@@ -126,7 +143,7 @@ EXTRA_CLEAN = $(GEN_SRC)
 endif
 
 clean:
-	rm -f tags .*.d *.o colm $(EXTRA_CLEAN) $(RUNTIME)
+	rm -f tags .*.d *.o colm $(EXTRA_CLEAN) $(RUNTIME_P) $(RUNTIME_D)
 
 install: all
 	install -d $(PREFIX)/bin
diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 25d4d38b..787fa353 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -77,11 +77,11 @@ using std::endl;
 	i |= ((Word) *instr++) << 8; \
 } while(0)
 
-int colm_log_bytecode = 1;
-int colm_log_parse = 1;
-int colm_log_match = 1;
-int colm_log_compile = 1;
-int colm_log_conds = 1;
+int colm_log_bytecode = 0;
+int colm_log_parse = 0;
+int colm_log_match = 0;
+int colm_log_compile = 0;
+int colm_log_conds = 0;
 
 Tree *prep_parse_tree( Program *prg, Tree **sp, Tree *tree )
 {
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 52e4d216..c13578a7 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -583,7 +583,8 @@ template <class T> T *PoolAlloc<T>::allocate()
 	if ( pool == 0 ) {
 		if ( nextel == FRESH_BLOCK ) {
 			#ifdef COLM_LOG_BYTECODE
-			cerr << "allocating " << FRESH_BLOCK << " Elements of type T" << endl;
+			if ( colm_log_bytecode )
+				cerr << "allocating " << FRESH_BLOCK << " Elements of type T" << endl;
 			#endif
 
 			PoolBlock<T> *newBlock = new PoolBlock<T>;
diff --git a/colm/colm.h b/colm/colm.h
index 6ae9fc68..b3a99e0d 100644
--- a/colm/colm.h
+++ b/colm/colm.h
@@ -47,6 +47,7 @@ extern const char *outputFileName;
 extern std::ostream *outStream;
 extern bool generateGraphviz;
 extern bool branchPointInfo;
+extern bool verbose, logging;
 extern bool addUniqueEmptyProductions;
 
 extern int gblErrorCount;
diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
index 94a2307e..29d840ee 100644
--- a/colm/fsmcodegen.cpp
+++ b/colm/fsmcodegen.cpp
@@ -1061,6 +1061,13 @@ void FsmCodeGen::writeCode()
 	out << 
 		"int main( int argc, char **argv )\n"
 		"{\n"
+		"	/* Always on because logging is controlled with ifdefs in\n"
+		"	 * the runtime lib. */\n"
+		"	colm_log_bytecode = 1;\n"
+		"	colm_log_parse = 1;\n"
+		"	colm_log_match = 1;\n"
+		"	colm_log_compile = 1;\n"
+		"	colm_log_conds = 1;\n"
 		"	Program program( true, &main_runtimeData );\n"
 		"	program.run();\n"
 		"	return 0;\n"
diff --git a/colm/main.cpp b/colm/main.cpp
index 3c50e882..db2336a5 100644
--- a/colm/main.cpp
+++ b/colm/main.cpp
@@ -73,6 +73,8 @@ const char *inputFileName = 0;
 const char *outputFileName = 0;
 
 bool generateGraphviz = false;
+bool verbose = false;
+bool logging = false;
 bool branchPointInfo = false;
 bool addUniqueEmptyProductions = false;
 
@@ -150,9 +152,11 @@ void usage()
 "usage: colm [options] file\n"
 "general:\n"
 "   -h, -H, -?, --help   print this usage and exit\n"
-"   -v, --version        print version information and exit\n"
+"   --version            print version information and exit\n"
 "   -o <file>            write output to <file>\n"
 "   -i                   show conflict information\n"
+"   -v                   make colm verbose\n"
+"   -l                   compile logging into the output executable\n"
 	;	
 }
 
@@ -289,8 +293,8 @@ void compileOutput( const char *argv0 )
 		" -g"
 		" -o %s"
 		" %s"
-		" %s/../colm/runtime.a",
-		location, location, location, exec, outputFileName, location );
+		" %s/../colm/runtime_%c.a",
+		location, location, location, exec, outputFileName, location, logging ? 'd' : 'p' );
 	if ( colm_log_compile ) {
 		cout << "compiling: " << outputFileName << endl;
 	}
@@ -301,12 +305,18 @@ void compileOutput( const char *argv0 )
 
 void process_args( int argc, const char **argv )
 {
-	ParamCheck pc( "io:S:M:vHh?-:s", argc, argv );
+	ParamCheck pc( "vlio:S:M:vHh?-:s", argc, argv );
 
 	while ( pc.check() ) {
 		switch ( pc.state ) {
 		case ParamCheck::match:
 			switch ( pc.parameter ) {
+			case 'v':
+				verbose = true;
+				break;
+			case 'l':
+				logging = true;
+				break;
 			case 'i':
 				branchPointInfo = true;
 				break;
@@ -322,10 +332,6 @@ void process_args( int argc, const char **argv )
 				}
 				break;
 
-			/* Version and help. */
-			case 'v':
-				version();
-				exit(0);
 			case 'H': case 'h': case '?':
 				usage();
 				exit(0);
@@ -372,6 +378,14 @@ int main(int argc, const char **argv)
 {
 	process_args( argc, argv );
 
+	if ( verbose ) {
+		colm_log_bytecode = 1;
+		colm_log_parse = 1;
+		colm_log_match = 1;
+		colm_log_compile = 1;
+		colm_log_conds = 1;
+	}
+
 	/* Bail on above errors. */
 	if ( gblErrorCount > 0 )
 		exit(1);
diff --git a/configure b/configure
index 0b75c81e..f08d8a02 100755
--- a/configure
+++ b/configure
@@ -1207,15 +1207,6 @@ if test -n "$ac_init_help"; then
 
   cat <<\_ACEOF
 
-Optional Features:
-  --disable-FEATURE       do not include FEATURE (same as --enable-FEATURE=no)
-  --enable-FEATURE[=ARG]  include FEATURE [ARG=yes]
-"turn on logging"
-"turns on bytecode logging"
-"turns on parse logging"
-"turns on match logging"
-"turns on compile logging"
-
 Some influential environment variables:
   CC          C compiler command
   CFLAGS      C compiler flags
@@ -2987,46 +2978,11 @@ fi
 
 
 # Logging features
-# Check whether --enable-log was given.
-if test "${enable_log+set}" = set; then
-  enableval=$enable_log; cat >>confdefs.h <<\_ACEOF
-#define COLM_LOG 1
-_ACEOF
-
-fi
-
-# Check whether --enable-log-bytecode was given.
-if test "${enable_log_bytecode+set}" = set; then
-  enableval=$enable_log_bytecode; cat >>confdefs.h <<\_ACEOF
-#define COLM_LOG_BYTECODE 1
-_ACEOF
-
-fi
-
-# Check whether --enable-log-parse was given.
-if test "${enable_log_parse+set}" = set; then
-  enableval=$enable_log_parse; cat >>confdefs.h <<\_ACEOF
-#define COLM_LOG_PARSE 1
-_ACEOF
-
-fi
-
-# Check whether --enable-log-match was given.
-if test "${enable_log_match+set}" = set; then
-  enableval=$enable_log_match; cat >>confdefs.h <<\_ACEOF
-#define COLM_LOG_MATCH 1
-_ACEOF
-
-fi
-
-# Check whether --enable-log-compile was given.
-if test "${enable_log_compile+set}" = set; then
-  enableval=$enable_log_compile; cat >>confdefs.h <<\_ACEOF
-#define COLM_LOG_COMPILE 1
-_ACEOF
-
-fi
-
+# AC_ARG_ENABLE(log, "turn on logging", AC_DEFINE(COLM_LOG))
+# AC_ARG_ENABLE(log-bytecode, "turns on bytecode logging", AC_DEFINE(COLM_LOG_BYTECODE))
+# AC_ARG_ENABLE(log-parse, "turns on parse logging", AC_DEFINE(COLM_LOG_PARSE))
+# AC_ARG_ENABLE(log-match, "turns on match logging", AC_DEFINE(COLM_LOG_MATCH))
+# AC_ARG_ENABLE(log-compile, "turns on compile logging", AC_DEFINE(COLM_LOG_COMPILE))
 
 if test $BUILD_PARSERS = true; then
 
diff --git a/configure.in b/configure.in
index e1d898c7..94fb7ba2 100644
--- a/configure.in
+++ b/configure.in
@@ -41,15 +41,11 @@ dnl Check for definition of MAKE.
 AC_PROG_MAKE_SET
 
 # Logging features
-AC_ARG_ENABLE(log, "turn on logging", AC_DEFINE(COLM_LOG))
-AC_ARG_ENABLE(log-bytecode, "turns on bytecode logging", 
-		AC_DEFINE(COLM_LOG_BYTECODE))
-AC_ARG_ENABLE(log-parse, "turns on parse logging", 
-		AC_DEFINE(COLM_LOG_PARSE))
-AC_ARG_ENABLE(log-match, "turns on match logging", 
-		AC_DEFINE(COLM_LOG_MATCH))
-AC_ARG_ENABLE(log-compile, "turns on compile logging", 
-		AC_DEFINE(COLM_LOG_COMPILE))
+# AC_ARG_ENABLE(log, "turn on logging", AC_DEFINE(COLM_LOG))
+# AC_ARG_ENABLE(log-bytecode, "turns on bytecode logging", AC_DEFINE(COLM_LOG_BYTECODE))
+# AC_ARG_ENABLE(log-parse, "turns on parse logging", AC_DEFINE(COLM_LOG_PARSE))
+# AC_ARG_ENABLE(log-match, "turns on match logging", AC_DEFINE(COLM_LOG_MATCH))
+# AC_ARG_ENABLE(log-compile, "turns on compile logging", AC_DEFINE(COLM_LOG_COMPILE))
 
 if test $BUILD_PARSERS = true; then
 
-- 
cgit v1.2.1


From 29a5bbb93eb3cccc042e2b0987d728ccd74488a1 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 7 Feb 2009 20:54:18 +0000
Subject: Can now install and run colm from the installed location.

---
 colm/Makefile.in | 21 +++++++++++++++------
 colm/main.cpp    | 11 +++++++----
 2 files changed, 22 insertions(+), 10 deletions(-)

diff --git a/colm/Makefile.in b/colm/Makefile.in
index 131bd771..9b247eae 100644
--- a/colm/Makefile.in
+++ b/colm/Makefile.in
@@ -27,7 +27,7 @@
 
 INCS += -I../aapl
 
-DEFS_COLM += -DCOLM_LOG
+DEFS_COLM += -DCOLM_LOG -DPREFIX='"$(prefix)"'
 DEFS_RT_P +=
 DEFS_RT_D += -DCOLM_LOG
 
@@ -67,8 +67,8 @@ ALL_SRC = $(COLM_SRC) $(RUNTIME_SRC)
 # Files in ALL_SRC that are generated.
 GEN_SRC = version.h lmscan.cpp lmparse.h lmparse.cpp 
 
-RUNTIME_P = runtime_p.a
-RUNTIME_D = runtime_d.a
+RUNTIME_P = libcolmp.a
+RUNTIME_D = libcolmd.a
 
 LIBS = 
 
@@ -77,7 +77,7 @@ LIBS =
 # Get the version info.
 include ../version.mk
 
-PREFIX = @prefix@
+prefix = @prefix@
 
 BUILD_PARSERS = @BUILD_PARSERS@
 
@@ -146,7 +146,16 @@ clean:
 	rm -f tags .*.d *.o colm $(EXTRA_CLEAN) $(RUNTIME_P) $(RUNTIME_D)
 
 install: all
-	install -d $(PREFIX)/bin
-	install -s colm $(PREFIX)/bin/colm
+	install -d $(prefix)/bin
+	install -d $(prefix)/include
+	install -d $(prefix)/include/colm
+	install -d $(prefix)/lib
+	install -s colm $(prefix)/bin/colm
+	install libcolmp.a libcolmd.a $(prefix)/lib
+	install ../aapl/astring.h ../aapl/avlcommon.h ../aapl/avlmap.h \
+		../aapl/compare.h ../aapl/dlcommon.h ../aapl/dlist.h \
+		../aapl/dlistval.h ../aapl/resize.h ../aapl/table.h \
+		../aapl/vector.h bytecode.h config.h fsmrun.h input.h \
+		pdarun.h $(prefix)/include/colm
 
 -include $(DEPS)
diff --git a/colm/main.cpp b/colm/main.cpp
index db2336a5..fd403313 100644
--- a/colm/main.cpp
+++ b/colm/main.cpp
@@ -287,14 +287,17 @@ void compileOutput( const char *argv0 )
 	char command[length];
 	sprintf( command, 
 		"g++ -Wall -Wwrite-strings"
+		" -I%s"
 		" -I%s/../aapl"
-		" -I%s/../colm"
-		" -I%s/../common"
+		" -I" PREFIX "/include/colm"
 		" -g"
 		" -o %s"
 		" %s"
-		" %s/../colm/runtime_%c.a",
-		location, location, location, exec, outputFileName, location, logging ? 'd' : 'p' );
+		" -L %s"
+		" -L " PREFIX "/lib"
+		" -lcolm%c",
+		location, location,
+		exec, outputFileName, location, logging ? 'd' : 'p' );
 	if ( colm_log_compile ) {
 		cout << "compiling: " << outputFileName << endl;
 	}
-- 
cgit v1.2.1


From ba86e1650f475034ef4ae4d03da4a5f17b81830b Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 8 Feb 2009 23:38:50 +0000
Subject: got graphviz output working

---
 colm/colm.h         |   4 +-
 colm/dotgen.cpp     | 310 +++++-----------------------------------------------
 colm/fsmcodegen.cpp |   1 -
 colm/main.cpp       |  29 +++--
 colm/parsedata.cpp  |  11 +-
 colm/parsedata.h    |  11 ++
 6 files changed, 62 insertions(+), 304 deletions(-)

diff --git a/colm/colm.h b/colm/colm.h
index b3a99e0d..721529bd 100644
--- a/colm/colm.h
+++ b/colm/colm.h
@@ -35,9 +35,7 @@
 #define PROGNAME "colm"
 
 /* IO filenames and stream. */
-extern bool printPrintables;
-extern bool graphvizDone;
-
+extern bool genGraphviz;
 extern int gblErrorCount;
 
 std::ostream &error();
diff --git a/colm/dotgen.cpp b/colm/dotgen.cpp
index fd8af6b8..2fd9bf09 100644
--- a/colm/dotgen.cpp
+++ b/colm/dotgen.cpp
@@ -20,272 +20,13 @@
  */
 
 
-#include "dotgen.h"
+#include "colm.h"
 #include "parsedata.h"
-#include "pdacodegen.h"
 
 using namespace std;
-#if 0
 
-std::ostream &GraphvizDotGen::KEY( Key key )
-{
-	if ( printPrintables && key.isPrintable() ) {
-		// Output values as characters, ensuring we escape the quote (") character
-		char cVal = (char) key.getVal();
-		out << "'";
-		switch ( cVal ) {
-			case '"': case '\\':
-				out << "\\" << cVal;
-				break;
-			default:	
-				out << cVal;
-				break;
-		}
-		out << "'";
-	}
-	else {
-		if ( keyOps->isSigned )
-			out << key.getVal();
-		else
-			out << (unsigned long) key.getVal();
-	}
-
-	return out;
-}
-
-std::ostream &GraphvizDotGen::TRANS_ACTION( RedState *fromState, RedTrans *trans )
-{
-	int n = 0;
-	RedAction *actions[3];
-
-	if ( fromState->fromStateAction != 0 )
-		actions[n++] = fromState->fromStateAction;
-	if ( trans->action != 0 )
-		actions[n++] = trans->action;
-	if ( trans->targ != 0 && trans->targ->toStateAction != 0 )
-		actions[n++] = trans->targ->toStateAction;
-
-	if ( n > 0 )
-		out << " / ";
-	
-	/* Loop the existing actions and write out what's there. */
-	for ( int a = 0; a < n; a++ ) {
-		for ( GenActionTable::Iter actIt = actions[a]->key.first(); actIt.lte(); actIt++ ) {
-			GenAction *action = actIt->value;
-			out << action->nameOrLoc();
-			if ( a < n-1 || !actIt.last() )
-				out << ", ";
-		}
-	}
-	return out;
-}
-
-std::ostream &GraphvizDotGen::ACTION( RedAction *action )
-{
-	/* The action. */
-	out << " / ";
-	for ( GenActionTable::Iter actIt = action->key.first(); actIt.lte(); actIt++ ) {
-		GenAction *action = actIt->value;
-		if ( action->name != 0 )
-			out << action->name;
-		else
-			out << action->loc.line << ":" << action->loc.col;
-		if ( !actIt.last() )
-			out << ", ";
-	}
-	return out;
-}
-
-std::ostream &GraphvizDotGen::ONCHAR( Key lowKey, Key highKey )
-{
-	if ( lowKey > keyOps->maxKey ) {
-		GenCondSpace *condSpace = redFsm->findCondSpace( lowKey, highKey );
-		Key values = ( lowKey - condSpace->baseKey ) / keyOps->alphSize();
-
-		lowKey = keyOps->minKey + 
-			(lowKey - condSpace->baseKey - keyOps->alphSize() * values.getVal());
-		highKey = keyOps->minKey + 
-			(highKey - condSpace->baseKey - keyOps->alphSize() * values.getVal());
-		KEY( lowKey );
-		if ( lowKey != highKey ) {
-			out << "..";
-			KEY( highKey );
-		}
-		out << "(";
-
-		for ( GenCondSet::Iter csi = condSpace->condSet; csi.lte(); csi++ ) {
-			bool set = values & (1 << csi.pos());
-			if ( !set )
-				out << "!";
-			out << (*csi)->nameOrLoc();
-			if ( !csi.last() )
-				out << ", ";
-		}
-		out << ")";
-	}
-	else {
-		/* Output the key. Possibly a range. */
-		KEY( lowKey );
-		if ( highKey != lowKey ) {
-			out << "..";
-			KEY( highKey );
-		}
-	}
-	return out;
-}
-
-void GraphvizDotGen::writeTransList( RedState *state )
-{
-	/* Build the set of unique transitions out of this state. */
-	RedTransPtrSet stTransSet;
-	for ( RedTransList::Iter tel = state->outRange; tel.lte(); tel++ ) {
-		/* If we haven't seen the transitions before, the move forward
-		 * emitting all the transitions on the same character. */
-		if ( stTransSet.insert( tel->value ) ) {
-			/* Write out the from and to states. */
-			out << "\t" << state->id << " -> ";
-
-			if ( tel->value->targ == 0 )
-				out << "err_" << state->id;
-			else
-				out << tel->value->targ->id;
-
-			/* Begin the label. */
-			out << " [ label = \""; 
-			ONCHAR( tel->lowKey, tel->highKey );
-
-			/* Walk the transition list, finding the same. */
-			for ( RedTransList::Iter mtel = tel.next(); mtel.lte(); mtel++ ) {
-				if ( mtel->value == tel->value ) {
-					out << ", ";
-					ONCHAR( mtel->lowKey, mtel->highKey );
-				}
-			}
-
-			/* Write the action and close the transition. */
-			TRANS_ACTION( state, tel->value );
-			out << "\" ];\n";
-		}
-	}
-
-	/* Write the default transition. */
-	if ( state->defTrans != 0 ) {
-		/* Write out the from and to states. */
-		out << "\t" << state->id << " -> ";
-
-		if ( state->defTrans->targ == 0 )
-			out << "err_" << state->id;
-		else
-			out << state->defTrans->targ->id;
-
-		/* Begin the label. */
-		out << " [ label = \"DEF"; 
-
-		/* Write the action and close the transition. */
-		TRANS_ACTION( state, state->defTrans );
-		out << "\" ];\n";
-	}
-}
 
-void GraphvizDotGen::writeDotFile( )
-{
-	out << 
-		"digraph " << fsmName << " {\n"
-		"	rankdir=LR;\n";
-	
-	/* Define the psuedo states. Transitions will be done after the states
-	 * have been defined as either final or not final. */
-	out << "	node [ shape = point ];\n";
-	out << "	ENTRY;\n";
-
-	/* Psuedo states for entry points in the entry map. */
-	for ( EntryIdVect::Iter en = redFsm->entryPointIds; en.lte(); en++ ) {
-		RedState *state = redFsm->allStates + *en;
-		out << "	en_" << state->id << ";\n";
-	}
-
-	/* Psuedo states for final states with eof actions. */
-	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
-		if ( st->eofAction != 0 )
-			out << "	eof_" << st->id << ";\n";
-	}
-
-	out << "	node [ shape = circle, height = 0.2 ];\n";
-
-	/* Psuedo states for states whose default actions go to error. */
-	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
-		bool needsErr = false;
-		if ( st->defTrans != 0 && st->defTrans->targ == 0 )
-			needsErr = true;
-		else {
-			for ( RedTransList::Iter tel = st->outRange; tel.lte(); tel++ ) {
-				if ( tel->value->targ == 0 ) {
-					needsErr = true;
-					break;
-				}
-			}
-		}
-
-		if ( needsErr )
-			out << "	err_" << st->id << " [ label=\"\"];\n";
-	}
-
-	/* Attributes common to all nodes, plus double circle for final states. */
-	out << "	node [ fixedsize = true, height = 0.65, shape = doublecircle ];\n";
-
-	/* List Final states. */
-	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
-		if ( st->isFinal )
-			out << "	" << st->id << ";\n";
-	}
-
-	/* List transitions. */
-	out << "	node [ shape = circle ];\n";
-
-	/* Walk the states. */
-	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ )
-		writeTransList( st );
-
-	/* Transitions into the start state. */
-	out << "	ENTRY -> " << redFsm->startState->id << " [ label = \"IN";
-	out << "\" ];\n";
-
-	/* Transitions into the entry points. */
-	for ( EntryIdVect::Iter en = redFsm->entryPointIds; en.lte(); en++ ) {
-		RedState *state = redFsm->allStates + *en;
-		char *name = redFsm->entryPointNames[en.pos()];
-		out << "	en_" << state->id << " -> " << state->id <<
-				" [ label = \"" << name << "\" ];\n";
-	}
-
-	/* Out action transitions. */
-	for ( RedStateList::Iter st = redFsm->stateList; st.lte(); st++ ) {
-		if ( st->eofAction != 0 ) {
-			out << "	" << st->id << " -> eof_" << 
-					st->id << " [ label = \"EOF"; 
-			ACTION( st->eofAction ) << "\" ];\n";
-		}
-	}
-
-	out <<
-		"}\n";
-}
-
-void GraphvizDotGen::finishRagelDef()
-{
-	if ( !graphvizDone ) {
-		graphvizDone = true;
-
-		/* For dot file generation we want to pick default transitions. */
-		redFsm->chooseDefaultSpan();
-
-		/* Write out with it. */
-		writeDotFile();
-	}
-}
-
-
-void PdaCodeGen::writeTransList( PdaState *state )
+void ParseData::writeTransList( PdaState *state )
 {
 	for ( TransMap::Iter trans = state->transMap; trans.lte(); trans++ ) {
 		/* Write out the from and to states. */
@@ -294,9 +35,9 @@ void PdaCodeGen::writeTransList( PdaState *state )
 		/* Begin the label. */
 		out << " [ label = \""; 
 		long key = trans->key;  
-		KlangEl *lel = pd->langElIndex[key];
+		KlangEl *lel = langElIndex[key];
 		if ( lel != 0 )
-			out << lel->data;
+			out << lel->name;
 		else
 			out << (char)key;
 
@@ -308,12 +49,12 @@ void PdaCodeGen::writeTransList( PdaState *state )
 					out << "S(" << trans->value->actOrds[act.pos()] << ")";
 					break;
 				case 2: {
-					out << "R(" << pd->prodIdIndex[(*act >> 2)]->data <<
+					out << "R(" << prodIdIndex[(*act >> 2)]->data <<
 							", " << trans->value->actOrds[act.pos()] << ")";
 					break;
 				}
 				case 3: {
-					out << "SR(" << pd->prodIdIndex[(*act >> 2)]->data << 
+					out << "SR(" << prodIdIndex[(*act >> 2)]->data << 
 							", " << trans->value->actOrds[act.pos()] << ")";
 					break;
 				}}
@@ -326,44 +67,45 @@ void PdaCodeGen::writeTransList( PdaState *state )
 	}
 }
 
-void PdaCodeGen::writeDotFile( PdaGraph *graph )
+void ParseData::writeDotFile( PdaGraph *graph )
 {
 	out << 
 		"digraph " << parserName << " {\n"
-		"	rankdir=LR;\n";
+		"	rankdir=LR;\n"
+		"	ranksep=\"0\"\n"
+		"	nodesep=\"0.25\"\n"
+		"\n";
 	
 	/* Define the psuedo states. Transitions will be done after the states
 	 * have been defined as either final or not final. */
-	out << "	node [ shape = point ];\n";
-	out << "	ENTRY;\n";
-
-	out << "	node [ shape = circle, height = 0.2 ];\n";
-
-	/* Attributes common to all nodes, plus double circle for final states. */
-	out << "	node [ fixedsize = true, height = 0.65, shape = doublecircle ];\n";
+	out << 
+		"	node [ shape = point ];\n"
+		"	ENTRY [ label = \"\" ];\n"
+		"\n"
+		"	node [ shape = circle, fixedsize = true, height = 0.2 ];\n";
 
-	/* List Final states. */
-	for ( PdaStateSet::Iter st = graph->finStateSet; st.lte(); st++ )
-		out << "	" << (*st)->stateNum << ";\n";
+	/* Walk the states. */
+	for ( PdaStateList::Iter st = graph->stateList; st.lte(); st++ )
+		out << "	" << st->stateNum << " [ label = \"\" ];\n";
 
-	/* List transitions. */
-	out << "	node [ shape = circle ];\n";
+	out << "\n";
 
 	/* Walk the states. */
 	for ( PdaStateList::Iter st = graph->stateList; st.lte(); st++ )
 		writeTransList( st );
 
 	/* Transitions into the start state. */
-	out << "	ENTRY -> " << graph->startState->stateNum << " [ label = \"START\" ];\n";
+	out << "	ENTRY -> " << graph->startState->stateNum << " [ label = \"\" ];\n";
 
 	out <<
 		"}\n";
 }
 
-void PdaCodeGen::writeDotFile( )
+void ParseData::writeDotFile()
 {
-	writeDotFile( pd->pdaGraph );
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->parserId >= 0 )
+			writeDotFile( lel->pdaGraph );
+	}
 }
 
-#endif
-
diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
index 29d840ee..e0eb3d9d 100644
--- a/colm/fsmcodegen.cpp
+++ b/colm/fsmcodegen.cpp
@@ -22,7 +22,6 @@
 #include "parsedata.h"
 #include "fsmcodegen.h"
 #include "redfsm.h"
-#include "dotgen.h"
 #include "bstmap.h"
 #include "fsmrun.h"
 #include <sstream>
diff --git a/colm/main.cpp b/colm/main.cpp
index fd403313..a6170f0d 100644
--- a/colm/main.cpp
+++ b/colm/main.cpp
@@ -37,7 +37,6 @@
 #include "vector.h"
 #include "version.h"
 #include "fsmcodegen.h"
-#include "dotgen.h"
 
 using std::istream;
 using std::ifstream;
@@ -49,9 +48,7 @@ using std::cerr;
 using std::endl;
 
 /* Graphviz dot file generation. */
-bool graphvizDone = false;
-
-bool printPrintables = false;
+bool genGraphviz = false;
 
 using std::ostream;
 using std::istream;
@@ -308,7 +305,7 @@ void compileOutput( const char *argv0 )
 
 void process_args( int argc, const char **argv )
 {
-	ParamCheck pc( "vlio:S:M:vHh?-:s", argc, argv );
+	ParamCheck pc( "vlio:S:M:vHh?-:sV", argc, argv );
 
 	while ( pc.check() ) {
 		switch ( pc.state ) {
@@ -341,6 +338,9 @@ void process_args( int argc, const char **argv )
 			case 's':
 				printStatistics = true;
 				break;
+			case 'V':
+				generateGraphviz = true;
+				break;
 			case '-':
 				if ( strcasecmp(pc.parameterArg, "help") == 0 ) {
 					usage();
@@ -429,10 +429,21 @@ int main(int argc, const char **argv)
 	/* Initiate a compile following a parse. */
 	scanner.parser->pd->semanticAnalysis();
 
-	if ( outStream != 0 )
-		delete outStream;
-
-	compileOutput( argv[0] );
+	/*
+	 * Write output.
+	 */
+	if ( generateGraphviz ) {
+		outStream = &cout;
+		scanner.parser->pd->writeDotFile();
+	}
+	else {
+		openOutput();
+		scanner.parser->pd->generateOutput();
+	
+		if ( outStream != 0 )
+			delete outStream;
 
+		compileOutput( argv[0] );
+	}
 	return 0;
 }
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 1ed0403d..ba7f14cd 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1747,7 +1747,7 @@ void ParseData::semanticAnalysis()
 
 	/* Make the reduced fsm. */
 	RedFsmBuild reduce( sectionName, this, fsmGraph );
-	RedFsm *redFsm = reduce.reduceMachine();
+	redFsm = reduce.reduceMachine();
 
 	/* Build the parsers used for patterns and replacements. */
 	makePatternParsers();
@@ -1774,13 +1774,10 @@ void ParseData::semanticAnalysis()
 	
 	/* Parse patterns and replacements. */
 	parsePatterns();
+}
 
-	/*
-	 * Write output.
-	 */
-
-	openOutput();
-
+void ParseData::generateOutput()
+{
 	FsmCodeGen *fsmGen = new FsmCodeGen("<INPUT>", sectionName,
 			*outStream, redFsm, fsmTables );
 
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 9bf464b4..f2c382f5 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -743,6 +743,15 @@ struct ParseData
 	void resolveUses();
 	void createDefaultScanner();
 	void semanticAnalysis();
+	void generateOutput();
+
+	/* 
+	 * Graphviz Generation
+	 */
+	void writeTransList( PdaState *state );
+	void writeDotFile( PdaGraph *graph );
+	void writeDotFile( );
+	
 
 	/*
 	 * Data collected during the parse.
@@ -885,6 +894,8 @@ struct ParseData
 	ObjFieldMap *objFieldMap;
 
 	bool revertOn;
+
+	RedFsm *redFsm;
 };
 
 void afterOpMinimize( FsmGraph *fsm, bool lastInSeq = true );
-- 
cgit v1.2.1


From f9a1603eead3b6daa97b79eab8a6445fb46af5de Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 13 Feb 2009 04:20:27 +0000
Subject: Now using a single parse table with multiple entry points, instead of
 multiple disjoint tables, one for each nonterminal that must be parsed. I had
 pursued this before but gave up because the EOF token of one parser could
 interfere with another parser. The observation I was missing was that we can
 use unique EOF tokens for each nonterminal we parse, thus avoiding
 interference.

---
 colm/bytecode.cpp   |   8 ++--
 colm/closure.cpp    |  40 ++++++++++-------
 colm/compile.cpp    |   2 +
 colm/dotgen.cpp     |  18 ++++----
 colm/fsmrun.cpp     |   4 +-
 colm/parsedata.cpp  | 108 +++++++++++++++++---------------------------
 colm/parsedata.h    |  25 +++++++----
 colm/pdabuild.cpp   | 127 ++++++++++++++++++++++++++++++++++++++--------------
 colm/pdacodegen.cpp |  19 ++++----
 colm/pdacodegen.h   |   2 +-
 colm/pdagraph.cpp   |   6 ++-
 colm/pdagraph.h     |   1 +
 colm/pdarun.cpp     |   5 ++-
 colm/pdarun.h       |   9 ++--
 14 files changed, 220 insertions(+), 154 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 787fa353..58db7499 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -131,8 +131,8 @@ void send( Tree **root, Program *prg, PdaRun *parser, Tree *tree, bool ignore )
 Tree *call_parser( Tree **&sp, Program *prg, Stream *stream, 
 		long parserId, long stopId, CodeVect *&cv, bool revertOn )
 {
-	PdaTables *tables = prg->rtd->parsers[parserId];
-	PdaRun parser( sp, prg, tables, stream->scanner, stopId, revertOn );
+	PdaTables *tables = prg->rtd->pdaTables;
+	PdaRun parser( sp, prg, tables, parserId, stream->scanner, stopId, revertOn );
 	parser.run();
 	commit_full( &parser, 0 );
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
@@ -156,8 +156,8 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 void undo_parse( Tree **&sp, Program *prg, Stream *stream, 
 		long parserId, Tree *tree, CodeVect *rev )
 {
-	PdaTables *tables = prg->rtd->parsers[parserId];
-	PdaRun parser( sp, prg, tables, stream->scanner, 0, false );
+	PdaTables *tables = prg->rtd->pdaTables;
+	PdaRun parser( sp, prg, tables, parserId, stream->scanner, 0, false );
 	parser.undoParse( tree, rev );
 }
 
diff --git a/colm/closure.cpp b/colm/closure.cpp
index b3c17b1c..5ee6538e 100644
--- a/colm/closure.cpp
+++ b/colm/closure.cpp
@@ -320,7 +320,7 @@ void ParseData::lalr1AddFollow1( PdaGraph *pdaGraph, PdaTrans *trans )
 }
 
 /* Add follow sets to an LR(0) graph to make it LALR(1). */
-void ParseData::lalr1AddFollowSets( PdaGraph *pdaGraph, KlangEl *rootEl )
+void ParseData::lalr1AddFollowSets( PdaGraph *pdaGraph, KlangElSet &parserEls )
 {
 	/* Make the state that all reduction actions go to. Since a reduction pops
 	 * states of the stack and sets the new target state, this state is
@@ -328,13 +328,15 @@ void ParseData::lalr1AddFollowSets( PdaGraph *pdaGraph, KlangEl *rootEl )
 	actionDestState = pdaGraph->addState();
 	pdaGraph->setFinState( actionDestState );
 
-	/* Get the entry into the graph and traverse over start. */
-	PdaState *overStart = pdaGraph->followFsm( pdaGraph->startState, rootEl->rootDef->fsm );
+	for ( KlangElSet::Iter pe = parserEls; pe.lte(); pe++ ) {
+		/* Get the entry into the graph and traverse over start. */
+		PdaState *overStart = pdaGraph->followFsm( (*pe)->startState, (*pe)->rootDef->fsm );
 
-	/* Add _eof after the initial _start. */
-	PdaTrans *eofTrans = pdaGraph->insertNewTrans( overStart, actionDestState, 
-			eofKlangEl->id, eofKlangEl->id );
-	eofTrans->isShift = true;
+		/* Add _eof after the initial _start. */
+		PdaTrans *eofTrans = pdaGraph->insertNewTrans( overStart, actionDestState, 
+				(*pe)->eofLel->id, (*pe)->eofLel->id );
+		eofTrans->isShift = true;
+	}
 
 	/* This was used during lr0 table construction. */
 	pdaGraph->transClosureQueue.abandon();
@@ -416,20 +418,26 @@ void ParseData::addDupTerms( PdaGraph *pdaGraph )
 }
 
 /* Generate a LALR(1) graph. */
-void ParseData::lalr1GenerateParser( PdaGraph *pdaGraph, KlangEl *rootEl )
+void ParseData::lalr1GenerateParser( PdaGraph *pdaGraph, KlangElSet &parserEls )
 {
 	/* Make the intial graph. */
 	pdaGraph->langElIndex = langElIndex;
 
-	PdaState *start = pdaGraph->addState();
-	pdaGraph->setStartState( start );
+	for ( Vector<KlangEl*>::Iter r = parserEls; r.lte(); r++ ) {
+		/* Create the entry point. */
+		PdaState *rs = pdaGraph->addState();
+		pdaGraph->entryStateSet.insert( rs );
+
+		/* State set of just one state. */
+		rs->stateSet = new PdaStateSet;
+		rs->stateSet->insert( (*r)->rootDef->fsm->startState );
 
-	start->stateSet = new PdaStateSet;
-	start->stateSet->insert( rootEl->rootDef->fsm->startState );
+		/* Queue the start state for closure. */
+		rs->onClosureQueue = true;
+		pdaGraph->stateClosureQueue.append( rs );
 
-	/* Queue the start state for closure. */
-	start->onClosureQueue = true;
-	pdaGraph->stateClosureQueue.append( start );
+		(*r)->startState = rs;
+	}
 
 	/* Run the lr0 closure. */
 	lr0CloseAllStates( pdaGraph );
@@ -441,7 +449,7 @@ void ParseData::lalr1GenerateParser( PdaGraph *pdaGraph, KlangEl *rootEl )
 	linkExpansions( pdaGraph );
 
 	/* Walk the graph adding follow sets to the LR(0) graph. */
-	lalr1AddFollowSets( pdaGraph, rootEl );
+	lalr1AddFollowSets( pdaGraph, parserEls );
 
 //	/* Set the commit on the final eof shift. */
 //	PdaTrans *overStart = pdaGraph->startState->findTrans( rootEl->id );
diff --git a/colm/compile.cpp b/colm/compile.cpp
index aab44efc..1f6068bb 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1147,6 +1147,8 @@ UniqueType *LangTerm::evaluateParse( ParseData *pd, CodeVect &code, bool stop )
 	/* Allocate a parser id. This will cause a parser to be built for
 	 * the type. */
 	ut->langEl->parserId = pd->nextParserId++;
+	if ( stop )
+		ut->langEl->parseStop = true;
 
 	/* Parse instruction, dependent on whether or not we are
 	 * producing revert or commit code. */
diff --git a/colm/dotgen.cpp b/colm/dotgen.cpp
index 2fd9bf09..30788a4c 100644
--- a/colm/dotgen.cpp
+++ b/colm/dotgen.cpp
@@ -79,8 +79,12 @@ void ParseData::writeDotFile( PdaGraph *graph )
 	/* Define the psuedo states. Transitions will be done after the states
 	 * have been defined as either final or not final. */
 	out << 
-		"	node [ shape = point ];\n"
-		"	ENTRY [ label = \"\" ];\n"
+		"	node [ shape = point ];\n";
+	
+	for ( int i = 0; i < graph->entryStateSet.length(); i++ )
+		out << "\tENTRY" << i <<  " [ label = \"\" ];\n";
+
+	out << 
 		"\n"
 		"	node [ shape = circle, fixedsize = true, height = 0.2 ];\n";
 
@@ -94,8 +98,9 @@ void ParseData::writeDotFile( PdaGraph *graph )
 	for ( PdaStateList::Iter st = graph->stateList; st.lte(); st++ )
 		writeTransList( st );
 
-	/* Transitions into the start state. */
-	out << "	ENTRY -> " << graph->startState->stateNum << " [ label = \"\" ];\n";
+	/* Start state and other entry points. */
+	for ( PdaStateSet::Iter st = graph->entryStateSet; st.lte(); st++ )
+		out << "\tENTRY" << st.pos() << " -> " << (*st)->stateNum << " [ label = \"\" ];\n";
 
 	out <<
 		"}\n";
@@ -103,9 +108,6 @@ void ParseData::writeDotFile( PdaGraph *graph )
 
 void ParseData::writeDotFile()
 {
-	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
-		if ( lel->parserId >= 0 )
-			writeDotFile( lel->pdaGraph );
-	}
+	writeDotFile( pdaGraph );
 }
 
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index f7602d2f..2ddf8751 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -724,7 +724,7 @@ void FsmRun::sendEOF( )
 	input->tree->flags |= AF_PARSE_TREE;
 
 	input->tree->refs = 1;
-	input->tree->id = parser->tables->rtd->eofId;
+	input->tree->id = parser->tables->rtd->eofLelIds[parser->parserId];
 
 	bool ctxDepParsing = prg->ctxDepParsing;
 	long frameId = parser->tables->rtd->regionInfo[region].eofFrameId;
@@ -748,7 +748,7 @@ void FsmRun::sendEOF( )
 	parser->send( input );
 
 	if ( parser->errCount > 0 ) {
-		parser->parse_error( parser->tables->rtd->eofId, input->tree ) << 
+		parser->parse_error( input->tree->id, input->tree ) << 
 				"parse error" << endp;
 	}
 
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index ba7f14cd..fd38e64e 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1603,29 +1603,6 @@ void InputStreamRepl::pushBackNamed()
 }
 
 
-void ParseData::makePatternParsers()
-{
-	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
-		/* We assume the reduction action compilation phase was run before
-		 * pattern parsing and it decorated the pattern with the target type. */
-		assert( pat->langEl != 0 );
-		if ( pat->langEl->type != KlangEl::NonTerm )
-			error(pat->loc) << "pattern type is not a non-terminal" << endp;
-
-		/* Make a parser for the language element. */
-		makeParser( pat->langEl );
-	}
-
-	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
-		/* We assume the reduction action compilation phase was run before
-		 * replacement parsing decorated the replacement with the target type. */
-		assert( repl->langEl != 0 );
-
-		/* Make a parser for the language element. */
-		makeParser( repl->langEl );
-	}
-}
-
 void ParseData::parsePatterns()
 {
 	Program program( false, runtimeData );
@@ -1639,7 +1616,7 @@ void ParseData::parsePatterns()
 		fsmRun.attachInputStream( &in );
 
 		repl->pdaRun = new PdaRun( root, &program,
-				repl->langEl->pdaTables, &fsmRun, 0, false );
+				pdaTables, repl->langEl->parserId, &fsmRun, 0, false );
 		repl->pdaRun->run();
 
 			//#ifdef COLM_LOG_COMPILE
@@ -1655,7 +1632,7 @@ void ParseData::parsePatterns()
 		fsmRun.attachInputStream( &in );
 
 		pat->pdaRun = new PdaRun( root, &program,
-				pat->langEl->pdaTables, &fsmRun, 0, false );
+				pdaTables, pat->langEl->parserId, &fsmRun, 0, false );
 		pat->pdaRun->run();
 
 			//#ifdef COLM_LOG_COMPILE
@@ -1668,31 +1645,6 @@ void ParseData::parsePatterns()
 	fillInPatterns( &program );
 }
 
-void ParseData::verifyParseStopGrammar( KlangEl *langEl )
-{
-	PdaGraph *pdaGraph = langEl->pdaGraph;
-
-	/* Get the entry into the graph and traverse over the root. The resulting
-	 * state can have eof, nothing else can. */
-	PdaState *overStart = pdaGraph->followFsm( 
-			pdaGraph->startState,
-			langEl->rootDef->fsm );
-
-	/* The graph must reduce to root all on it's own. It cannot depend on
-	 * require EOF. */
-	for ( PdaStateList::Iter st = pdaGraph->stateList; st.lte(); st++ ) {
-		if ( st == overStart )
-			continue;
-
-		for ( TransMap::Iter tr = st->transMap; tr.lte(); tr++ ) {
-			if ( tr->value->lowKey == eofKlangEl->id ) {
-				/* This needs a better error message. Appears to be voodoo. */
-				error() << "grammar is not usable with parse_stop" << endp;
-			}
-		}
-	}
-}
-
 void ParseData::resolveUses()
 {
 	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
@@ -1710,6 +1662,41 @@ void ParseData::resolveUses()
 	}
 }
 
+void ParseData::collectParserEls( BstSet<KlangEl*> &parserEls )
+{
+	for ( PatternList::Iter pat = patternList; pat.lte(); pat++ ) {
+		/* We assume the reduction action compilation phase was run before
+		 * pattern parsing and it decorated the pattern with the target type. */
+		assert( pat->langEl != 0 );
+		if ( pat->langEl->type != KlangEl::NonTerm )
+			error(pat->loc) << "pattern type is not a non-terminal" << endp;
+
+		if ( pat->langEl->parserId < 0 ) {
+			/* Record that this language element needs a parser. */
+			parserEls.insert( pat->langEl );
+			pat->langEl->parserId = nextParserId++;
+		}
+	}
+
+	for ( ReplList::Iter repl = replList; repl.lte(); repl++ ) {
+		/* We assume the reduction action compilation phase was run before
+		 * replacement parsing and it decorated the replacement with the target type. */
+		assert( repl->langEl != 0 );
+
+		if ( repl->langEl->parserId < 0 ) {
+			/* Record that this language element needs a parser. */
+			parserEls.insert( repl->langEl );
+			repl->langEl->parserId = nextParserId++;
+		}
+	}
+
+	/* Also collect every language element that already has a parser id. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->parserId >= 0 )
+			parserEls.insert( lel );
+	}
+}
+
 void ParseData::semanticAnalysis()
 {
 	beginProcessing();
@@ -1749,18 +1736,10 @@ void ParseData::semanticAnalysis()
 	RedFsmBuild reduce( sectionName, this, fsmGraph );
 	redFsm = reduce.reduceMachine();
 
-	/* Build the parsers used for patterns and replacements. */
-	makePatternParsers();
+	BstSet<KlangEl*> parserEls;
+	collectParserEls( parserEls );
 
-	/* Make parsers that we need. */
-	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
-		if ( lel->parserId >= 0 ) {
-			makeParser( lel );
-
-			if ( lel->parseStop )
-				verifyParseStopGrammar( lel );
-		}
-	}
+	makeParser( parserEls );
 
 	/* Make the scanner tables. */
 	fsmTables = redFsm->makeFsmTables();
@@ -1787,13 +1766,10 @@ void ParseData::generateOutput()
 	fsmGen->writeCode();
 
 	/* Make parsers that we need. */
-	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
-		if ( lel->parserId >= 0 )
-			pdaGen->writeParserData( lel->parserId, lel->pdaTables );
-	}
+	pdaGen->writeParserData( 0, pdaTables );
 
 	/* Write the runtime data. */
-	pdaGen->writeRuntimeData( runtimeData );
+	pdaGen->writeRuntimeData( runtimeData, pdaTables );
 
 	outStream->flush();
 }
diff --git a/colm/parsedata.h b/colm/parsedata.h
index f2c382f5..522a7aea 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -147,6 +147,7 @@ typedef Vector< TokenDef* > TokenDefVect;
 struct UniqueType;
 
 typedef Vector<KlangEl*> KlangElVect;
+typedef BstSet<KlangEl*> KlangElSet;
 
 /* A language element class. Can be a nonTerm or a term. */
 struct KlangEl : public DListEl<KlangEl>
@@ -178,6 +179,7 @@ struct KlangEl : public DListEl<KlangEl>
 	bool isRepeat;
 	bool isOpt;
 	bool parseStop;
+	bool isEOF;
 
 	/* Productions from the language element if it is a non-terminal. */
 	LelDefList defList;
@@ -185,10 +187,13 @@ struct KlangEl : public DListEl<KlangEl>
 	TokenDef *tokenDef;
 	Definition *rootDef;
 	KlangEl *termDup;
+	KlangEl *eofLel;
 
 	PdaGraph *pdaGraph;
 	PdaTables *pdaTables;
 
+	PdaState *startState;
+
 	CodeBlock *transBlock;
 
 	ObjectDef *objectDef;
@@ -635,14 +640,14 @@ struct ParseData
 	void lalr1AddFollow2( PdaGraph *pdaGraph, PdaTrans *trans, long followKey, long prior );
 	void lalr1AddFollow1( PdaGraph *pdaGraph, PdaTrans *trans );
 
-	void lalr1AddFollowSets( PdaGraph *pdaGraph, KlangEl *rootEl );
+	void lalr1AddFollowSets( PdaGraph *pdaGraph, KlangElSet &parserEls );
 
 	void lr0BringInItem( PdaGraph *pdaGraph, PdaState *dest, PdaState *prodState, 
 			PdaTrans *expandFrom, Definition *prod );
 	void lr0InvokeClosure( PdaGraph *pdaGraph, PdaState *state );
 	void lr0CloseAllStates( PdaGraph *pdaGraph );
 
-	void lalr1GenerateParser( PdaGraph *pdaGraph, KlangEl *rootEl );
+	void lalr1GenerateParser( PdaGraph *pdaGraph, KlangElSet &parserEls );
 
 	void reduceActions( PdaGraph *pdaGraph );
 
@@ -657,13 +662,13 @@ struct ParseData
 	PdaState *followProd( PdaState *tabState, PdaState *prodState );
 	void findFollow( AlphSet &result, PdaState *overTab, 
 			PdaState *overSrc, Definition *parentDef );
-	void pdaActionOrder( PdaGraph *pdaGraph, KlangEl *rootEl );
+	void pdaActionOrder( PdaGraph *pdaGraph, KlangElSet &parserEls );
 	void pdaOrderFollow( KlangEl *rootEl, PdaState *tabState, 
 			PdaTrans *tabTrans, PdaTrans *srcTrans,
 			Definition *parentDef, Definition *definition, long &time );
 	void pdaOrderProd( KlangEl *rootEl, PdaState *tabState, 
 			PdaState *srcState, Definition *parentDef, long &time );
-	void analyzeMachine( PdaGraph *pdaGraph, KlangEl *rootEl );
+	void analyzeMachine( PdaGraph *pdaGraph, KlangElSet &parserEls );
 
 	void makeProdFsms();
 	void insertUniqueEmptyProductions();
@@ -688,12 +693,11 @@ struct ParseData
 	void addProdRHSLoads( Definition *prod, CodeVect &code, long &insertPos );
 
 	void prepGrammar();
-
-	void makePatternParsers();
 	void parsePatterns();
 
-	void makeParser( KlangEl *rootEl );
-	PdaGraph *makePdaGraph( KlangEl *rootEl );
+	void collectParserEls( KlangElSet &parserEls );
+	void makeParser( KlangElSet &parserEls );
+	PdaGraph *makePdaGraph( BstSet<KlangEl*> &parserEls  );
 	PdaTables *makePdaTables( PdaGraph *pdaGraph );
 
 	void fillInPatterns( Program *prg );
@@ -702,7 +706,7 @@ struct ParseData
 	/* Generate and write out the fsm. */
 	void generateGraphviz();
 
-	void verifyParseStopGrammar( KlangEl *langEl );
+	void verifyParseStopGrammar( KlangEl *langEl, PdaGraph *pdaGraph );
 
 	void initFieldInstructions( ObjField *el );
 	void initLocalInstructions( ObjField *el );
@@ -896,6 +900,9 @@ struct ParseData
 	bool revertOn;
 
 	RedFsm *redFsm;
+
+	PdaGraph *pdaGraph;
+	PdaTables *pdaTables;
 };
 
 void afterOpMinimize( FsmGraph *fsm, bool lastInSeq = true );
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 2c370644..17a85d03 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -73,9 +73,11 @@ KlangEl::KlangEl( Namespace *nspace, const String &name, Type type )
 	isRepeat(false),
 	isOpt(false),
 	parseStop(false),
+	isEOF(false),
 	tokenDef(0),
 	rootDef(0),
 	termDup(0),
+	eofLel(0),
 	pdaGraph(0),
 	pdaTables(0),
 	transBlock(0),
@@ -218,10 +220,11 @@ void ParseData::makeKlangElIds()
 	assert( noTokenMapEl != 0 );
 
 	/* Make the EOF language element. */
-	eofKlangEl = new KlangEl( rootNamespace, strdup("_eof"), KlangEl::Term );
-	langEls.prepend( eofKlangEl );
-	SymbolMapEl *eofMapEl = rootNamespace->symbolMap.insert( eofKlangEl->name, eofKlangEl );
-	assert( eofMapEl != 0 );
+	eofKlangEl = 0;
+//	eofKlangEl = new KlangEl( rootNamespace, strdup("_eof"), KlangEl::Term );
+//	langEls.prepend( eofKlangEl );
+//	SymbolMapEl *eofMapEl = rootNamespace->symbolMap.insert( eofKlangEl->name, eofKlangEl );
+//	assert( eofMapEl != 0 );
 
 	/* Make the "any" language element */
 	anyKlangEl = new KlangEl( rootNamespace, strdup("any"), KlangEl::NonTerm );
@@ -247,6 +250,25 @@ void ParseData::makeKlangElIds()
 		}
 	}
 
+	/* Make an eof language element for every language element except the error and
+	 * no-token ones. This is excessive and needs to be reduced to the ones that we need
+	 * parsers for, but we don't know that yet. Another pass before this one is needed. */
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		if ( lel->eofLel == 0 &&
+				lel != eofKlangEl &&
+				lel != errorKlangEl &&
+				lel != noTokenKlangEl )
+		{
+			String name( lel->name.length() + 5, "_eof_%s", lel->name.data );
+			KlangEl *eofLel = new KlangEl( lel->nspace, name, KlangEl::Term );
+
+			langEls.append( eofLel );
+			lel->eofLel = eofLel;
+			eofLel->eofLel = lel;
+			eofLel->isEOF = true;
+		}
+	}
+
 	/* The first id 0 is reserved for the stack sentinal. A negative id means
 	 * error to the parsing function, inducing backtracking. */
 	nextSymbolId = 1;
@@ -256,7 +278,7 @@ void ParseData::makeKlangElIds()
 		/* Must be a term, and not any of the special reserved terminals.
 		 * Remember if the non terminal is a user non terminal. */
 		if ( lel->type == KlangEl::Term && 
-				lel != eofKlangEl && 
+				!lel->isEOF && 
 				lel != errorKlangEl &&
 				lel != noTokenKlangEl )
 		{
@@ -265,8 +287,15 @@ void ParseData::makeKlangElIds()
 		}
 	}
 
+	//eofKlangEl->id = nextSymbolId++;
+	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
+		/* Assign ids to the eof language elements, which the previous loop
+		 * over the terminals skipped. */
+		if ( lel->isEOF )
+			lel->id = nextSymbolId++;
+	}
+
 	/* Next assign to the eof notoken, which we always create. */
-	eofKlangEl->id = nextSymbolId++;
 	noTokenKlangEl->id = nextSymbolId++;
 
 	/* Possibly assign to the error language element. */
@@ -482,7 +511,7 @@ void ParseData::pdaOrderFollow( KlangEl *rootEl, PdaState *tabState,
 
 	AlphSet alphSet;
 	if ( parentDef == rootEl->rootDef )
-		alphSet.insert( eofKlangEl->id );
+		alphSet.insert( rootEl->eofLel->id );
 	else
 		findFollow( alphSet, overTab, overSrc, parentDef );		
 
@@ -519,7 +548,7 @@ void ParseData::addRegion( PdaState *tabState, long pdaKey )
 
 		/* If it is not the eof, then use the region associated 
 		 * with the token definition. */
-		if ( klangEl != eofKlangEl && klangEl->tokenDef != 0 )
+		if ( !klangEl->isEOF && klangEl->tokenDef != 0 )
 			region = klangEl->tokenDef->tokenRegion;
 
 		if ( region != 0 && !regionVectHas( tabState->regions, region ) )
@@ -620,7 +649,7 @@ void ParseData::pdaOrderProd( KlangEl *rootEl, PdaState *tabState,
 	}
 }
 
-void ParseData::pdaActionOrder( PdaGraph *pdaGraph, KlangEl *rootEl )
+void ParseData::pdaActionOrder( PdaGraph *pdaGraph, KlangElSet &parserEls )
 {
 	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
 		assert( (state->stateBits & SB_ISMARKED) == 0 );
@@ -636,14 +665,16 @@ void ParseData::pdaActionOrder( PdaGraph *pdaGraph, KlangEl *rootEl )
 
 	/* Compute the action orderings, record the max value. */
 	long time = 1;
-	PdaState *startState = rootEl->rootDef->fsm->startState;
-	pdaOrderProd( rootEl, pdaGraph->startState, startState, rootEl->rootDef, time );
-
-	/* Walk over the start lang el and set the time for shift of
-	 * the eof action that completes the parse. */
-	PdaTrans *overStart = pdaGraph->startState->findTrans( rootEl->id );
-	PdaTrans *eofTrans = overStart->toState->findTrans( eofKlangEl->id );
-	eofTrans->actOrds[0] = time++;
+	for ( KlangElSet::Iter pe = parserEls; pe.lte(); pe++ ) {
+		PdaState *startState = (*pe)->rootDef->fsm->startState;
+		pdaOrderProd( *pe, (*pe)->startState, startState, (*pe)->rootDef, time );
+
+		/* Walk over the start lang el and set the time for shift of
+		 * the eof action that completes the parse. */
+		PdaTrans *overStart = (*pe)->startState->findTrans( (*pe)->id );
+		PdaTrans *eofTrans = overStart->toState->findTrans( (*pe)->eofLel->id );
+		eofTrans->actOrds[0] = time++;
+	}
 
 	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
 		if ( state->regions.length() == 0 ) {
@@ -651,7 +682,8 @@ void ParseData::pdaActionOrder( PdaGraph *pdaGraph, KlangEl *rootEl )
 				/* There are no regions and EOF leaves the state. Add the eof
 				 * token region. */
 				PdaTrans *trans = tel->value;
-				if ( trans->lowKey == eofKlangEl->id )
+				KlangEl *lel = langElIndex[trans->lowKey];
+				if ( lel != 0 && lel->isEOF )
 					state->regions.append( eofTokenRegion );
 			}
 		}
@@ -859,7 +891,30 @@ void ParseData::reduceActions( PdaGraph *pdaGraph )
 	}
 }
 
-void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangEl *rootEl )
+void ParseData::verifyParseStopGrammar( KlangEl *langEl, PdaGraph *pdaGraph )
+{
+	/* Get the entry into the graph and traverse over the root. The resulting
+	 * state can have eof, nothing else can. */
+	PdaState *overStart = pdaGraph->followFsm( 
+			langEl->startState,
+			langEl->rootDef->fsm );
+
+	/* The graph must reduce to root all on its own. It cannot depend on
+	 * or require EOF. */
+	for ( PdaStateList::Iter st = pdaGraph->stateList; st.lte(); st++ ) {
+		if ( st == overStart )
+			continue;
+
+		for ( TransMap::Iter tr = st->transMap; tr.lte(); tr++ ) {
+			if ( tr->value->lowKey == langEl->eofLel->id ) {
+				/* This needs a better error message. Appears to be voodoo. */
+				error() << "grammar is not usable with parse_stop" << endp;
+			}
+		}
+	}
+}
+
+void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangElSet &parserEls )
 {
 	pdaGraph->maxState = pdaGraph->stateList.length() - 1;
 	pdaGraph->maxLelId = nextSymbolId - 1;
@@ -879,7 +934,7 @@ void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangEl *rootEl )
 		}
 	}
 
-	pdaActionOrder( pdaGraph, rootEl );
+	pdaActionOrder( pdaGraph, parserEls );
 	sortActions( pdaGraph );
 	advanceReductions( pdaGraph );
 	pdaGraph->setStateNumbers();
@@ -922,6 +977,10 @@ void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangEl *rootEl )
 			}
 		}
 	}
+
+	/* Verify that any type we parse_stop can actually be parsed that way. */
+	for ( KlangElSet::Iter pe = parserEls; pe.lte(); pe++ )
+		verifyParseStopGrammar(*pe, pdaGraph);
 }
 
 void ParseData::wrapNonTerminals()
@@ -1359,12 +1418,16 @@ void ParseData::makeRuntimeData()
 	}
 
 	runtimeData->fsmTables = fsmTables;
+	runtimeData->pdaTables = pdaTables;
 
-	runtimeData->parsers = new PdaTables*[nextParserId];
+	runtimeData->startStates = new int[nextParserId];
+	runtimeData->eofLelIds = new int[nextParserId];
 	runtimeData->numParsers = nextParserId;
 	for ( LelList::Iter lel = langEls; lel.lte(); lel++ ) {
-		if ( lel->parserId >= 0 )
-			runtimeData->parsers[lel->parserId] = lel->pdaTables;
+		if ( lel->parserId >= 0 ) {
+			runtimeData->startStates[lel->parserId] = lel->startState->stateNum;
+			runtimeData->eofLelIds[lel->parserId] = lel->eofLel->id;
+		}
 	}
 		
 
@@ -1379,7 +1442,7 @@ void ParseData::makeRuntimeData()
 	runtimeData->integerId = intKlangEl->id;
 	runtimeData->stringId = strKlangEl->id;
 	runtimeData->anyId = anyKlangEl->id;
-	runtimeData->eofId = eofKlangEl->id;
+	runtimeData->eofId = 0; //eofKlangEl->id;
 	runtimeData->noTokenId = noTokenKlangEl->id;
 }
 
@@ -1503,8 +1566,6 @@ PdaTables *ParseData::makePdaTables( PdaGraph *pdaGraph )
 	int count, curOffset, pos;
 	PdaTables *pdaTables = new PdaTables;
 
-	pdaTables->startState = pdaGraph->startState->stateNum;
-
 	/*
 	 * Indicies.
 	 */
@@ -1687,25 +1748,23 @@ void ParseData::prepGrammar()
 	runtimeData = new RuntimeData;
 }
 
-PdaGraph *ParseData::makePdaGraph( KlangEl *rootEl )
+PdaGraph *ParseData::makePdaGraph( KlangElSet &parserEls )
 {
 	//for ( DefList::Iter prod = prodList; prod.lte(); prod++ )
 	//	cerr << prod->prodId << " " << prod->data << endl;
 
 	PdaGraph *pdaGraph = new PdaGraph();
-	lalr1GenerateParser( pdaGraph, rootEl );
+	lalr1GenerateParser( pdaGraph, parserEls );
 	pdaGraph->setStateNumbers();
-	analyzeMachine( pdaGraph, rootEl );
+	analyzeMachine( pdaGraph, parserEls );
 
 	//cerr << "NUMBER OF STATES: " << pdaGraph->stateList.length() << endl;
 
 	return pdaGraph;
 }
 
-void ParseData::makeParser( KlangEl *rootEl )
+void ParseData::makeParser( KlangElSet &parserEls )
 {
-	if ( rootEl->pdaTables == 0 ) {
-		rootEl->pdaGraph = makePdaGraph( rootEl );
-		rootEl->pdaTables = makePdaTables( rootEl->pdaGraph );
-	}
+	pdaGraph = makePdaGraph( parserEls );
+	pdaTables = makePdaTables( pdaGraph );
 }
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 8067dc06..53530e80 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -92,7 +92,7 @@ void PdaCodeGen::writeFirst()
 		"\n";
 }
 
-void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
+void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTables )
 {
 	/*
 	 * Blocks of code in frames.
@@ -355,10 +355,15 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 		out << "0, ";
 	out << "};\n\n";
 
-	/* Parsers. */
-	out << "PdaTables *parsers[] = {\n\t";
+	out << "int startStates[] = {\n\t";
 	for ( long i = 0; i < runtimeData->numParsers; i++ ) {
-		out << "&pid_" << i << "_pdaTables,\n";
+		out << runtimeData->startStates[i] << ", ";
+	}
+	out << "};\n\n";
+
+	out << "int eofLelIds[] = {\n\t";
+	for ( long i = 0; i < runtimeData->numParsers; i++ ) {
+		out << runtimeData->eofLelIds[i] << ", ";
 	}
 	out << "};\n\n";
 
@@ -398,7 +403,8 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 		"	" << runtimeData->numLiterals << ",\n"
 		"\n"
 		"	&fsmTables_start,\n"
-		"	parsers, " << runtimeData->numParsers << ",\n"
+		"	&pid_0_pdaTables,\n"
+		"	startStates, eofLelIds, " << runtimeData->numParsers << ",\n"
 		"\n"
 		"	" << runtimeData->globalSize << ",\n"
 		"\n"
@@ -415,8 +421,6 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData )
 void PdaCodeGen::writeParserData( long id, PdaTables *tables )
 {
 	String prefix = "pid_" + String(0, "%ld", id) + "_";
-	out << "unsigned int " << prefix << startState() << " = " <<
-		tables->startState << ";\n\n";
 
 	out << "int " << prefix << indicies() << "[] = {\n\t";
 	for ( int i = 0; i < tables->numIndicies; i++ ) {
@@ -529,7 +533,6 @@ void PdaCodeGen::writeParserData( long id, PdaTables *tables )
 	out << 
 		"PdaTables " << prefix << "pdaTables =\n"
 		"{\n"
-		"	" << prefix << startState() << ",\n"
 		"	" << prefix << indicies() << ",\n"
 		"	" << prefix << keys() << ",\n"
 		"	" << prefix << offsets() << ",\n"
diff --git a/colm/pdacodegen.h b/colm/pdacodegen.h
index 216bd9e3..7ca32546 100644
--- a/colm/pdacodegen.h
+++ b/colm/pdacodegen.h
@@ -51,7 +51,7 @@ struct PdaCodeGen
 	void writeRhsLocate( Definition *prod );
 
 	void writeFirst();
-	void writeRuntimeData( RuntimeData *runtimeData );
+	void writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTables );
 	void writeParserData( long id, PdaTables *tables );
 
 	String PARSER() { return "parser_"; }
diff --git a/colm/pdagraph.cpp b/colm/pdagraph.cpp
index 72fd8dfc..ce3c3a7f 100644
--- a/colm/pdagraph.cpp
+++ b/colm/pdagraph.cpp
@@ -497,7 +497,11 @@ void PdaGraph::removeUnreachableStates()
 {
 	/* Mark all the states that can be reached 
 	 * through the existing set of entry points. */
-	markReachableFromHere( startState );
+	if ( startState != 0 )
+		markReachableFromHere( startState );
+
+	for ( PdaStateSet::Iter si = entryStateSet; si.lte(); si++ )
+		markReachableFromHere( *si );
 
 	/* Delete all states that are not marked
 	 * and unmark the ones that are marked. */
diff --git a/colm/pdagraph.h b/colm/pdagraph.h
index fc0e5ef7..479a60de 100644
--- a/colm/pdagraph.h
+++ b/colm/pdagraph.h
@@ -388,6 +388,7 @@ struct PdaGraph
 
 	/* The start state. */
 	PdaState *startState;
+	PdaStateSet entryStateSet;
 
 	/* The set of final states. */
 	PdaStateSet finStateSet;
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index fd52668b..d3a3fd87 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -86,7 +86,8 @@ bool PdaRun::isParserStopFinished()
 
 void PdaRun::init()
 {
-	cs = tables->startState;
+	/* FIXME: need the right one here. */
+	cs = prg->rtd->startStates[parserId];
 
 	/* Init the element allocation variables. */
 	stackTop = prg->kidPool.allocate();
@@ -111,7 +112,7 @@ long PdaRun::stackTopTarget()
 {
 	long state;
 	if ( pt(stackTop->tree)->state < 0 )
-		state = tables->startState;
+		state = prg->rtd->startStates[parserId];
 	else {
 		state = tables->targs[(int)tables->indicies[tables->offsets[
 				pt(stackTop->tree)->state] + 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 9634b20c..61039a7e 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -420,7 +420,9 @@ struct RuntimeData
 	long numLiterals;
 
 	FsmTables *fsmTables;
-	PdaTables **parsers;
+	PdaTables *pdaTables;
+	int *startStates;
+	int *eofLelIds;
 	long numParsers;
 
 	long globalSize;
@@ -437,7 +439,6 @@ struct RuntimeData
 struct PdaTables
 {
 	/* Parser table data. */
-	unsigned int startState;
 	int *indicies;
 	int *keys;
 	unsigned int *offsets;
@@ -466,12 +467,13 @@ typedef Vector<Tree*> Bindings;
 
 struct PdaRun
 {
-	PdaRun( Tree **root, Program *prg, PdaTables *tables, 
+	PdaRun( Tree **root, Program *prg, PdaTables *tables, int parserId,
 			FsmRun *scanner, long stopTarget, bool revertOn )
 	:
 		root(root),
 		prg(prg),
 		tables(tables), 
+		parserId(parserId), 
 		fsmRun(scanner), 
 		stopParsing(false),
 		stopTarget(stopTarget),
@@ -497,6 +499,7 @@ struct PdaRun
 
 	Program *prg;
 	PdaTables *tables;
+	int parserId;
 
 	FsmRun *fsmRun;
 
-- 
cgit v1.2.1


From 56c2836d55f950c5f010b3c4bf85a7bbba5c18a8 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 13 Feb 2009 23:29:45 +0000
Subject: A couple fixes to the last patch.

---
 colm/fsmrun.cpp   | 2 +-
 colm/pdabuild.cpp | 7 +++++--
 2 files changed, 6 insertions(+), 3 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 2ddf8751..8b0e205f 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -316,7 +316,7 @@ void FsmRun::sendBack( Kid *input )
 	sendBackIgnore( tree_ignore( prg, input->tree ) );
 
 	/* If eof was just sent back remember that it needs to be sent again. */
-	if ( input->tree->id == parser->tables->rtd->eofId )
+	if ( input->tree->id == parser->tables->rtd->eofLelIds[parser->parserId] )
 		eofSent = false;
 
 	/* If the item is bound then store remove it from the bindings array. */
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 17a85d03..1937b0c3 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -979,8 +979,11 @@ void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangElSet &parserEls )
 	}
 
 	/* Verify that any type we parse_stop can actually be parsed that way. */
-	for ( KlangElSet::Iter pe = parserEls; pe.lte(); pe++ )
-		verifyParseStopGrammar(*pe, pdaGraph);
+	for ( KlangElSet::Iter pe = parserEls; pe.lte(); pe++ ) {
+		KlangEl *lel = *pe;
+		if ( lel->parseStop )
+			verifyParseStopGrammar(lel , pdaGraph);
+	}
 }
 
 void ParseData::wrapNonTerminals()
-- 
cgit v1.2.1


From e52e24db80a4b9b70e2d034a2eca5da217ca29c7 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 15 Feb 2009 01:18:01 +0000
Subject: Parse errors in patterns and constructors now report the line number
 in the space of the colm source file.

---
 colm/fsmrun.cpp    | 30 ++++++++++++++++--------------
 colm/fsmrun.h      |  2 --
 colm/input.h       | 27 +++++++++++++++++++++------
 colm/lmparse.kl    | 12 ++++++------
 colm/lmscan.rl     |  5 +++--
 colm/parsedata.cpp | 10 ++++++++++
 colm/parsetree.h   | 22 ++++++++++++----------
 colm/pdarun.cpp    |  2 +-
 8 files changed, 69 insertions(+), 41 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 8b0e205f..b027e028 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -45,9 +45,7 @@ void operator<<( ostream &out, exit_object & )
 FsmRun::FsmRun( Program *prg ) :
 	prg(prg),
 	tables(prg->rtd->fsmTables),
-	parser(0),
-	line(1),
-	position(0)
+	parser(0)
 {
 }
 
@@ -119,23 +117,27 @@ void FsmRun::streamPush( const char *data, long length )
 /* Keep the position up to date after consuming text. */
 void update_position( FsmRun *fsmRun, const char *data, long length )
 {
-	for ( int i = 0; i < length; i++ ) {
-		if ( data[i] == '\n' )
-			fsmRun->line += 1;
+	if ( !fsmRun->inputStream->handlesLine ) {
+		for ( int i = 0; i < length; i++ ) {
+			if ( data[i] == '\n' )
+				fsmRun->inputStream->line += 1;
+		}
 	}
 
-	fsmRun->position += length;
+	fsmRun->inputStream->position += length;
 }
 
 /* Keep the position up to date after sending back text. */
 void undo_position( FsmRun *fsmRun, const char *data, long length )
 {
-	for ( int i = 0; i < length; i++ ) {
-		if ( data[i] == '\n' )
-			fsmRun->line -= 1;
+	if ( !fsmRun->inputStream->handlesLine ) {
+		for ( int i = 0; i < length; i++ ) {
+			if ( data[i] == '\n' )
+				fsmRun->inputStream->line -= 1;
+		}
 	}
 
-	fsmRun->position -= length;
+	fsmRun->inputStream->position -= length;
 }
 
 /* Should only be sending back whole tokens/ignores, therefore the send back
@@ -665,7 +667,7 @@ void FsmRun::sendIgnore( long id )
 	parser->ignore( tree );
 
 	/* Prepare for more scanning. */
-	position += length;
+	inputStream->position += length;
 	region = parser->getNextRegion();
 	cs = tables->entryByRegion[region];
 
@@ -769,7 +771,7 @@ void FsmRun::attachInputStream( InputStream *in )
 	p = pe = runBuf->buf;
 	peof = 0;
 	eofSent = false;
-	position = 0;
+	inputStream->position = 0;
 }
 
 long PdaRun::run()
@@ -937,7 +939,7 @@ long FsmRun::run( PdaRun *destParser )
 			}
 
 			/* Machine failed before finding a token. */
-			cerr << "SCANNER ERROR" << endp;
+			cerr << "error:" << inputStream->line << ": scanner error" << endp;
 		}
 
 		space = runBuf->buf + FSM_BUFSIZE - pe;
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index af1edc10..7d96112c 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -121,8 +121,6 @@ struct FsmRun
 	bool eofSent;
 	RunBuf *runBuf;
 	bool gotoResume;
-	long line;
-	long position;
 	char *mark_enter[32];
 	char *mark_leave[32];
 };
diff --git a/colm/input.h b/colm/input.h
index 3796c554..41feef25 100644
--- a/colm/input.h
+++ b/colm/input.h
@@ -33,6 +33,11 @@ struct RunBuf;
 
 struct InputStream
 {
+	InputStream( bool handlesLine ) :
+		line(1),
+		position(0),
+		handlesLine(handlesLine) {}
+
 	virtual ~InputStream() {}
 
 	/* Basic functions. */
@@ -51,12 +56,20 @@ struct InputStream
 		{ assert( false ); return 0; }
 	virtual void pushBackNamed()
 		{ assert( false ); }
+	
+	long line;
+	long position;
+
+	/* This is set true for input streams that do their own line counting.
+	 * Causes FsmRun to ignore NLs. */
+	bool handlesLine;
 };
 
 struct InputStreamString : public InputStream
 {
-	InputStreamString( const String &data )
-		: data(data), offset(0), eof(false) {}
+	InputStreamString( const String &data ) : 
+		InputStream(false), 
+		data(data), offset(0), eof(false) {}
 
 	int getData( char *dest, int length );
 	int isEOF() { return eof; }
@@ -70,8 +83,9 @@ struct InputStreamString : public InputStream
 
 struct InputStreamFile : public InputStream
 {
-	InputStreamFile( FILE *file )
-		: file(file), queue(0) {}
+	InputStreamFile( FILE *file ) :
+		InputStream(false), 
+		file(file), queue(0) {}
 
 	int getData( char *dest, int length );
 	int isEOF();
@@ -85,8 +99,9 @@ struct InputStreamFile : public InputStream
 
 struct InputStreamFD : public InputStream
 {
-	InputStreamFD( long fd )
-		: fd(fd), eof(false), queue(0) {}
+	InputStreamFD( long fd ) :
+		InputStream(false), 
+		fd(fd), eof(false), queue(0) {}
 
 	int isEOF();
 	int needFlush();
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index ef34d20f..dc81e9d9 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -399,7 +399,7 @@ litpat_el_list: ;
 
 litpat_el: TK_LitPat
 	final {
-		PatternItem *patternItem = new PatternItem( $1->data,
+		PatternItem *patternItem = new PatternItem( $1->loc, $1->data,
 			PatternItem::InputText );
 		patternItemList->append( patternItem );
 	};
@@ -444,7 +444,7 @@ pattern_el_type_or_lit: region_qual TK_Word opt_repeat
 	final {
 		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
 				$2->data, 0, $3->opt, $3->repeat );
-		$$->patternItem = new PatternItem( factor, PatternItem::FactorType );
+		$$->patternItem = new PatternItem( $2->loc, factor, PatternItem::FactorType );
 		patternItemList->append( $$->patternItem );
 	};
 
@@ -453,7 +453,7 @@ pattern_el_type_or_lit: region_qual TK_Literal opt_repeat
 		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
 		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
 				literal, 0, $3->opt, $3->repeat );
-		$$->patternItem = new PatternItem( factor, PatternItem::FactorType );
+		$$->patternItem = new PatternItem( $2->loc, factor, PatternItem::FactorType );
 		patternItemList->append( $$->patternItem );
 	};
 
@@ -488,7 +488,7 @@ litrepl_el_list: ;
 
 litrepl_el: TK_LitPat
 	final {
-		ReplItem *replItem = new ReplItem( ReplItem::InputText, $1->data );
+		ReplItem *replItem = new ReplItem( $1->loc, ReplItem::InputText, $1->data );
 		replItemList->append( replItem );
 	};
 
@@ -499,7 +499,7 @@ repl_el_list: ;
 
 repl_el: var_ref
 	final {
-		ReplItem *replItem = new ReplItem( ReplItem::VarRefType, $1->varRef );
+		ReplItem *replItem = new ReplItem( $1->varRef->loc, ReplItem::VarRefType, $1->varRef );
 		replItemList->append( replItem );
 	};
 
@@ -508,7 +508,7 @@ repl_el: region_qual TK_Literal
 		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
 		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
 				literal, 0, false, false );
-		ReplItem *replItem = new ReplItem( ReplItem::FactorType, factor );
+		ReplItem *replItem = new ReplItem( $2->loc, ReplItem::FactorType, factor );
 		replItemList->append( replItem );
 	};
 
diff --git a/colm/lmscan.rl b/colm/lmscan.rl
index d772a887..83283c35 100644
--- a/colm/lmscan.rl
+++ b/colm/lmscan.rl
@@ -165,6 +165,9 @@ void Scanner::token( int type )
 		loc.line = line;
 		loc.col = column;
 
+		if ( tokdata != 0 && tokdata[toklen-1] == '\n' )
+			loc.line -= 1;
+
 		parser->token( loc, type, tokdata, toklen );
 	}
 
@@ -442,8 +445,6 @@ void Scanner::endSection( )
 
 		# Whitespace other than newline.
 		[ \t\r]+ => { updateCol(); };
-
-		# If we are in a single line machine then newline may end the spec.
 		NL => { updateCol(); };
 
 		# Consume eof.
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index fd38e64e..2effebcf 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1386,6 +1386,7 @@ void ParseData::initEmptyScanners()
 
 InputStreamPattern::InputStreamPattern( Pattern *pattern )
 : 
+	InputStream(true),
 	pattern(pattern),
 	patItem(pattern->list->head),
 	offset(0),
@@ -1408,6 +1409,7 @@ KlangEl *InputStreamPattern::getLangEl( long &bindId, char *&data, long &length
 	bindId = patItem->bindId;
 	data = 0;
 	length = 0;
+	line = patItem->loc.line;
 
 	patItem = patItem->next;
 	offset = 0;
@@ -1418,6 +1420,9 @@ KlangEl *InputStreamPattern::getLangEl( long &bindId, char *&data, long &length
 
 int InputStreamPattern::getData( char *dest, int length )
 { 
+	if ( offset == 0 )
+		line = patItem->loc.line;
+
 	assert ( patItem->type == PatternItem::InputText );
 	int available = patItem->data.length() - offset;
 
@@ -1491,6 +1496,7 @@ void InputStreamPattern::pushBackNamed()
 
 InputStreamRepl::InputStreamRepl( Replacement *replacement )
 : 
+	InputStream(true),
 	replacement(replacement),
 	replItem(replacement->list->head),
 	offset(0),
@@ -1517,6 +1523,7 @@ KlangEl *InputStreamRepl::getLangEl( long &bindId, char *&data, long &length )
 
 	data = 0;
 	length = 0;
+	line = replItem->loc.line;
 
 	if ( replItem->type == ReplItem::FactorType ) {
 		if ( replItem->factor->literal != 0 ) {
@@ -1538,6 +1545,9 @@ KlangEl *InputStreamRepl::getLangEl( long &bindId, char *&data, long &length )
 
 int InputStreamRepl::getData( char *dest, int length )
 { 
+	if ( offset == 0 )
+		line = replItem->loc.line;
+
 	assert ( replItem->type == ReplItem::InputText );
 	int available = replItem->data.length() - offset;
 
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 96449c43..a9e4f6c1 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -907,14 +907,15 @@ struct PatternItem
 		InputText
 	};
 
-	PatternItem( const String &data, Type type ) : 
-			factor(0), data(data), type(type), region(0), 
+	PatternItem( const InputLoc &loc, const String &data, Type type ) : 
+			loc(loc), factor(0), data(data), type(type), region(0), 
 			varRef(0), bindId(0) {}
 
-	PatternItem( PdaFactor *factor, Type type ) : 
-			factor(factor), type(type), region(0), 
+	PatternItem( const InputLoc &loc, PdaFactor *factor, Type type ) : 
+			loc(loc), factor(factor), type(type), region(0), 
 			varRef(0), bindId(0) {}
 
+	InputLoc loc;
 	PdaFactor *factor;
 	String data;
 	Type type;
@@ -935,15 +936,16 @@ struct ReplItem
 		FactorType
 	};
 
-	ReplItem( Type type, const String &data ) : 
-		type(type), data(data), varRef(0), bindId(0) {}
+	ReplItem( const InputLoc &loc, Type type, const String &data ) : 
+		loc(loc), type(type), data(data), varRef(0), bindId(0) {}
 
-	ReplItem( Type type, LangVarRef *varRef ) : 
-		type(type), varRef(varRef), bindId(0) {}
+	ReplItem( const InputLoc &loc, Type type, LangVarRef *varRef ) : 
+		loc(loc), type(type), varRef(varRef), bindId(0) {}
 
-	ReplItem( Type type, PdaFactor *factor ) : 
-		type(type), factor(factor), bindId(0) {}
+	ReplItem( const InputLoc &loc, Type type, PdaFactor *factor ) : 
+		loc(loc), type(type), factor(factor), bindId(0) {}
 
+	InputLoc loc;
 	Type type;
 	String data;
 	LangVarRef *varRef;
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index d3a3fd87..07bd8d09 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -701,7 +701,7 @@ _out:
 
 ostream &PdaRun::parse_error( int tokId, Tree *tree )
 {
-	cerr << "error:" << fsmRun->line << ": at token ";
+	cerr << "error:" << fsmRun->inputStream->line << ": at token ";
 	if ( tokId < 128 )
 		cerr << "\"" << tables->rtd->lelInfo[tokId].name << "\"";
 	else 
-- 
cgit v1.2.1


From 7d7be6ccc3a13c5bfb6d145d947508af096994c7 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 15 Feb 2009 17:39:56 +0000
Subject: added a couple missing includes

---
 test/mediawiki/garticle.rl | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/test/mediawiki/garticle.rl b/test/mediawiki/garticle.rl
index ca711a85..cc101364 100644
--- a/test/mediawiki/garticle.rl
+++ b/test/mediawiki/garticle.rl
@@ -1,5 +1,7 @@
 #include <iostream>
 #include <fstream>
+#include <stdlib.h>
+#include <string.h>
 
 using std::cout;
 using std::cerr;
-- 
cgit v1.2.1


From 4daa230e86bcf1a126f9a469257302fb0f36bfba Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 15 Feb 2009 23:07:32 +0000
Subject: label the states

---
 colm/dotgen.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/colm/dotgen.cpp b/colm/dotgen.cpp
index 30788a4c..eb69ba16 100644
--- a/colm/dotgen.cpp
+++ b/colm/dotgen.cpp
@@ -86,11 +86,11 @@ void ParseData::writeDotFile( PdaGraph *graph )
 
 	out << 
 		"\n"
-		"	node [ shape = circle, fixedsize = true, height = 0.2 ];\n";
+		"	node [ shape = circle, fixedsize = true, height = 0.6 ];\n";
 
 	/* Walk the states. */
 	for ( PdaStateList::Iter st = graph->stateList; st.lte(); st++ )
-		out << "	" << st->stateNum << " [ label = \"\" ];\n";
+		out << "	" << st->stateNum << " [ label = \"" << st->stateNum << "\" ];\n";
 
 	out << "\n";
 
-- 
cgit v1.2.1


From 27ad94aba9f211bcdb4b2d1c83d22ce97464a503 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 15 Feb 2009 23:12:44 +0000
Subject: Unset action orderings are a reality due to the fact that we are
 using LALR(1). They are not a user-level warning. Just order them last since
 they result in parse errors anyway.

---
 colm/pdabuild.cpp | 16 +++++-----------
 1 file changed, 5 insertions(+), 11 deletions(-)

diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 1937b0c3..a18f388f 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -699,24 +699,18 @@ void ParseData::pdaActionOrder( PdaGraph *pdaGraph, KlangElSet &parserEls )
 		}
 	}
 
+	/* Some actions may not have an ordering. I believe these to be actions
+	 * that result in a parse error and they arise because the state tables
+	 * are LALR(1) but the action ordering is LR(1). LALR(1) causes some
+	 * reductions that lead nowhere. */
 	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
 		assert( CmpDotSet::compare( state->dotSet, state->dotSet2 ) == 0 );
 		for ( TransMap::Iter tel = state->transMap; tel.lte(); tel++ ) {
 			PdaTrans *trans = tel->value;
 			/* Check every action has an ordering. */
 			for ( ActDataList::Iter adl = trans->actOrds; adl.lte(); adl++ ) {
-				if ( *adl == 0 ) {
-					warning() << "action ordering for " << 
-						trans->actions[adl.pos()] << " is unset, state: " << 
-						state->stateNum << ", trans: ";
-
-					KlangEl *lel = langElIndex[trans->lowKey];
-					if ( lel == 0 )
-						cerr << (char)trans->lowKey << endl;
-					else
-						cerr << lel->name << endl;
+				if ( *adl == 0 )
 					*adl = time++;
-				}
 			}
 		}
 	}
-- 
cgit v1.2.1


From 68a67ac3f363da3ce29765edf1d892993301d455 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 16 Feb 2009 16:53:55 +0000
Subject: Don't allow KW_Def statements to add to the production list. This
 is left over from Kelbt.

---
 colm/lmparse.kl | 66 ++++++++++++++++++++++++++++-----------------------------
 1 file changed, 32 insertions(+), 34 deletions(-)

diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index dc81e9d9..46006f51 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -246,17 +246,11 @@ global_def: KW_Global var_def opt_def_init
 		}
 	};
 
-cfl_def: KW_Def cfl_id obj_var_list properties_list cfl_prod_list
+cfl_def: cfl_def_head obj_var_list properties_list cfl_prod_list
 	final {
 		/* Get the language element. */
 		KlangEl *langEl = getKlangEl( pd, namespaceStack.top(), 
-				curDefineId, KlangEl::NonTerm );
-
-		/* Check that the element wasn't previously defined as something else. */
-		if ( langEl->type != KlangEl::Unknown && langEl->type != KlangEl::NonTerm ) {
-			error($1->loc) << "'" << curDefineId << 
-				"' already defined as something else" << endp;
-		}
+				curDefineId, KlangEl::Unknown );
 
 		/* Make a new object definition. */
 		ObjectDef *objectDef = new ObjectDef( ObjectDef::UserType, curDefineId, 
@@ -265,9 +259,21 @@ cfl_def: KW_Def cfl_id obj_var_list properties_list cfl_prod_list
 		langEl->objectDef = objectDef;
 	};
 
-cfl_id: TK_Word
+cfl_def_head: KW_Def TK_Word
 	final {
-		curDefineId = $1->data;
+		curDefineId = $2->data;
+
+		/* Get the language element. */
+		KlangEl *langEl = getKlangEl( pd, namespaceStack.top(), 
+				$2->data, KlangEl::Unknown );
+
+		/* Check that the element wasn't previously defined as something else. */
+		if ( langEl->type != KlangEl::Unknown ) {
+			error($2->loc) << "'" << curDefineId << 
+				"' has already been defined, maybe you want to use redef?" << endp;
+		}
+
+		langEl->type = KlangEl::NonTerm;
 	};
 
 cfl_prod_list: cfl_prod_list '|' define_prod;
@@ -281,7 +287,7 @@ property:
 	final {
 		/* Get the language element. */
 		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
-				curDefineId, KlangEl::NonTerm );
+				curDefineId, KlangEl::Unknown );
 		prodName->reduceFirst = true;
 	};
 
@@ -835,7 +841,7 @@ start_reduce:
 
 		/* Get the language element. */
 		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
-			curDefineId, KlangEl::NonTerm );
+			curDefineId, KlangEl::Unknown );
 
 		/* References to the reduce item. */
 		pd->addProdRedObjectVar( pd->curLocalFrame, prodName );
@@ -1959,32 +1965,24 @@ void Parser::addProduction( InputLoc &loc, const String &name,
 {
 	/* Get the language element. */
 	KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
-			name, KlangEl::NonTerm );
+			name, KlangEl::Unknown );
 
-	/* Check that the element wasn't previously defined as something else. */
-	if ( prodName->type != KlangEl::Unknown 
-			&& prodName->type != KlangEl::NonTerm )
-	{
-		error(loc) << "'" << name << "' already defined as something else" << endp;
-	}
-	else {
-		Namespace *nspace = namespaceStack.top();
+	assert( prodName->type == KlangEl::NonTerm );
+	Namespace *nspace = namespaceStack.top();
 
-		prodName->type = KlangEl::NonTerm;
-		Definition *newDef = new Definition( loc, prodName, 
-				prodElList, commit, redBlock,
-				pd->prodList.length(), Definition::Production );
+	Definition *newDef = new Definition( loc, prodName, 
+		prodElList, commit, redBlock,
+		pd->prodList.length(), Definition::Production );
 
-		prodName->defList.append( newDef );
-		pd->prodList.append( newDef );
+	prodName->defList.append( newDef );
+	pd->prodList.append( newDef );
 
-		/* If the token has the same name as the region it is in, then also
-		 * insert it into the symbol map for the parent region. */
-		if ( strcmp( name, nspace->name ) == 0 ) {
-			/* Insert the name into the top of the region stack after popping the
-			 * region just created. We need it in the parent. */
-			nspace->parentNamespace->symbolMap.insert( name, prodName );
-		}
+	/* If the token has the same name as the region it is in, then also
+	 * insert it into the symbol map for the parent region. */
+	if ( strcmp( name, nspace->name ) == 0 ) {
+		/* Insert the name into the top of the region stack after popping the
+		 * region just created. We need it in the parent. */
+		nspace->parentNamespace->symbolMap.insert( name, prodName );
 	}
 }
 
-- 
cgit v1.2.1


From ce09765debae50348d84db942193e69fc26aa522 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 16 Feb 2009 17:50:11 +0000
Subject: The getKlangEl now always creates tokens with the Unknown type. If it
 comes back unknown then it hasn't been previously defined as anything.

Now reporting an error if tokens, maps and lists are defined more than once.
---
 colm/lmparse.kl    | 43 ++++++++++++++++++++-----------------------
 colm/parsedata.cpp | 23 ++++++++++-------------
 colm/parsedata.h   |  3 +--
 colm/pdabuild.cpp  | 10 +++++-----
 4 files changed, 36 insertions(+), 43 deletions(-)

diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 46006f51..799418a1 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -173,13 +173,14 @@ generic_def: KW_Map TK_Word '[' type_ref type_ref ']'
 	final {
 		Namespace *nspace = namespaceStack.top();
 
-		KlangEl *langEl = getKlangEl( pd, nspace, $2->data, KlangEl::NonTerm );
+		KlangEl *langEl = getKlangEl( pd, nspace, $2->data );
 
 		/* Check that the element wasn't previously defined as something else. */
-		if ( langEl->type != KlangEl::Unknown && langEl->type != KlangEl::NonTerm ) {
-			error($1->loc) << "'" << curDefineId << 
+		if ( langEl->type != KlangEl::Unknown ) {
+			error($1->loc) << "'" << $2->data << 
 				"' already defined as something else" << endp;
 		}
+		langEl->type = KlangEl::NonTerm;
 
 		GenericType *generic = new GenericType( $2->data, GEN_MAP,
 				pd->nextGenericId++, langEl, $5->typeRef );
@@ -197,13 +198,14 @@ generic_def: KW_List TK_Word '[' type_ref ']'
 	final {
 		/* Get the language element. */
 		Namespace *nspace = namespaceStack.top();
-		KlangEl *langEl = getKlangEl( pd, nspace, $2->data, KlangEl::NonTerm );
+		KlangEl *langEl = getKlangEl( pd, nspace, $2->data );
 
 		/* Check that the element wasn't previously defined as something else. */
-		if ( langEl->type != KlangEl::Unknown && langEl->type != KlangEl::NonTerm ) {
-			error($1->loc) << "'" << curDefineId << 
+		if ( langEl->type != KlangEl::Unknown ) {
+			error($1->loc) << "'" << $2->data << 
 				"' already defined as something else" << endp;
 		}
+		langEl->type = KlangEl::NonTerm;
 
 		GenericType *generic = new GenericType( $2->data, GEN_LIST, 
 				pd->nextGenericId++, langEl, $4->typeRef );
@@ -249,8 +251,7 @@ global_def: KW_Global var_def opt_def_init
 cfl_def: cfl_def_head obj_var_list properties_list cfl_prod_list
 	final {
 		/* Get the language element. */
-		KlangEl *langEl = getKlangEl( pd, namespaceStack.top(), 
-				curDefineId, KlangEl::Unknown );
+		KlangEl *langEl = getKlangEl( pd, namespaceStack.top(), curDefineId );
 
 		/* Make a new object definition. */
 		ObjectDef *objectDef = new ObjectDef( ObjectDef::UserType, curDefineId, 
@@ -264,8 +265,7 @@ cfl_def_head: KW_Def TK_Word
 		curDefineId = $2->data;
 
 		/* Get the language element. */
-		KlangEl *langEl = getKlangEl( pd, namespaceStack.top(), 
-				$2->data, KlangEl::Unknown );
+		KlangEl *langEl = getKlangEl( pd, namespaceStack.top(), $2->data );
 
 		/* Check that the element wasn't previously defined as something else. */
 		if ( langEl->type != KlangEl::Unknown ) {
@@ -286,8 +286,7 @@ property:
 	KW_ReduceFirst
 	final {
 		/* Get the language element. */
-		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
-				curDefineId, KlangEl::Unknown );
+		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), curDefineId );
 		prodName->reduceFirst = true;
 	};
 
@@ -612,9 +611,9 @@ literal_item: TK_Literal
 			error( $1->loc ) << "literal already defined in this namespace" << endp;
 		else {
 			/* Create a token for the literal. */
-			KlangEl *newLangEl = getKlangEl( pd, nspace, name, KlangEl::Term );
-			assert( newLangEl != 0 );
-			assert( newLangEl->type == KlangEl::Term );
+			KlangEl *newLangEl = getKlangEl( pd, nspace, name );
+			assert( newLangEl->type == KlangEl::Unknown );
+			newLangEl->type = KlangEl::Term;
 			newLangEl->lit = $1->data;
 			newLangEl->isLiteral = true;
 
@@ -660,9 +659,9 @@ token_def:
 			name.setAs( 32, "_ignore_%.4x", pd->nextTokenId );
 
 		/* Create the token. */
-		KlangEl *tokEl = getKlangEl( pd, namespaceStack.top(), name, KlangEl::Term );
-		if ( tokEl->type != KlangEl::Unknown && tokEl->type != KlangEl::Term )
-			error($1->loc) << "'" << name << "' already defined as something else" << endp;
+		KlangEl *tokEl = getKlangEl( pd, namespaceStack.top(), name );
+		if ( tokEl->type != KlangEl::Unknown )
+			error($1->loc) << "'" << name << "' already defined" << endp;
 
 		tokEl->type = KlangEl::Term;
 		tokEl->ignore = ignore;
@@ -840,8 +839,7 @@ start_reduce:
 		$$->localFrame = $1->localFrame;
 
 		/* Get the language element. */
-		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
-			curDefineId, KlangEl::Unknown );
+		KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), curDefineId );
 
 		/* References to the reduce item. */
 		pd->addProdRedObjectVar( pd->curLocalFrame, prodName );
@@ -1956,7 +1954,7 @@ void Parser::addRegularDef( const InputLoc &loc, Namespace *nspace,
 	}
 	else {
 		// Recover by ignoring the duplicate.
-		error(loc) << "fsm \"" << name << "\" previously defined" << endl;
+		error(loc) << "regular definition \"" << name << "\" already exists" << endl;
 	}
 }
 
@@ -1964,8 +1962,7 @@ void Parser::addProduction( InputLoc &loc, const String &name,
 		ProdElList *prodElList, bool commit, CodeBlock *redBlock )
 {
 	/* Get the language element. */
-	KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), 
-			name, KlangEl::Unknown );
+	KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), name );
 
 	assert( prodName->type == KlangEl::NonTerm );
 	Namespace *nspace = namespaceStack.top();
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 2effebcf..c0f086b5 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1090,10 +1090,9 @@ void ParseData::createDefaultScanner()
 
 	/* Now create the one and only token -> "<chr>" / any /  */
 	name = "___DEFAULT_SCANNER_CHR";
-	defaultCharKlangEl = getKlangEl( this, defaultNamespace, 
-			name, KlangEl::Term );
-	assert( defaultCharKlangEl != 0 );
-	assert( defaultCharKlangEl->type == KlangEl::Term );
+	defaultCharKlangEl = getKlangEl( this, defaultNamespace, name );
+	assert( defaultCharKlangEl->type == KlangEl::Unknown );
+	defaultCharKlangEl->type = KlangEl::Term;
 
 	Join *join = new Join( new Expression( BT_Any ) );
 		
@@ -1138,7 +1137,7 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 	fact->nspace = nspace;
 
 	/* Look up the language element in the region. */
-	KlangEl *langEl = getKlangEl( this, nspace, fact->refName, KlangEl::Unknown );
+	KlangEl *langEl = getKlangEl( this, nspace, fact->refName );
 
 	if ( fact->opt ) {
 		/* If the factor is an opt, create the opt element and link the factor
@@ -1150,7 +1149,7 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 			fact->langEl = inDict->value;
 		}
 		else {
-			KlangEl *prodName = getKlangEl( this, nspace, optName, KlangEl::NonTerm );
+			KlangEl *prodName = getKlangEl( this, nspace, optName );
 			prodName->type = KlangEl::NonTerm;
 			prodName->isOpt = true;
 
@@ -1191,8 +1190,7 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 			fact->langEl = inDict->value;
 		}
 		else {
-			KlangEl *prodName = getKlangEl( this, nspace,
-					repeatName, KlangEl::NonTerm );
+			KlangEl *prodName = getKlangEl( this, nspace, repeatName );
 			prodName->type = KlangEl::NonTerm;
 			prodName->isRepeat = true;
 
@@ -1364,10 +1362,9 @@ void ParseData::initEmptyScanners()
 			InputLoc loc;
 			String name( reg->name.length() + 16, "__%s_DEF_PAT", reg->name.data );
 
-			KlangEl *lel = getKlangEl( this, rootNamespace,
-					name.data, KlangEl::Term );
-			assert( lel != 0 );
-			assert( lel->type == KlangEl::Term );
+			KlangEl *lel = getKlangEl( this, rootNamespace, name.data );
+			assert( lel->type == KlangEl::Unknown );
+			lel->type = KlangEl::Term;
 
 			Join *join = new Join( new Expression( BT_Any ) );
 				
@@ -1666,7 +1663,7 @@ void ParseData::resolveUses()
 				error() << "do not have namespace for resolving reference" << endp;
 	
 			/* Look up the language element in the region. */
-			KlangEl *langEl = getKlangEl( this, nspace, lel->objectDefUses, KlangEl::Unknown );
+			KlangEl *langEl = getKlangEl( this, nspace, lel->objectDefUses );
 			lel->objectDef = langEl->objectDef;
 		}
 	}
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 522a7aea..ab60f859 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -924,7 +924,6 @@ struct Parser;
 typedef AvlMap<String, Parser *, CmpStr> ParserDict;
 typedef AvlMapEl<String, Parser *> ParserDictEl;
 
-KlangEl *getKlangEl( ParseData *pd, Namespace *nspace,
-		const String &data, KlangEl::Type defType );
+KlangEl *getKlangEl( ParseData *pd, Namespace *nspace, const String &data );
 
 #endif /* _PARSEDATA_H */
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index a18f388f..4c718399 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -125,15 +125,14 @@ PdaGraph *ProdElList::walk( ParseData *pd )
 }
 
 
-KlangEl *getKlangEl( ParseData *pd, Namespace *nspace,
-		const String &data, KlangEl::Type defType )
+KlangEl *getKlangEl( ParseData *pd, Namespace *nspace, const String &data )
 {
     /* If the id is already in the dict, it will be placed in last found. If
      * it is not there then it will be inserted and last found will be set to it. */
     SymbolMapEl *inDict = nspace->symbolMap.find( data );
     if ( inDict == 0 ) {
         /* Language element not there. Make the new lang el and insert.. */
-        KlangEl *langEl = new KlangEl( nspace, data, defType );
+        KlangEl *langEl = new KlangEl( nspace, data, KlangEl::Unknown );
         inDict = nspace->symbolMap.insert( langEl->name, langEl );
         pd->langEls.append( langEl );
     }
@@ -1191,8 +1190,9 @@ void ParseData::insertUniqueEmptyProductions()
 		/* Get a language element. */
 		char name[20];
 		sprintf(name, "U%li", prodList.length());
-		KlangEl *prodName = getKlangEl( this, rootNamespace,
-				name, KlangEl::NonTerm );
+		KlangEl *prodName = getKlangEl( this, rootNamespace, name );
+		assert( prodName->type == KlangEl::Unknown );
+		prodName->type = KlangEl::NonTerm;
 		Definition *newDef = new Definition( InputLoc(), prodName, 
 				0 /* FIXME new VarDef( name, 0 )*/, 
 				false, 0, prodList.length(), Definition::Production );
-- 
cgit v1.2.1


From 296c3de188a7a42649b5a821348e08b4561718dd Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 22 Feb 2009 02:06:41 +0000
Subject: Started precedence implementation.

---
 colm/lmparse.kh    |  4 ++++
 colm/lmparse.kl    | 33 +++++++++++++++++++++++++++-
 colm/lmscan.rl     |  4 ++++
 colm/parsedata.cpp | 15 ++++++++++++-
 colm/parsedata.h   | 14 +++++++++++-
 colm/pdabuild.cpp  | 64 +++++++++++++++++++++++++++++++++++++++++++++++++++++-
 6 files changed, 130 insertions(+), 4 deletions(-)

diff --git a/colm/lmparse.kh b/colm/lmparse.kh
index bac8a62d..47678353 100644
--- a/colm/lmparse.kh
+++ b/colm/lmparse.kh
@@ -60,6 +60,8 @@ struct Parser
 
 	token KW_Include, KW_Preeof;
 
+	token KW_Left, KW_Right, KW_Nonassoc, KW_Prec;
+
 	}%%
 
 	%% write instance_data;
@@ -99,6 +101,8 @@ struct Parser
 
 	String curDefineId;
 	ProdElList *curProdElList;
+
+	PredType predType;
 };
 
 %% write token_defs;
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 799418a1..489f0bf8 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -77,6 +77,7 @@ root_item: iter_def commit final { $$->stmt = 0; };
 root_item: global_def commit final { $$->stmt = $1->stmt; };
 root_item: statement commit final { $$->stmt = $1->stmt; };
 root_item: pre_eof commit final { $$->stmt = 0; };
+root_item: precedence commit final { $$->stmt = 0; };
 
 nonterm block_open
 {
@@ -248,6 +249,36 @@ global_def: KW_Global var_def opt_def_init
 		}
 	};
 
+precedence: pred_type pred_token_list final { pd->predValue++; };
+
+pred_type: KW_Left final { predType = PredLeft; };
+pred_type: KW_Right final { predType = PredRight; };
+pred_type: KW_Nonassoc final { predType = PredNonassoc; };
+
+pred_token_list: pred_token_list ',' pred_token;
+pred_token_list: pred_token;
+
+pred_token: 
+	region_qual TK_Word 
+	final {
+		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
+				$2->data, 0, false, false );
+		pd->resolveReferenceFactor( factor );
+		factor->langEl->predType = predType;
+		factor->langEl->predValue = pd->predValue;
+	};
+
+pred_token: 
+	region_qual TK_Literal 
+	final {
+		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
+		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
+				literal, 0, false, false );
+		pd->resolveLiteralFactor( factor );
+		factor->langEl->predType = predType;
+		factor->langEl->predValue = pd->predValue;
+	};
+
 cfl_def: cfl_def_head obj_var_list properties_list cfl_prod_list
 	final {
 		/* Get the language element. */
@@ -1970,7 +2001,7 @@ void Parser::addProduction( InputLoc &loc, const String &name,
 	Definition *newDef = new Definition( loc, prodName, 
 		prodElList, commit, redBlock,
 		pd->prodList.length(), Definition::Production );
-
+	
 	prodName->defList.append( newDef );
 	pd->prodList.append( newDef );
 
diff --git a/colm/lmscan.rl b/colm/lmscan.rl
index 83283c35..8d42f274 100644
--- a/colm/lmscan.rl
+++ b/colm/lmscan.rl
@@ -390,6 +390,10 @@ void Scanner::endSection( )
 		'deref' => { token( KW_Deref ); };
 		'require' => { token( KW_Require ); };
 		'preeof' => { token( KW_Preeof ); };
+		'left' => { token( KW_Left ); };
+		'right' => { token( KW_Right ); };
+		'nonassoc' => { token( KW_Nonassoc ); };
+		'prec' => { token( KW_Prec ); };
 
 		# Identifiers.
 		ident => { token( TK_Word, ts, te ); } ;
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index c0f086b5..116e576d 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -428,7 +428,8 @@ ParseData::ParseData( const String &fileName, const String &sectionName,
 	nextFrameId(0),
 	nextParserId(0),
 	nextLabelId(0),
-	revertOn(true)
+	revertOn(true),
+	predValue(0)
 {
 }
 
@@ -1243,11 +1244,23 @@ void ParseData::resolveFactor( PdaFactor *fact )
 	}
 }
 
+/* Resolves production els and computes the precedence of each prod. */
 void ParseData::resolveProductionEls()
 {
 	for ( DefList::Iter prod = prodList; prod.lte(); prod++ ) {
+		/* First resolve. */
 		for ( ProdElList::Iter fact = *prod->prodElList; fact.lte(); fact++ )
 			resolveFactor( fact );
+
+		/* Compute the precedence of the productions. */
+		for ( ProdElList::Iter fact = prod->prodElList->last(); fact.gtb(); fact-- ) {
+			/* Production inherits the precedence of the last terminal with
+			 * precedence. */
+			if ( fact->langEl->predType != PredNone ) {
+				prod->predOf = fact->langEl;
+				break;
+			}
+		}
 	}
 }
 
diff --git a/colm/parsedata.h b/colm/parsedata.h
index ab60f859..416dfa4a 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -75,6 +75,8 @@ typedef Vector< PdaFactor* > FactorVect;
 typedef AvlMap<String, long, CmpStr> StringMap;
 typedef AvlMapEl<String, long> StringMapEl;
 
+enum PredType { PredLeft, PredRight, PredNonassoc, PredNone };
+
 /* Graph dictionary. */
 struct Definition 
 :
@@ -87,7 +89,7 @@ struct Definition
 		loc(loc), prodName(prodName), prodElList(prodElList), 
 		prodCommit(prodCommit), redBlock(redBlock), prodId(prodId), 
 		type(type), fsm(0), fsmLength(0), uniqueEmptyLeader(0), 
-		isLeftRec(false), localFrame(0), lhsField(0) {}
+		isLeftRec(false), localFrame(0), lhsField(0), predOf(0) {}
 
 	InputLoc loc;
 	KlangEl *prodName;
@@ -112,6 +114,8 @@ struct Definition
 
 	ObjectDef *localFrame;
 	ObjField *lhsField;
+
+	KlangEl *predOf;
 };
 
 struct CmpDefById
@@ -206,6 +210,9 @@ struct KlangEl : public DListEl<KlangEl>
 	GenericType *generic;
 
 	long parserId;
+
+	PredType predType;
+	long predValue;
 };
 
 struct PdaFactor
@@ -510,6 +517,9 @@ struct ParseData
 
 	void analyzeAction( Action *action, InlineList *inlineList );
 	void analyzeGraph( FsmGraph *graph );
+	void resolvePrecedence( PdaGraph *pdaGraph );
+	KlangEl *predOf( PdaTrans *trans, long action );
+	bool precedenceSwap( KlangEl *l1, KlangEl *l2 );
 
 	void initKeyOps();
 
@@ -903,6 +913,8 @@ struct ParseData
 
 	PdaGraph *pdaGraph;
 	PdaTables *pdaTables;
+
+	long predValue;
 };
 
 void afterOpMinimize( FsmGraph *fsm, bool lastInSeq = true );
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 4c718399..7d424e2f 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -85,7 +85,9 @@ KlangEl::KlangEl( Namespace *nspace, const String &name, Type type )
 	thisSize(0),
 	ofiOffset(0),
 	generic(0),
-	parserId(-1)
+	parserId(-1),
+	predType(PredNone),
+	predValue(0)
 {
 }
  
@@ -907,6 +909,65 @@ void ParseData::verifyParseStopGrammar( KlangEl *langEl, PdaGraph *pdaGraph )
 	}
 }
 
+KlangEl *ParseData::predOf( PdaTrans *trans, long action )
+{
+	KlangEl *lel;
+	if ( action == SHIFT_CODE )
+		lel = langElIndex[trans->lowKey];
+	else
+		lel = prodIdIndex[action >> 2]->predOf;
+	return lel;
+}
+
+bool ParseData::precedenceSwap( KlangEl *l1, KlangEl *l2 )
+{
+	bool swap = false;
+	if ( l2->predValue > l1->predValue )
+		swap = true;
+	else if ( l1->predValue == l2->predValue ) {
+		if ( l1->predType == PredLeft && trans->actions[i] == SHIFT_CODE )
+			swap = true;
+		else if ( l1->predType == PredRight && trans->actions[j] == SHIFT_CODE )
+			swap = true;
+	}
+	return swap;
+}
+
+void ParseData::resolvePrecedence( PdaGraph *pdaGraph )
+{
+	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
+		assert( CmpDotSet::compare( state->dotSet, state->dotSet2 ) == 0 );
+		for ( TransMap::Iter tel = state->transMap; tel.lte(); tel++ ) {
+			PdaTrans *trans = tel->value;
+
+again:
+			/* Find action with precedence. */
+			for ( int i = 0; i < trans->actions.length(); i++ ) {
+				KlangEl *li = predOf( trans, trans->actions[i] );
+					
+				if ( li != 0 && li->predValue != PredNone ) {
+					/* Find another action with precedence. */
+					for ( int j = i+1; j < trans->actions.length(); j++ ) {
+						KlangEl *lj = predOf( trans, trans->actions[j] );
+
+						if ( lj != 0 && lj->predValue != PredNone ) {
+							/* Conflict to check. */
+							bool swap = precedenceSwap( li, lj );
+							
+							if ( swap ) {
+								long t = trans->actions[i];
+								trans->actions[i] = trans->actions[j];
+								trans->actions[j] = t;
+								goto again;
+							}
+						}
+					}
+				}
+			}
+		}
+	}
+}
+
 void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangElSet &parserEls )
 {
 	pdaGraph->maxState = pdaGraph->stateList.length() - 1;
@@ -929,6 +990,7 @@ void ParseData::analyzeMachine( PdaGraph *pdaGraph, KlangElSet &parserEls )
 
 	pdaActionOrder( pdaGraph, parserEls );
 	sortActions( pdaGraph );
+	resolvePrecedence( pdaGraph );
 	advanceReductions( pdaGraph );
 	pdaGraph->setStateNumbers();
 	reduceActions( pdaGraph );
-- 
cgit v1.2.1


From 3765c038c21e22ad8901a657c9fa0537fd796e70 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 22 Feb 2009 02:25:41 +0000
Subject: Fix to last commit.

---
 colm/parsedata.h  |  2 +-
 colm/pdabuild.cpp | 10 ++++++----
 2 files changed, 7 insertions(+), 5 deletions(-)

diff --git a/colm/parsedata.h b/colm/parsedata.h
index 416dfa4a..a2331651 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -519,7 +519,7 @@ struct ParseData
 	void analyzeGraph( FsmGraph *graph );
 	void resolvePrecedence( PdaGraph *pdaGraph );
 	KlangEl *predOf( PdaTrans *trans, long action );
-	bool precedenceSwap( KlangEl *l1, KlangEl *l2 );
+	bool precedenceSwap( long action1, long action2, KlangEl *l1, KlangEl *l2 );
 
 	void initKeyOps();
 
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 7d424e2f..576d6bf6 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -919,15 +919,16 @@ KlangEl *ParseData::predOf( PdaTrans *trans, long action )
 	return lel;
 }
 
-bool ParseData::precedenceSwap( KlangEl *l1, KlangEl *l2 )
+
+bool ParseData::precedenceSwap( long action1, long action2, KlangEl *l1, KlangEl *l2 )
 {
 	bool swap = false;
 	if ( l2->predValue > l1->predValue )
 		swap = true;
 	else if ( l1->predValue == l2->predValue ) {
-		if ( l1->predType == PredLeft && trans->actions[i] == SHIFT_CODE )
+		if ( l1->predType == PredLeft && action1 == SHIFT_CODE )
 			swap = true;
-		else if ( l1->predType == PredRight && trans->actions[j] == SHIFT_CODE )
+		else if ( l1->predType == PredRight && action2 == SHIFT_CODE )
 			swap = true;
 	}
 	return swap;
@@ -952,7 +953,8 @@ again:
 
 						if ( lj != 0 && lj->predValue != PredNone ) {
 							/* Conflict to check. */
-							bool swap = precedenceSwap( li, lj );
+							bool swap = precedenceSwap( trans->actions[i], 
+									trans->actions[j], li, lj );
 							
 							if ( swap ) {
 								long t = trans->actions[i];
-- 
cgit v1.2.1


From 76ab0efa0b78d21fa8f2f2398a2d232386640bd0 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 22 Feb 2009 03:18:29 +0000
Subject: implemented nonassoc

---
 colm/parsedata.h  |  1 +
 colm/pdabuild.cpp | 26 +++++++++++++++++++++++---
 2 files changed, 24 insertions(+), 3 deletions(-)

diff --git a/colm/parsedata.h b/colm/parsedata.h
index a2331651..1e69935b 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -520,6 +520,7 @@ struct ParseData
 	void resolvePrecedence( PdaGraph *pdaGraph );
 	KlangEl *predOf( PdaTrans *trans, long action );
 	bool precedenceSwap( long action1, long action2, KlangEl *l1, KlangEl *l2 );
+	bool precedenceRemoveBoth( KlangEl *l1, KlangEl *l2 );
 
 	void initKeyOps();
 
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 576d6bf6..37fe8304 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -934,12 +934,20 @@ bool ParseData::precedenceSwap( long action1, long action2, KlangEl *l1, KlangEl
 	return swap;
 }
 
+bool ParseData::precedenceRemoveBoth( KlangEl *l1, KlangEl *l2 )
+{
+	if ( l1->predValue == l2->predValue && l1->predType == PredNonassoc )
+		return true;
+	return false;
+}
+
 void ParseData::resolvePrecedence( PdaGraph *pdaGraph )
 {
 	for ( PdaStateList::Iter state = pdaGraph->stateList; state.lte(); state++ ) {
 		assert( CmpDotSet::compare( state->dotSet, state->dotSet2 ) == 0 );
-		for ( TransMap::Iter tel = state->transMap; tel.lte(); tel++ ) {
-			PdaTrans *trans = tel->value;
+		
+		for ( long t = 0; t < state->transMap.length(); /* increment at end */ ) {
+			PdaTrans *trans = state->transMap[t].value;
 
 again:
 			/* Find action with precedence. */
@@ -960,12 +968,24 @@ again:
 								long t = trans->actions[i];
 								trans->actions[i] = trans->actions[j];
 								trans->actions[j] = t;
-								goto again;
 							}
+
+							trans->actions.remove( j );
+							if ( precedenceRemoveBoth( li, lj ) )
+								trans->actions.remove( i );
+
+							goto again;
 						}
 					}
 				}
 			}
+
+			/* If there are still actions then move to the next one. If not,
+			 * (due to nonassoc) then remove the transition. */
+			if ( trans->actions.length() > 0 )
+				t += 1;
+			else
+				state->transMap.vremove( t );
 		}
 	}
 }
-- 
cgit v1.2.1


From 48df5c80840ff189c0e019376c74630284eb6f3c Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 22 Feb 2009 22:33:01 +0000
Subject: Can now set the precedence of a production as you can in bison.

---
 colm/lmparse.kh    |  2 +-
 colm/lmparse.kl    | 60 ++++++++++++++++++++++++++++++++++++++++--------------
 colm/parsedata.cpp | 17 +++++++++-------
 colm/pdabuild.cpp  |  4 ++--
 4 files changed, 58 insertions(+), 25 deletions(-)

diff --git a/colm/lmparse.kh b/colm/lmparse.kh
index 47678353..0184a76d 100644
--- a/colm/lmparse.kh
+++ b/colm/lmparse.kh
@@ -79,7 +79,7 @@ struct Parser
 	void addRegularDef( const InputLoc &loc, Namespace *nspace, 
 		const String &name, JoinOrLm *joinOrLm, bool isInstance );
 	void addProduction( InputLoc &loc, const String &name, 
-		ProdElList *prodElList, bool commit, CodeBlock *redBlock );
+		ProdElList *prodElList, bool commit, CodeBlock *redBlock, KlangEl *predOf );
 
 	/* Report an error encountered by the parser. */
 	ostream &parse_error( int tokId, Token &token );
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 489f0bf8..510a9127 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -189,7 +189,7 @@ generic_def: KW_Map TK_Word '[' type_ref type_ref ']'
 
 		/* Add one empty production. */
 		ProdElList *emptyList = new ProdElList;
-		addProduction( $1->loc, $2->data, emptyList, false, 0 );
+		addProduction( $1->loc, $2->data, emptyList, false, 0, 0 );
 
 		nspace->genericList.append( generic );
 		langEl->generic = generic;
@@ -213,7 +213,7 @@ generic_def: KW_List TK_Word '[' type_ref ']'
 
 		/* Add one empty production. */
 		ProdElList *emptyList = new ProdElList;
-		addProduction( $1->loc, $2->data, emptyList, false, 0 );
+		addProduction( $1->loc, $2->data, emptyList, false, 0, 0 );
 
 		nspace->genericList.append( generic );
 		langEl->generic = generic;
@@ -255,28 +255,38 @@ pred_type: KW_Left final { predType = PredLeft; };
 pred_type: KW_Right final { predType = PredRight; };
 pred_type: KW_Nonassoc final { predType = PredNonassoc; };
 
-pred_token_list: pred_token_list ',' pred_token;
-pred_token_list: pred_token;
+pred_token_list: pred_token_list ',' pred_token 
+	final {
+		$3->factor->langEl->predType = predType;
+		$3->factor->langEl->predValue = pd->predValue;
+	};
+
+pred_token_list: pred_token
+	final {
+		$1->factor->langEl->predType = predType;
+		$1->factor->langEl->predValue = pd->predValue;
+	};
+
+nonterm pred_token
+{
+	PdaFactor *factor;
+};
 
 pred_token: 
 	region_qual TK_Word 
 	final {
-		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
+		$$->factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
 				$2->data, 0, false, false );
-		pd->resolveReferenceFactor( factor );
-		factor->langEl->predType = predType;
-		factor->langEl->predValue = pd->predValue;
+		pd->resolveReferenceFactor( $$->factor );
 	};
 
 pred_token: 
 	region_qual TK_Literal 
 	final {
 		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
-		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
+		$$->factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
 				literal, 0, false, false );
-		pd->resolveLiteralFactor( factor );
-		factor->langEl->predType = predType;
-		factor->langEl->predValue = pd->predValue;
+		pd->resolveLiteralFactor( $$->factor );
 	};
 
 cfl_def: cfl_def_head obj_var_list properties_list cfl_prod_list
@@ -321,9 +331,27 @@ property:
 		prodName->reduceFirst = true;
 	};
 
-define_prod: '[' prod_el_list ']' opt_commit opt_reduce_code
+nonterm opt_prec
+{
+	KlangEl *predOf;
+};
+
+opt_prec:
+	final {
+		$$->predOf = 0;
+	};
+
+opt_prec: 
+	KW_Prec pred_token
 	final {
-		addProduction( $1->loc, curDefineId, curProdElList, $4->commit, $5->codeBlock ); 
+		$$->predOf = $2->factor->langEl;
+	};
+
+
+define_prod: '[' prod_el_list ']' opt_commit opt_reduce_code opt_prec
+	final {
+		addProduction( $1->loc, curDefineId, curProdElList, $4->commit, 
+				$5->codeBlock, $6->predOf ); 
 	};
 
 obj_var_list: obj_var_list var_def
@@ -1990,7 +2018,7 @@ void Parser::addRegularDef( const InputLoc &loc, Namespace *nspace,
 }
 
 void Parser::addProduction( InputLoc &loc, const String &name, 
-		ProdElList *prodElList, bool commit, CodeBlock *redBlock )
+		ProdElList *prodElList, bool commit, CodeBlock *redBlock, KlangEl *predOf )
 {
 	/* Get the language element. */
 	KlangEl *prodName = getKlangEl( pd, namespaceStack.top(), name );
@@ -2012,6 +2040,8 @@ void Parser::addProduction( InputLoc &loc, const String &name,
 		 * region just created. We need it in the parent. */
 		nspace->parentNamespace->symbolMap.insert( name, prodName );
 	}
+
+	newDef->predOf = predOf;
 }
 
 ostream &Parser::parse_error( int tokId, Token &token )
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 116e576d..5bcb1282 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1252,13 +1252,16 @@ void ParseData::resolveProductionEls()
 		for ( ProdElList::Iter fact = *prod->prodElList; fact.lte(); fact++ )
 			resolveFactor( fact );
 
-		/* Compute the precedence of the productions. */
-		for ( ProdElList::Iter fact = prod->prodElList->last(); fact.gtb(); fact-- ) {
-			/* Production inherits the precedence of the last terminal with
-			 * precedence. */
-			if ( fact->langEl->predType != PredNone ) {
-				prod->predOf = fact->langEl;
-				break;
+		/* If there is no explicit precedence ... */
+		if ( prod->predOf == 0 )  {
+			/* Compute the precedence of the productions. */
+			for ( ProdElList::Iter fact = prod->prodElList->last(); fact.gtb(); fact-- ) {
+				/* Production inherits the precedence of the last terminal with
+				 * precedence. */
+				if ( fact->langEl->predType != PredNone ) {
+					prod->predOf = fact->langEl;
+					break;
+				}
 			}
 		}
 	}
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 37fe8304..308a57ab 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -954,12 +954,12 @@ again:
 			for ( int i = 0; i < trans->actions.length(); i++ ) {
 				KlangEl *li = predOf( trans, trans->actions[i] );
 					
-				if ( li != 0 && li->predValue != PredNone ) {
+				if ( li != 0 && li->predType != PredNone ) {
 					/* Find another action with precedence. */
 					for ( int j = i+1; j < trans->actions.length(); j++ ) {
 						KlangEl *lj = predOf( trans, trans->actions[j] );
 
-						if ( lj != 0 && lj->predValue != PredNone ) {
+						if ( lj != 0 && lj->predType != PredNone ) {
 							/* Conflict to check. */
 							bool swap = precedenceSwap( trans->actions[i], 
 									trans->actions[j], li, lj );
-- 
cgit v1.2.1


From bd0270a463dd608944405d7ecaacc6a236083817 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 22 Feb 2009 22:56:10 +0000
Subject: Flattened arg and specified precedence.

---
 test/ruby/ruby.lm | 119 ++++++++++++++++++++++--------------------------------
 1 file changed, 49 insertions(+), 70 deletions(-)

diff --git a/test/ruby/ruby.lm b/test/ruby/ruby.lm
index b9505515..ec35fae4 100644
--- a/test/ruby/ruby.lm
+++ b/test/ruby/ruby.lm
@@ -295,79 +295,58 @@ def opt_block_arg
 def block_arg
 	[tAMPER arg_value]
 
+right '='
+left 'rescue'
+right '?', ':'
+nonassoc '..', '...'
+left '||'
+left '&&'
+nonassoc '<=>', '==', '===', '!=', '=~', '!~'
+left '>', '>=', '<', '<='
+left '|', '^'
+left '&'
+left '<<', '>>'
+left '+', '-'
+left '*', '/', '%'
+#right tUMINUS_NUM tUMINUS
+right tUMINUS
+right '**'
+right '!', '~', tUPLUS
+
 def arg 
-	['defined?' arg]
-|	[arg_assign]
-
-def arg_assign
-	[lhs '=' arg_assign]
-|	[lhs '=' arg_assign 'rescue' arg]
-|	[arg_sel]
-
-def arg_sel
-	[arg_dot '?' arg_sel ':' arg_sel]
-|	[arg_dot]
-
-def arg_dot
-	[arg_logical '..' arg_dot]
-|	[arg_logical '...' arg_dot]
-|	[arg_logical]
-
-def arg_logical
-	[arg_eq '&&' arg_logical]
-|	[arg_eq '||' arg_logical]
-|	[arg_eq]
-
-def arg_eq
-	[arg_cmp '<=>' arg_eq]
-|	[arg_cmp '==' arg_eq]
-|	[arg_cmp '===' arg_eq]
-|	[arg_cmp '!=' arg_eq]
-|	[arg_cmp '=~' arg_eq]
-|	[arg_cmp '!~' arg_eq]
-|	[arg_cmp]
-
-def arg_cmp
-	[arg_bitor '>=' arg_cmp]
-|	[arg_bitor '<=' arg_cmp]
-|	[arg_bitor '>' arg_cmp]
-|	[arg_bitor '<' arg_cmp]
-|	[arg_bitor]
-
-def arg_bitor
-	[arg_bitand '|' arg_bitor]
-|	[arg_bitand '^' arg_bitor]
-|	[arg_bitand]
-
-def arg_bitand
-	[arg_shift '&' arg_bitand]
-|	[arg_shift]
-
-def arg_shift
-	[arg_add '<<' arg_shift]
-|	[arg_add '>>' arg_shift]
-|	[arg_add]
-
-def arg_add
-	[arg_mult '+' arg_add]
-|	[arg_mult '-' arg_add]
-|	[arg_mult]
-
-def arg_mult
-	[arg_pow '*' arg_mult]
-|	[arg_pow '/' arg_mult]
-|	[arg_pow '%' arg_mult]
-|	[arg_pow]
-
-def arg_pow
-	[arg_unary '**' arg_pow]
-|	[arg_unary]
-
-def arg_unary
-	['!' primary]
+	[lhs '=' arg]
+|	[lhs '=' arg 'rescue' arg]
+|	[arg '?' arg ':' arg]
+|	[arg '..' arg]
+|	[arg '...' arg]
+|	[arg '||' arg]
+|	[arg '&&' arg]
+|	[arg '<=>' arg]
+|	[arg '==' arg]
+|	[arg '===' arg]
+|	[arg '!=' arg]
+|	[arg '=~' arg]
+|	[arg '!~' arg]
+|	[arg '>' arg]
+|	[arg '>=' arg]
+|	[arg '<' arg]
+|	[arg '<=' arg]
+|	[arg '|' arg]
+|	[arg '^' arg]
+|	[arg '&' arg]
+|	[arg '<<' arg]
+|	[arg '>>' arg]
+|	[arg '+' arg]
+|	[arg '-' arg]
+|	[arg '*' arg]
+|	[arg '/' arg]
+|	[arg '%' arg]
+|	[arg '**' arg]
+|	['!' primary]
 |	['~' primary]
-|	[tUPLUS primary]
 |	[tUMINUS primary]
+|	[tUPLUS primary]
+|	['defined?' arg]
 |	[primary]
 
 def primary_value 
-- 
cgit v1.2.1


From d20411f657ee6ae9f7088a413452a7e4be970cdf Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 23 Feb 2009 02:20:52 +0000
Subject: Grammar definition names must be unique.

---
 test/cxx/cxx.lm | 14 ++++----------
 1 file changed, 4 insertions(+), 10 deletions(-)

diff --git a/test/cxx/cxx.lm b/test/cxx/cxx.lm
index cf0d452b..31fcc92e 100644
--- a/test/cxx/cxx.lm
+++ b/test/cxx/cxx.lm
@@ -1024,15 +1024,13 @@ def postfix_expression
 def pseudo_destructor_call
 	[root_qual_opt nested_name_specifier_opt '~' pdc_type_name]
 
-def primary_expression 
+def primary_expression
 	[expr_lit]
 |	['this']
 |	['(' expression ')']
 |	[id_expression]
-
 # This is an GNU extension.
-def primary_expression 
-	['(' '{' statement_rep '}' ')']
+|	['(' '{' statement_rep '}' ')']
 
 def expr_lit 
 	[TK_IntegerDecimal]
@@ -1678,9 +1676,7 @@ def class_function_body
 def member_declaration_forms
 	[decl_specifier_mult_seq_opt decl_specifier_sing 
 		decl_specifier_mult_seq_opt member_declarator_list_opt]
-
-def member_declaration_forms
-	[decl_specifier_mult_seq_opt member_declarator_list_opt]
+|	[decl_specifier_mult_seq_opt member_declarator_list_opt]
 
 def member_declarator_list_opt 
 	[member_declarator_list]
@@ -2107,9 +2103,7 @@ def exception_declaration
 	[type_specifier_seq declarator]
 |	[type_specifier_seq abstract_declarator]
 |	[type_specifier_seq]
-
-def exception_declaration 
-	['...']
+|	['...']
 
 def throw_expression 
 	['throw' assignment_expression]
-- 
cgit v1.2.1


From 9fcbafb9dfa6fc741177b5ba126a0aa4ed9f2f38 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 23 Feb 2009 02:21:37 +0000
Subject: Definition names must be unique.

---
 test/python/python.lm | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/test/python/python.lm b/test/python/python.lm
index 7d579955..d4e8a692 100644
--- a/test/python/python.lm
+++ b/test/python/python.lm
@@ -290,10 +290,10 @@ def defparameter
 |	[parameter '=' expression]
   
 def sublist 
-	[parameter_list opt_comma]
+	[sublist_pl opt_comma]
 
-def parameter_list 
-	[parameter_list ',' parameter]
+def sublist_pl 
+	[sublist_pl ',' parameter]
 |	[parameter]
   
 def parameter 
@@ -359,8 +359,9 @@ def target_atom
 |	['(' target_list ')']
 |	['[' target_list ']']
 
-def target_ext_rep [target_ext target_ext_rep]
-def target_ext_rep []
+def target_ext_rep 
+	[target_ext target_ext_rep]
+|	[]
 
 def target_ext
 	[attributeref]
-- 
cgit v1.2.1


From ff17942e8101c03b1dfa7a2f8dd61b4393630e39 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 25 Feb 2009 02:43:27 +0000
Subject: Added the plus operator.

---
 colm/compile.cpp    |  6 ++++--
 colm/lmparse.kl     | 28 +++++++++++++-------------
 colm/parsedata.cpp  | 58 ++++++++++++++++++++++++++++++++++++++++++++++++-----
 colm/parsedata.h    | 17 ++++++++--------
 colm/parsetree.h    | 18 +++++++++++------
 colm/pdabuild.cpp   |  2 ++
 colm/pdacodegen.cpp |  1 +
 colm/pdarun.h       |  1 +
 colm/tree.cpp       |  5 +++++
 9 files changed, 101 insertions(+), 35 deletions(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index 1f6068bb..918b9712 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -218,10 +218,12 @@ UniqueType *TypeRef::lookupType( ParseData *pd )
 		uniqueType = pd->findUniqueType( TYPE_TREE, factor->langEl );
 	else {
 		String name = typeName;
-		if ( isOpt )
+		if ( repeatType == RepeatOpt )
 			name.setAs( 32, "_opt_%s", name.data );
-		else if ( isRepeat )
+		else if ( repeatType == RepeatRepeat )
 			name.setAs( 32, "_repeat_%s", name.data );
+		else if ( repeatType == RepeatList )
+			name.setAs( 32, "_list_%s", name.data );
 
 		/* Not an iterator. May be a reference. */
 		uniqueType = lookupTypePart( pd, nspaceQual, name );
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 510a9127..beb70bc8 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -276,7 +276,7 @@ pred_token:
 	region_qual TK_Word 
 	final {
 		$$->factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
-				$2->data, 0, false, false );
+				$2->data, 0, RepeatNone, false, false );
 		pd->resolveReferenceFactor( $$->factor );
 	};
 
@@ -285,7 +285,7 @@ pred_token:
 	final {
 		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
 		$$->factor = new PdaFactor( $2->loc, false, $1->nspaceQual,
-				literal, 0, false, false );
+				literal, 0, RepeatNone, false, false );
 		pd->resolveLiteralFactor( $$->factor );
 	};
 
@@ -383,15 +383,13 @@ nonterm basic_type_ref uses type_ref;
 basic_type_ref: region_qual TK_Word opt_repeat
 	final {
 		$$->typeRef = new TypeRef( $2->loc, $1->nspaceQual, $2->data );
-		$$->typeRef->isRepeat = $3->repeat;
-		$$->typeRef->isOpt = $3->opt;
+		$$->typeRef->repeatType = $3->repeatType;
 	};
 
 basic_type_ref: KW_Ptr region_qual TK_Word opt_repeat
 	final {
 		$$->typeRef = new TypeRef( $1->loc, $2->nspaceQual, $3->data );
-		$$->typeRef->isRepeat = $4->repeat;
-		$$->typeRef->isOpt = $4->opt;
+		$$->typeRef->repeatType = $4->repeatType;
 		$$->typeRef->isPtr = true;
 	};
 
@@ -507,7 +505,7 @@ nonterm pattern_el_type_or_lit
 pattern_el_type_or_lit: region_qual TK_Word opt_repeat
 	final {
 		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
-				$2->data, 0, $3->opt, $3->repeat );
+				$2->data, 0, $3->repeatType, $3->opt, $3->repeat );
 		$$->patternItem = new PatternItem( $2->loc, factor, PatternItem::FactorType );
 		patternItemList->append( $$->patternItem );
 	};
@@ -516,7 +514,7 @@ pattern_el_type_or_lit: region_qual TK_Literal opt_repeat
 	final {
 		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
 		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
-				literal, 0, $3->opt, $3->repeat );
+				literal, 0, $3->repeatType, $3->opt, $3->repeat );
 		$$->patternItem = new PatternItem( $2->loc, factor, PatternItem::FactorType );
 		patternItemList->append( $$->patternItem );
 	};
@@ -571,7 +569,7 @@ repl_el: region_qual TK_Literal
 	final {
 		PdaLiteral *literal = new PdaLiteral( $2->loc, *$2 );
 		PdaFactor *factor = new PdaFactor( $2->loc, false, $1->nspaceQual, 
-				literal, 0, false, false );
+				literal, 0, RepeatNone, false, false );
 		ReplItem *replItem = new ReplItem( $2->loc, ReplItem::FactorType, factor );
 		replItemList->append( replItem );
 	};
@@ -596,7 +594,7 @@ prod_el:
 	opt_commit region_qual TK_Word opt_repeat
 	final {
 		$$->factor = new PdaFactor( $3->loc, $1->commit, 
-				$2->nspaceQual, $3->data, 0, $4->opt, $4->repeat );
+				$2->nspaceQual, $3->data, 0, $4->repeatType, $4->opt, $4->repeat );
 	};
 
 prod_el: 
@@ -605,18 +603,20 @@ prod_el:
 		/* Create a new factor node going to a concat literal. */
 		PdaLiteral *literal = new PdaLiteral( $3->loc, *$3 );
 		$$->factor = new PdaFactor( $3->loc, $1->commit, $2->nspaceQual, 
-				literal, 0, $4->opt, $4->repeat );
+				literal, 0, $4->repeatType, $4->opt, $4->repeat );
 	};
 
 nonterm opt_repeat
 {
 	bool opt;
 	bool repeat;
+	RepeatType repeatType;
 };
 
-opt_repeat: '?' final { $$->opt = true; $$->repeat = false; };
-opt_repeat: '*' final { $$->opt = false; $$->repeat = true; };
-opt_repeat:     final { $$->opt = false; $$->repeat = false; };
+opt_repeat: '*' final { $$->opt = false; $$->repeat = true; $$->repeatType = RepeatRepeat; };
+opt_repeat: '+' final { $$->opt = false; $$->repeat = false; $$->repeatType = RepeatList; };
+opt_repeat: '?' final { $$->opt = true; $$->repeat = false; $$->repeatType = RepeatOpt; };
+opt_repeat:     final { $$->opt = false; $$->repeat = false; $$->repeatType = RepeatNone; };
 
 nonterm region_qual
 {
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 5bcb1282..4d91fbaa 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1140,7 +1140,7 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 	/* Look up the language element in the region. */
 	KlangEl *langEl = getKlangEl( this, nspace, fact->refName );
 
-	if ( fact->opt ) {
+	if ( fact->repeatType == RepeatOpt ) {
 		/* If the factor is an opt, create the opt element and link the factor
 		 * to it. */
 		String optName( 32, "_opt_%s", fact->refName.data );
@@ -1158,7 +1158,7 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 
 			/* Build the first production of the repeat. */
 			PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					fact->refName, 0, false, false );
+					fact->refName, 0, RepeatNone, false, false );
 			prodElList1->append( factor1 );
 
 			Definition *newDef1 = new Definition( InputLoc(),
@@ -1181,7 +1181,7 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 			fact->langEl = prodName;
 		}
 	}
-	else if ( fact->repeat ) {
+	else if ( fact->repeatType == RepeatRepeat ) {
 		/* If the factor is a repeat, create the repeat element and link the
 		 * factor to it. */
 		String repeatName( 32, "_repeat_%s", fact->refName.data );
@@ -1199,9 +1199,9 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 
 			/* Build the first production of the repeat. */
 			PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					fact->refName, 0, false, false );
+					fact->refName, 0, RepeatNone, false, false );
 			PdaFactor *factor2 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					repeatName, 0, false, false );
+					repeatName, 0, RepeatNone, false, false );
 
 			prodElList1->append( factor1 );
 			prodElList1->append( factor2 );
@@ -1226,6 +1226,54 @@ void ParseData::resolveReferenceFactor( PdaFactor *fact )
 			fact->langEl = prodName;
 		}
 	}
+	else if ( fact->repeatType == RepeatList ) {
+		/* If the factor is a list, create the list element and link the
+		 * factor to it. */
+		String repeatName( 32, "_list_%s", fact->refName.data );
+
+    	SymbolMapEl *inDict = nspace->symbolMap.find( repeatName );
+	    if ( inDict != 0 ) {
+			fact->langEl = inDict->value;
+		}
+		else {
+			KlangEl *prodName = getKlangEl( this, nspace, repeatName );
+			prodName->type = KlangEl::NonTerm;
+			prodName->isList = true;
+
+			/* Build the first production of the list. */
+			PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+					fact->refName, 0, RepeatNone, false, false );
+			PdaFactor *factor2 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+					repeatName, 0, RepeatNone, false, false );
+
+			ProdElList *prodElList1 = new ProdElList;
+			prodElList1->append( factor1 );
+			prodElList1->append( factor2 );
+
+			Definition *newDef1 = new Definition( InputLoc(),
+					prodName, prodElList1, false, 0,
+					prodList.length(), Definition::Production );
+
+			prodName->defList.append( newDef1 );
+			prodList.append( newDef1 );
+
+			/* Build the second production of the list. */
+			PdaFactor *factor3 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+					fact->refName, 0, RepeatNone, false, false );
+
+			ProdElList *prodElList2 = new ProdElList;
+			prodElList2->append( factor3 );
+
+			Definition *newDef2 = new Definition( InputLoc(),
+					prodName, prodElList2, false, 0,
+					prodList.length(), Definition::Production );
+
+			prodName->defList.append( newDef2 );
+			prodList.append( newDef2 );
+
+			fact->langEl = prodName;
+		}
+	}
 	else {
 		/* The factor is not a repeat. Link to the language element. */
 		fact->langEl = langEl;
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 1e69935b..28db05ab 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -181,6 +181,7 @@ struct KlangEl : public DListEl<KlangEl>
 	bool reduceFirst;
 	bool isLiteral;
 	bool isRepeat;
+	bool isList;
 	bool isOpt;
 	bool parseStop;
 	bool isEOF;
@@ -225,25 +226,26 @@ struct PdaFactor
 
 	/* Construct with a literal fsm. */
 	PdaFactor( const InputLoc &loc, bool commit, NamespaceQual *nspaceQual, 
-			PdaLiteral *literal, int priorVal, bool opt, bool repeat ) :
+			PdaLiteral *literal, int priorVal, RepeatType repeatType, bool opt, bool repeat ) :
 		loc(loc), commit(commit), nspaceQual(nspaceQual), 
-		literal(literal), langEl(0), priorVal(priorVal), opt(opt), repeat(repeat),
+		literal(literal), langEl(0), priorVal(priorVal), repeatType(repeatType),
 		nspace(0), type(LiteralType), objField(0) {}
 
 	/* Construct with a reference to a var def. */
 	PdaFactor( const InputLoc &loc, bool commit, NamespaceQual *nspaceQual, 
-			const String &refName, int priorVal, bool opt, bool repeat ) :
+			const String &refName, int priorVal, RepeatType repeatType, bool opt, bool repeat ) :
 		loc(loc), commit(commit), nspaceQual(nspaceQual), refName(refName),
-		literal(0), langEl(0), priorVal(priorVal), opt(opt), repeat(repeat), 
+		literal(0), langEl(0), priorVal(priorVal), repeatType(repeatType),
 		nspace(0), type(ReferenceType), objField(0) {}
 
 	PdaFactor( const InputLoc &loc, KlangEl *langEl ) :
 		loc(loc), commit(false), nspaceQual(0), literal(0), langEl(langEl), 
-		priorVal(0), opt(false), repeat(false), nspace(0), type(ReferenceType), objField(0) {}
+		priorVal(0), repeatType(RepeatNone), nspace(0),
+		type(ReferenceType), objField(0) {}
 
 	PdaFactor() :
 		commit(false), nspaceQual(0), 
-		literal(0), langEl(0), priorVal(0), opt(false), repeat(false),
+		literal(0), langEl(0), priorVal(0), repeatType(RepeatNone),
 		nspace(0), type(LiteralType), objField(0) {}
 
 	InputLoc loc;
@@ -253,8 +255,7 @@ struct PdaFactor
 	PdaLiteral *literal;
 	KlangEl *langEl;
 	int priorVal;
-	bool opt;
-	bool repeat;
+	RepeatType repeatType;
 	Namespace *nspace;
 	Type type;
 	ObjField *objField;
diff --git a/colm/parsetree.h b/colm/parsetree.h
index a9e4f6c1..e4ef5e38 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1091,25 +1091,32 @@ typedef AvlMapEl< StringVect, int > VectorTypeIdMapEl;
 
 typedef Vector<TypeRef*> TypeRefVect;
 
+enum RepeatType {
+	RepeatRepeat,
+	RepeatList,
+	RepeatOpt,
+	RepeatNone
+};
+
 struct TypeRef
 {
 	/* Qualification and a type name. These require lookup. */
 	TypeRef( const InputLoc &loc, NamespaceQual *nspaceQual, String typeName ) :
 		loc(loc), nspaceQual(nspaceQual), typeName(typeName), iterDef(0),
 		searchTypeRef(0), factor(0),
-		isPtr(false), isRef(false), isRepeat(false), isOpt(false),
+		isPtr(false), isRef(false), repeatType(RepeatNone),
 		uniqueType(0) {}
 
 	/* Iterator definition. */
 	TypeRef( const InputLoc &loc, IterDef *iterDef, TypeRef *searchTypeRef ) :
 		loc(loc), iterDef(iterDef), searchTypeRef(searchTypeRef), factor(0),
-		isPtr(false), isRef(false), isRepeat(false), isOpt(false),
+		isPtr(false), isRef(false), repeatType(RepeatNone),
 		uniqueType(0) {}
 
 	/* Unique type is given directly. */
 	TypeRef( const InputLoc &loc, UniqueType *uniqueType ) :
 		loc(loc), nspaceQual(0), iterDef(0), searchTypeRef(0), factor(0),
-		isPtr(false), isRef(false), isRepeat(false), isOpt(false), 
+		isPtr(false), isRef(false), repeatType(RepeatNone),
 		uniqueType(uniqueType) {}
 
 	/* A factor in a pattern. In the case of matches we need a type ref at
@@ -1117,7 +1124,7 @@ struct TypeRef
 	 * to do it on demand. */
 	TypeRef( const InputLoc &loc, PdaFactor *factor ) :
 		loc(loc), nspaceQual(0), iterDef(0), searchTypeRef(0), factor(factor),
-		isPtr(false), isRef(false), isRepeat(false), isOpt(false), 
+		isPtr(false), isRef(false), repeatType(RepeatNone),
 		uniqueType(0) {}
 
 
@@ -1131,8 +1138,7 @@ struct TypeRef
 	PdaFactor *factor;
 	bool isPtr;
 	bool isRef;
-	bool isRepeat;
-	bool isOpt;
+	RepeatType repeatType;
 
 private:
 	UniqueType *lookupTypePart( ParseData *pd, NamespaceQual *nspaceQual, 
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 308a57ab..a616de1b 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -71,6 +71,7 @@ KlangEl::KlangEl( Namespace *nspace, const String &name, Type type )
 	reduceFirst(false),
 	isLiteral(false),
 	isRepeat(false),
+	isList(false),
 	isOpt(false),
 	parseStop(false),
 	isEOF(false),
@@ -1386,6 +1387,7 @@ void ParseData::makeRuntimeData()
 		if ( lel != 0 ) {
 			runtimeData->lelInfo[i].name = lel->fullLit;
 			runtimeData->lelInfo[i].repeat = lel->isRepeat;
+			runtimeData->lelInfo[i].list = lel->isList;
 			runtimeData->lelInfo[i].literal = lel->isLiteral;
 			runtimeData->lelInfo[i].ignore = lel->ignore;
 			runtimeData->lelInfo[i].frameId = -1;
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 53530e80..f5d6de5e 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -177,6 +177,7 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTable
 		
 		/* Repeat, literal, ignore flags. */
 		out << ", " << runtimeData->lelInfo[i].repeat << ", " << 
+				runtimeData->lelInfo[i].list << ", " <<
 				runtimeData->lelInfo[i].literal << ", " <<
 				runtimeData->lelInfo[i].ignore << ", ";
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 61039a7e..b95d8806 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -341,6 +341,7 @@ struct LangElInfo
 {
 	const char *name;
 	bool repeat;
+	bool list;
 	bool literal;
 	bool ignore;
 
diff --git a/colm/tree.cpp b/colm/tree.cpp
index d41b4fbf..dce1e5e8 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -560,6 +560,11 @@ rec_call:
 				 * right to the first child (repeated item). */
 				if ( lelInfo[((Kid*)vm_top())->tree->id].repeat )
 					kid = kid->tree->child;
+
+				/* If we have a kid and the parent is a list (recursive prod of
+				 * list) then go right to the first child. */
+				if ( kid != 0 && lelInfo[((Kid*)vm_top())->tree->id].list )
+					kid = kid->tree->child;
 			}
 
 			kid = (Kid*) vm_pop();
-- 
cgit v1.2.1


From 9edcc5097c9555169076aa8271c158dfd5bbaaca Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 25 Feb 2009 03:16:46 +0000
Subject: new precedence keywords

---
 colm.vim | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/colm.vim b/colm.vim
index b32441a5..40aef135 100644
--- a/colm.vim
+++ b/colm.vim
@@ -56,7 +56,7 @@ syntax keyword Type
 	\ commit include literal iter
 	\ namespace lex reducefirst global include 
 	\ construct parse parse_stop match require
-	\ preeof
+	\ preeof left right nonassoc prec
 
 syntax keyword typeKeywords
 	\ int str bool any ref vector map list ptr
-- 
cgit v1.2.1


From 0ab005c28a931a20aec401cd6730bed72cc64c42 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 25 Feb 2009 03:18:23 +0000
Subject: cleaned up a large function

---
 colm/parsedata.cpp | 235 +++++++++++++++++++++++++++--------------------------
 colm/parsedata.h   |   3 +
 2 files changed, 125 insertions(+), 113 deletions(-)

diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 4d91fbaa..b7b3e526 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1127,152 +1127,161 @@ void ParseData::resolveLiteralFactor( PdaFactor *fact )
 	fact->langEl = tokenDef->token;
 }
 
-void ParseData::resolveReferenceFactor( PdaFactor *fact )
+KlangEl *ParseData::makeRepeatProd( Namespace *nspace, const String &repeatName, PdaFactor *fact )
 {
-	/* Look for the production's associated region. */
-	Namespace *nspace = fact->nspaceQual->getQual( this );
+	KlangEl *prodName = getKlangEl( this, nspace, repeatName );
+	prodName->type = KlangEl::NonTerm;
+	prodName->isRepeat = true;
 
-	if ( nspace == 0 )
-		error(fact->loc) << "do not have namespace for resolving reference" << endp;
-	
-	fact->nspace = nspace;
+	ProdElList *prodElList1 = new ProdElList;
 
-	/* Look up the language element in the region. */
-	KlangEl *langEl = getKlangEl( this, nspace, fact->refName );
+	/* Build the first production of the repeat. */
+	PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			fact->refName, 0, RepeatNone, false, false );
+	PdaFactor *factor2 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			repeatName, 0, RepeatNone, false, false );
 
-	if ( fact->repeatType == RepeatOpt ) {
-		/* If the factor is an opt, create the opt element and link the factor
-		 * to it. */
-		String optName( 32, "_opt_%s", fact->refName.data );
+	prodElList1->append( factor1 );
+	prodElList1->append( factor2 );
 
-    	SymbolMapEl *inDict = nspace->symbolMap.find( optName );
-	    if ( inDict != 0 ) {
-			fact->langEl = inDict->value;
-		}
-		else {
-			KlangEl *prodName = getKlangEl( this, nspace, optName );
-			prodName->type = KlangEl::NonTerm;
-			prodName->isOpt = true;
+	Definition *newDef1 = new Definition( InputLoc(),
+			prodName, prodElList1, false, 0,
+			prodList.length(), Definition::Production );
 
-			ProdElList *prodElList1 = new ProdElList;
+	prodName->defList.append( newDef1 );
+	prodList.append( newDef1 );
 
-			/* Build the first production of the repeat. */
-			PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					fact->refName, 0, RepeatNone, false, false );
-			prodElList1->append( factor1 );
+	/* Build the second production of the repeat. */
+	ProdElList *prodElList2 = new ProdElList;
 
-			Definition *newDef1 = new Definition( InputLoc(),
-					prodName, prodElList1, false, 0,
-					prodList.length(), Definition::Production );
+	Definition *newDef2 = new Definition( InputLoc(),
+			prodName, prodElList2, false, 0,
+			prodList.length(), Definition::Production );
 
-			prodName->defList.append( newDef1 );
-			prodList.append( newDef1 );
+	prodName->defList.append( newDef2 );
+	prodList.append( newDef2 );
 
-			/* Build the second production of the repeat. */
-			ProdElList *prodElList2 = new ProdElList;
+	return prodName;
+}
 
-			Definition *newDef2 = new Definition( InputLoc(),
-					prodName, prodElList2, false, 0,
-					prodList.length(), Definition::Production );
+KlangEl *ParseData::makeListProd( Namespace *nspace, const String &listName, PdaFactor *fact )
+{
+	KlangEl *prodName = getKlangEl( this, nspace, listName );
+	prodName->type = KlangEl::NonTerm;
+	prodName->isList = true;
 
-			prodName->defList.append( newDef2 );
-			prodList.append( newDef2 );
+	/* Build the first production of the list. */
+	PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			fact->refName, 0, RepeatNone, false, false );
+	PdaFactor *factor2 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			listName, 0, RepeatNone, false, false );
 
-			fact->langEl = prodName;
-		}
-	}
-	else if ( fact->repeatType == RepeatRepeat ) {
-		/* If the factor is a repeat, create the repeat element and link the
-		 * factor to it. */
-		String repeatName( 32, "_repeat_%s", fact->refName.data );
+	ProdElList *prodElList1 = new ProdElList;
+	prodElList1->append( factor1 );
+	prodElList1->append( factor2 );
 
-    	SymbolMapEl *inDict = nspace->symbolMap.find( repeatName );
-	    if ( inDict != 0 ) {
-			fact->langEl = inDict->value;
-		}
-		else {
-			KlangEl *prodName = getKlangEl( this, nspace, repeatName );
-			prodName->type = KlangEl::NonTerm;
-			prodName->isRepeat = true;
+	Definition *newDef1 = new Definition( InputLoc(),
+			prodName, prodElList1, false, 0,
+			prodList.length(), Definition::Production );
 
-			ProdElList *prodElList1 = new ProdElList;
+	prodName->defList.append( newDef1 );
+	prodList.append( newDef1 );
 
-			/* Build the first production of the repeat. */
-			PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					fact->refName, 0, RepeatNone, false, false );
-			PdaFactor *factor2 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					repeatName, 0, RepeatNone, false, false );
+	/* Build the second production of the list. */
+	PdaFactor *factor3 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			fact->refName, 0, RepeatNone, false, false );
 
-			prodElList1->append( factor1 );
-			prodElList1->append( factor2 );
+	ProdElList *prodElList2 = new ProdElList;
+	prodElList2->append( factor3 );
 
-			Definition *newDef1 = new Definition( InputLoc(),
-					prodName, prodElList1, false, 0,
-					prodList.length(), Definition::Production );
+	Definition *newDef2 = new Definition( InputLoc(),
+			prodName, prodElList2, false, 0,
+			prodList.length(), Definition::Production );
 
-			prodName->defList.append( newDef1 );
-			prodList.append( newDef1 );
+	prodName->defList.append( newDef2 );
+	prodList.append( newDef2 );
 
-			/* Build the second production of the repeat. */
-			ProdElList *prodElList2 = new ProdElList;
+	return prodName;
+}
 
-			Definition *newDef2 = new Definition( InputLoc(),
-					prodName, prodElList2, false, 0,
-					prodList.length(), Definition::Production );
+KlangEl *ParseData::makeOptProd( Namespace *nspace, const String &optName, PdaFactor *fact )
+{
+	KlangEl *prodName = getKlangEl( this, nspace, optName );
+	prodName->type = KlangEl::NonTerm;
+	prodName->isOpt = true;
 
-			prodName->defList.append( newDef2 );
-			prodList.append( newDef2 );
+	ProdElList *prodElList1 = new ProdElList;
 
-			fact->langEl = prodName;
-		}
-	}
-	else if ( fact->repeatType == RepeatList ) {
-		/* If the factor is a repeat, create the repeat element and link the
-		 * factor to it. */
-		String repeatName( 32, "_list_%s", fact->refName.data );
+	/* Build the first production of the opt. */
+	PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
+			fact->refName, 0, RepeatNone, false, false );
+	prodElList1->append( factor1 );
 
-    	SymbolMapEl *inDict = nspace->symbolMap.find( repeatName );
-	    if ( inDict != 0 ) {
-			fact->langEl = inDict->value;
-		}
-		else {
-			KlangEl *prodName = getKlangEl( this, nspace, repeatName );
-			prodName->type = KlangEl::NonTerm;
-			prodName->isList = true;
+	Definition *newDef1 = new Definition( InputLoc(),
+			prodName, prodElList1, false, 0,
+			prodList.length(), Definition::Production );
 
-			/* Build the first production of the list. */
-			PdaFactor *factor1 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					fact->refName, 0, RepeatNone, false, false );
-			PdaFactor *factor2 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					repeatName, 0, RepeatNone, false, false );
+	prodName->defList.append( newDef1 );
+	prodList.append( newDef1 );
 
-			ProdElList *prodElList1 = new ProdElList;
-			prodElList1->append( factor1 );
-			prodElList1->append( factor2 );
+	/* Build the second production of the opt. */
+	ProdElList *prodElList2 = new ProdElList;
 
-			Definition *newDef1 = new Definition( InputLoc(),
-					prodName, prodElList1, false, 0,
-					prodList.length(), Definition::Production );
+	Definition *newDef2 = new Definition( InputLoc(),
+			prodName, prodElList2, false, 0,
+			prodList.length(), Definition::Production );
 
-			prodName->defList.append( newDef1 );
-			prodList.append( newDef1 );
+	prodName->defList.append( newDef2 );
+	prodList.append( newDef2 );
 
-			/* Build the second production of the list. */
-			PdaFactor *factor3 = new PdaFactor( InputLoc(), false, fact->nspaceQual, 
-					fact->refName, 0, RepeatNone, false, false );
+	return prodName;
+}
 
-			ProdElList *prodElList2 = new ProdElList;
-			prodElList2->append( factor3 );
+void ParseData::resolveReferenceFactor( PdaFactor *fact )
+{
+	/* Look for the production's associated region. */
+	Namespace *nspace = fact->nspaceQual->getQual( this );
 
-			Definition *newDef2 = new Definition( InputLoc(),
-					prodName, prodElList2, false, 0,
-					prodList.length(), Definition::Production );
+	if ( nspace == 0 )
+		error(fact->loc) << "do not have namespace for resolving reference" << endp;
+	
+	fact->nspace = nspace;
 
-			prodName->defList.append( newDef2 );
-			prodList.append( newDef2 );
+	/* Look up the language element in the region. */
+	KlangEl *langEl = getKlangEl( this, nspace, fact->refName );
 
-			fact->langEl = prodName;
-		}
+	if ( fact->repeatType == RepeatRepeat ) {
+		/* If the factor is a repeat, create the repeat element and link the
+		 * factor to it. */
+		String repeatName( 32, "_repeat_%s", fact->refName.data );
+
+    	SymbolMapEl *inDict = nspace->symbolMap.find( repeatName );
+	    if ( inDict != 0 )
+			fact->langEl = inDict->value;
+		else
+			fact->langEl = makeRepeatProd( nspace, repeatName, fact );;
+	}
+	else if ( fact->repeatType == RepeatList ) {
+		/* If the factor is a list, create the list element and link the
+		 * factor to it. */
+		String listName( 32, "_list_%s", fact->refName.data );
+
+    	SymbolMapEl *inDict = nspace->symbolMap.find( listName );
+	    if ( inDict != 0 )
+			fact->langEl = inDict->value;
+		else
+			fact->langEl = makeListProd( nspace, listName, fact );
+	}
+	else if ( fact->repeatType == RepeatOpt ) {
+		/* If the factor is an opt, create the opt element and link the factor
+		 * to it. */
+		String optName( 32, "_opt_%s", fact->refName.data );
+
+    	SymbolMapEl *inDict = nspace->symbolMap.find( optName );
+	    if ( inDict != 0 )
+			fact->langEl = inDict->value;
+		else
+			fact->langEl = makeOptProd( nspace, optName, fact );
 	}
 	else {
 		/* The factor is not a repeat. Link to the language element. */
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 28db05ab..caf65e44 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -687,6 +687,9 @@ struct ParseData
 	void printNonTermFirstSets();
 	void printFirstSets();
 
+	KlangEl *makeRepeatProd( Namespace *nspace, const String &repeatName, PdaFactor *fact );
+	KlangEl *makeListProd( Namespace *nspace, const String &listName, PdaFactor *fact );
+	KlangEl *makeOptProd( Namespace *nspace, const String &optName, PdaFactor *fact );
 	void resolveLiteralFactor( PdaFactor *fact );
 	void resolveReferenceFactor( PdaFactor *fact );
 	void resolveFactor( PdaFactor *fact );
-- 
cgit v1.2.1


From e544db3aa8d2cd36ebbeb5ad2e71c17b6ec7de29 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 25 Feb 2009 03:22:08 +0000
Subject: Need to escape '<', '>', and '&'.

---
 colm/tree.cpp | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/colm/tree.cpp b/colm/tree.cpp
index dce1e5e8..fafef8b0 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -479,7 +479,13 @@ void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree )
 void xml_escape_data( const char *data, long len )
 {
 	for ( int i = 0; i < len; i++ ) {
-		if ( 32 <= data[i] && data[i] <= 126 )
+		if ( data[i] == '<' )
+			cout << "&lt;";
+		else if ( data[i] == '>' )
+			cout << "&gt;";
+		else if ( data[i] == '&' )
+			cout << "&amp;";
+		else if ( 32 <= data[i] && data[i] <= 126 )
 			cout << data[i];
 		else
 			cout << "&#" << ((unsigned)data[i]) << ';';
-- 
cgit v1.2.1


From 6d1fbb18b8aa01a8cca22b460d087aff8faa65d8 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 26 Feb 2009 00:55:21 +0000
Subject: The print_xml function now omits attributes and comments. Now use
 print_xml_ac to get those in the printout.

---
 colm/bytecode.cpp | 14 +++++++++++++-
 colm/bytecode.h   |  7 ++++---
 colm/compile.cpp  |  7 ++++++-
 colm/lmparse.kh   |  2 +-
 colm/lmparse.kl   |  4 ++++
 colm/lmscan.rl    |  3 ++-
 colm/parsetree.h  |  1 +
 colm/tree.cpp     | 22 +++++++++++++---------
 8 files changed, 44 insertions(+), 16 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 58db7499..08a1ac98 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -871,6 +871,18 @@ again:
 			tree_downref( prg, sp, tree );
 			break;
 		}
+		case IN_PRINT_XML_AC: {
+			#ifdef COLM_LOG_BYTECODE
+			if ( colm_log_bytecode ) {
+				cerr << "IN_PRINT_XML_AC" << endl;
+			}
+			#endif
+
+			Tree *tree = pop();
+			print_xml_tree( sp, prg, tree, true );
+			tree_downref( prg, sp, tree );
+			break;
+		}
 		case IN_PRINT_XML: {
 			#ifdef COLM_LOG_BYTECODE
 			if ( colm_log_bytecode ) {
@@ -879,7 +891,7 @@ again:
 			#endif
 
 			Tree *tree = pop();
-			print_xml_tree( sp, prg, tree );
+			print_xml_tree( sp, prg, tree, false );
 			tree_downref( prg, sp, tree );
 			break;
 		}
diff --git a/colm/bytecode.h b/colm/bytecode.h
index c13578a7..1b3eb02a 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -183,7 +183,8 @@ typedef unsigned char uchar;
 #define IN_VECTOR_INSERT_BKT     0x84
 
 #define IN_PRINT                 0x87
-#define IN_PRINT_XML             0x88
+#define IN_PRINT_XML_AC          0x88
+#define IN_PRINT_XML             0xab
 
 #define IN_HALT                  0x8a
 
@@ -486,8 +487,8 @@ Tree *prep_parse_tree( Program *prg, Tree **sp, Tree *tree );
 void print_tree( Tree **&sp, Program *prg, Tree *tree );
 void print_tree( ostream &out, Tree **&sp, Program *prg, Tree *tree );
 void print_str( Head *str );
-void print_xml_tree( Tree **&sp, Program *prg, Tree *tree );
-void print_xml_kid( Tree **&sp, Program *prg, Kid *kid, int depth );
+void print_xml_tree( Tree **&sp, Program *prg, Tree *tree, bool commAttr );
+void print_xml_kid( Tree **&sp, Program *prg, Kid *kid, bool commAttr, int depth );
 
 long list_length( List *list );
 void list_append( Program *prg, List *list, Tree *val );
diff --git a/colm/compile.cpp b/colm/compile.cpp
index 918b9712..2a9b810e 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1704,6 +1704,7 @@ void LangStmt::compile( ParseData *pd, CodeVect &code ) const
 {
 	switch ( type ) {
 		case PrintType: 
+		case PrintXMLACType:
 		case PrintXMLType: {
 			UniqueType **types = new UniqueType*[exprPtrVect->length()];
 			
@@ -1716,7 +1717,11 @@ void LangStmt::compile( ParseData *pd, CodeVect &code ) const
 				for ( ExprVect::Iter pex = *exprPtrVect; pex.lte(); pex++ )
 					code.append( IN_PRINT );
 			}
-			else {
+			else if ( type == PrintXMLACType ) {
+				for ( ExprVect::Iter pex = *exprPtrVect; pex.lte(); pex++ )
+					code.append( IN_PRINT_XML_AC );
+			}
+			else if ( type == PrintXMLType ) {
 				for ( ExprVect::Iter pex = *exprPtrVect; pex.lte(); pex++ )
 					code.append( IN_PRINT_XML );
 			}
diff --git a/colm/lmparse.kh b/colm/lmparse.kh
index 0184a76d..b51d0e3d 100644
--- a/colm/lmparse.kh
+++ b/colm/lmparse.kh
@@ -52,7 +52,7 @@ struct Parser
 
 	# Language.
 	token KW_If, KW_While, KW_Else, KW_Elsif, KW_For, KW_Return, KW_Yield, KW_In,
-		KW_Break, KW_PrintXML, KW_Print, KW_Require;
+		KW_Break, KW_PrintXMLAC, KW_PrintXML, KW_Print, KW_Require;
 
 	# Patterns.
 	token KW_Match, KW_Construct, KW_Parse, KW_ParseStop, KW_New, KW_MakeToken,
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index beb70bc8..ed9102cc 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -984,6 +984,10 @@ statement: KW_Print '(' code_expr_list ')'
 	final {
 		$$->stmt = new LangStmt( $1->loc, LangStmt::PrintType, $3->exprVect );
 	};
+statement: KW_PrintXMLAC '(' code_expr_list ')'
+	final {
+		$$->stmt = new LangStmt( $1->loc, LangStmt::PrintXMLACType, $3->exprVect );
+	};
 statement: KW_PrintXML '(' code_expr_list ')'
 	final {
 		$$->stmt = new LangStmt( $1->loc, LangStmt::PrintXMLType, $3->exprVect );
diff --git a/colm/lmscan.rl b/colm/lmscan.rl
index 8d42f274..d5e5f0f8 100644
--- a/colm/lmscan.rl
+++ b/colm/lmscan.rl
@@ -355,7 +355,6 @@ void Scanner::endSection( )
 		'ignore' => { token( KW_Ignore ); };
 		'construct' => { token( KW_Construct ); };
 		'new' => { token( KW_New ); };
-		'print' => { token( KW_Print ); };
 		'if' => { token( KW_If ); };
 		'reject' => { token( KW_Reject ); };
 		'while' => { token( KW_While ); };
@@ -364,6 +363,8 @@ void Scanner::endSection( )
 		'match' => { token( KW_Match ); };
 		'for' => { token( KW_For ); };
 		'iter' => { token( KW_Iter ); };
+		'print' => { token( KW_Print ); };
+		'print_xml_ac' => { token( KW_PrintXMLAC ); };
 		'print_xml' => { token( KW_PrintXML ); };
 		'namespace' => { token( KW_Namespace ); };
 		'lex' => { token( KW_Lex ); };
diff --git a/colm/parsetree.h b/colm/parsetree.h
index e4ef5e38..6de45be6 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -1497,6 +1497,7 @@ struct LangStmt
 	enum Type {
 		AssignType,
 		PrintType,
+		PrintXMLACType,
 		PrintXMLType,
 		ExprType,
 		IfType,
diff --git a/colm/tree.cpp b/colm/tree.cpp
index fafef8b0..42bcec9b 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -500,13 +500,12 @@ void print_xml_ignore_list( Tree **sp, Program *prg, Tree *tree, long depth )
 {
 	Kid *ignore = tree_ignore( prg, tree );
 	while ( tree_is_ignore( prg, ignore ) ) {
-		print_xml_kid( sp, prg, ignore, depth );
+		print_xml_kid( sp, prg, ignore, true, depth );
 		ignore = ignore->next;
 	}
 }
 
-
-void print_xml_kid( Tree **&sp, Program *prg, Kid *kid, int depth )
+void print_xml_kid( Tree **&sp, Program *prg, Kid *kid, bool commAttr, int depth )
 {
 	Kid *child;
 	Tree **root = vm_ptop();
@@ -525,7 +524,8 @@ rec_call:
 	}
 	else {
 		/* First print the ignore tokens. */
-		print_xml_ignore_list( sp, prg, kid->tree, depth );
+		if ( commAttr )
+			print_xml_ignore_list( sp, prg, kid->tree, depth );
 
 		for ( i = 0; i < depth; i++ )
 			cout << "  ";
@@ -534,8 +534,7 @@ rec_call:
 		 * we will close it off immediately. */
 		cout << '<' << lelInfo[kid->tree->id].name;
 
-		/* If the parent kid is a repeat then skip this node and go
-		 * right to the first child (repeated item). */
+		/* If this is an attribute then give the node an attribute number. */
 		if ( vm_ptop() != root ) {
 			objectLength = lelInfo[((Kid*)vm_top())->tree->id].objectLength;
 			if ( kidNum < objectLength )
@@ -544,13 +543,18 @@ rec_call:
 
 		objectLength = lelInfo[kid->tree->id].objectLength;
 		child = tree_child( prg, kid->tree );
-		if ( objectLength > 0 || child != 0 ) {
+		if ( (commAttr && objectLength > 0) || child != 0 ) {
 			cout << '>' << endl;
 			vm_push( (SW) kidNum );
 			vm_push( (SW) kid );
 
 			kidNum = 0;
 			kid = kid->tree->child;
+
+			/* Skip over attributes if not printing comments and attributes. */
+			if ( ! commAttr )
+				kid = child;
+
 			while ( kid != 0 ) {
 				if ( kid->tree == 0 || !lelInfo[kid->tree->id].ignore ) {
 					depth++;
@@ -620,12 +624,12 @@ rec_call:
 		goto rec_return;
 }
 
-void print_xml_tree( Tree **&sp, Program *prg, Tree *tree )
+void print_xml_tree( Tree **&sp, Program *prg, Tree *tree, bool commAttr )
 {
 	Kid kid;
 	kid.tree = tree;
 	kid.next = 0;
-	print_xml_kid( sp, prg, &kid, 0 );
+	print_xml_kid( sp, prg, &kid, commAttr, 0 );
 }
 
 void stream_free( Program *prg, Stream *s )
-- 
cgit v1.2.1


From fd7ecdb4f5f823e5e026ed89841b39ec00a9a9fc Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 26 Feb 2009 00:57:39 +0000
Subject: Can now have generation code blocks on ignore tokens. The send
 function now checks the ignore property of a token to determine if it should
 be ignored. This will require making an ignore_def production type to have
 context-free comments. This will be a normal production but with the ignore
 bit set.

---
 colm/fsmrun.cpp | 146 ++++++++++++++++++++++++++++++++++++--------------------
 colm/fsmrun.h   |   1 +
 2 files changed, 94 insertions(+), 53 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index b027e028..eb629c4c 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -397,6 +397,10 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 			
 			parser->ignore( send->tree );
 			fsmRun->prg->kidPool.free( send );
+
+			/* Set the current state from the next region. */
+			fsmRun->region = parser->getNextRegion();
+			fsmRun->cs = fsmRun->tables->entryByRegion[fsmRun->region];
 		}
 		else {
 			#ifdef COLM_LOG_PARSE
@@ -411,42 +415,6 @@ void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser )
 	}
 }
 
-void FsmRun::sendToken( long id )
-{
-	#ifdef COLM_LOG_PARSE
-	if ( colm_log_parse ) {
-		cerr << "token: " << parser->tables->rtd->lelInfo[id].name << endl;
-	}
-	#endif
-
-	bool ctxDepParsing = prg->ctxDepParsing;
-	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-
-	/* Make the token data. */
-	long length = p-tokstart;
-	Head *tokdata = string_alloc_const( prg, tokstart, length );
-	update_position( this, tokstart, length );
-
-	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
-		/* We don't want the generation actions to automatically consume text
-		 * so reset p since the scanner leaves it at tokend. */
-		p = tokstart;
-		tokstart = 0;
-
-		generationAction( id, tokdata, false, 0 );
-	}
-	else {
-		/* By default the match is consumed and this is what we need. Just
-		 * need to reset tokstart. */
-		tokstart = 0;
-
-		Kid *input = makeToken( id, tokdata, false, 0 );
-		send_handle_error( this, parser, input );
-	}
-
-	memset( mark_leave, 0, sizeof(mark_leave) );
-}
-
 void FsmRun::sendNamedLangEl()
 {
 	/* All three set by getLangEl. */
@@ -644,36 +612,108 @@ void PdaRun::ignore( Tree *tree )
 	accumIgnore = ignore;
 }
 
-void FsmRun::sendIgnore( long id )
+void FsmRun::sendCtxDep( long id )
 {
 	#ifdef COLM_LOG_PARSE
 	if ( colm_log_parse ) {
-		cerr << "ignoring: " << parser->tables->rtd->lelInfo[id].name << endl;
+		cerr << "token gen action: " << parser->tables->rtd->lelInfo[id].name << endl;
 	}
 	#endif
 
-	/* Make the ignore string. */
-	int length = p - tokstart;
-	Head *ignoreStr = string_alloc_const( prg, tokstart, length );
+	/* Make the token data. */
+	long length = p-tokstart;
+	Head *tokdata = string_alloc_const( prg, tokstart, length );
 	update_position( this, tokstart, length );
-	tokstart = 0;
-	
-	Tree *tree = prg->treePool.allocate();
-	tree->refs = 1;
-	tree->id = id;
-	tree->tokdata = ignoreStr;
 
-	/* Send it to the parser. */
-	parser->ignore( tree );
+	p = tokstart;
+	tokstart = 0;
 
-	/* Prepare for more scanning. */
-	inputStream->position += length;
-	region = parser->getNextRegion();
-	cs = tables->entryByRegion[region];
+	generationAction( id, tokdata, false, 0 );
 
 	memset( mark_leave, 0, sizeof(mark_leave) );
 }
 
+void FsmRun::sendIgnore( long id )
+{
+	bool ctxDepParsing = prg->ctxDepParsing;
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
+		sendCtxDep( id );
+	}
+	else
+	{
+		#ifdef COLM_LOG_PARSE
+		if ( colm_log_parse ) {
+			cerr << "ignoring: " << parser->tables->rtd->lelInfo[id].name << endl;
+		}
+		#endif
+
+		/* Make the ignore string. */
+		int length = p - tokstart;
+		Head *ignoreStr = string_alloc_const( prg, tokstart, length );
+		update_position( this, tokstart, length );
+		tokstart = 0;
+		
+		Tree *tree = prg->treePool.allocate();
+		tree->refs = 1;
+		tree->id = id;
+		tree->tokdata = ignoreStr;
+
+		/* Send it to the parser. */
+		parser->ignore( tree );
+
+		/* Prepare for more scanning. */
+		inputStream->position += length;
+		region = parser->getNextRegion();
+		cs = tables->entryByRegion[region];
+
+		memset( mark_leave, 0, sizeof(mark_leave) );
+	}
+}
+
+void FsmRun::sendToken( long id )
+{
+	bool ctxDepParsing = prg->ctxDepParsing;
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
+		sendCtxDep( id );
+	}
+	else {
+		#ifdef COLM_LOG_PARSE
+		if ( colm_log_parse ) {
+			cerr << "token: " << parser->tables->rtd->lelInfo[id].name << endl;
+		}
+		#endif
+
+		bool ctxDepParsing = prg->ctxDepParsing;
+		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+
+		/* Make the token data. */
+		long length = p-tokstart;
+		Head *tokdata = string_alloc_const( prg, tokstart, length );
+		update_position( this, tokstart, length );
+
+		if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
+			/* We don't want the generation actions to automatically consume text
+			 * so reset p since the scanner leaves it at tokend. */
+			p = tokstart;
+			tokstart = 0;
+
+			generationAction( id, tokdata, false, 0 );
+		}
+		else {
+			/* By default the match is consumed and this is what we need. Just
+			 * need to reset tokstart. */
+			tokstart = 0;
+
+			Kid *input = makeToken( id, tokdata, false, 0 );
+			send_handle_error( this, parser, input );
+		}
+
+		memset( mark_leave, 0, sizeof(mark_leave) );
+	}
+}
+
 void FsmRun::emitToken( KlangEl *token )
 {
 	if ( token->ignore )
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 7d96112c..a5a8b793 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -91,6 +91,7 @@ struct FsmRun
 	void sendNamedLangEl();
 	void sendEOF();
 	void sendIgnore( long id );
+	void sendCtxDep( long id );
 	void sendToken( long id );
 
 	void sendBackIgnore( Kid *ignore );
-- 
cgit v1.2.1


From d3bf24722340a7cb15b95928c860c3adfee37f9a Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 26 Feb 2009 01:49:05 +0000
Subject: When the scanner is generated we can decide then if we need to call a
 token generation action. Call execGen right from fsmExec. Allows some
 cleanup.

---
 colm/fsmcodegen.cpp |   4 +-
 colm/fsmrun.cpp     | 106 ++++++++++++++++++++--------------------------------
 colm/fsmrun.h       |   2 +-
 3 files changed, 45 insertions(+), 67 deletions(-)

diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
index e0eb3d9d..4955c930 100644
--- a/colm/fsmcodegen.cpp
+++ b/colm/fsmcodegen.cpp
@@ -197,7 +197,9 @@ void FsmCodeGen::SET_TOKSTART( ostream &ret, InlineItem *item )
 
 void FsmCodeGen::EMIT_TOKEN( ostream &ret, KlangEl *token )
 {
-	if ( token->ignore )
+	if ( token->transBlock != 0 )
+		ret << "	execGen( " << token->id << " );\n";
+	else if ( token->ignore )
 		ret << "	sendIgnore( " << token->id << " );\n";
 	else 
 		ret << "	sendToken( " << token->id << " );\n";
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index eb629c4c..aa1f728f 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -612,7 +612,7 @@ void PdaRun::ignore( Tree *tree )
 	accumIgnore = ignore;
 }
 
-void FsmRun::sendCtxDep( long id )
+void FsmRun::execGen( long id )
 {
 	#ifdef COLM_LOG_PARSE
 	if ( colm_log_parse ) {
@@ -635,88 +635,64 @@ void FsmRun::sendCtxDep( long id )
 
 void FsmRun::sendIgnore( long id )
 {
-	bool ctxDepParsing = prg->ctxDepParsing;
-	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
-		sendCtxDep( id );
+	#ifdef COLM_LOG_PARSE
+	if ( colm_log_parse ) {
+		cerr << "ignoring: " << parser->tables->rtd->lelInfo[id].name << endl;
 	}
-	else
-	{
-		#ifdef COLM_LOG_PARSE
-		if ( colm_log_parse ) {
-			cerr << "ignoring: " << parser->tables->rtd->lelInfo[id].name << endl;
-		}
-		#endif
+	#endif
 
-		/* Make the ignore string. */
-		int length = p - tokstart;
-		Head *ignoreStr = string_alloc_const( prg, tokstart, length );
-		update_position( this, tokstart, length );
-		tokstart = 0;
-		
-		Tree *tree = prg->treePool.allocate();
-		tree->refs = 1;
-		tree->id = id;
-		tree->tokdata = ignoreStr;
+	/* Make the ignore string. */
+	int length = p - tokstart;
+	Head *ignoreStr = string_alloc_const( prg, tokstart, length );
+	update_position( this, tokstart, length );
+	tokstart = 0;
+	
+	Tree *tree = prg->treePool.allocate();
+	tree->refs = 1;
+	tree->id = id;
+	tree->tokdata = ignoreStr;
 
-		/* Send it to the parser. */
-		parser->ignore( tree );
+	/* Send it to the parser. */
+	parser->ignore( tree );
 
-		/* Prepare for more scanning. */
-		inputStream->position += length;
-		region = parser->getNextRegion();
-		cs = tables->entryByRegion[region];
+	/* Prepare for more scanning. */
+	inputStream->position += length;
+	region = parser->getNextRegion();
+	cs = tables->entryByRegion[region];
 
-		memset( mark_leave, 0, sizeof(mark_leave) );
-	}
+	memset( mark_leave, 0, sizeof(mark_leave) );
 }
 
 void FsmRun::sendToken( long id )
 {
-	bool ctxDepParsing = prg->ctxDepParsing;
-	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-	if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
-		sendCtxDep( id );
+	#ifdef COLM_LOG_PARSE
+	if ( colm_log_parse ) {
+		cerr << "token: " << parser->tables->rtd->lelInfo[id].name << endl;
 	}
-	else {
-		#ifdef COLM_LOG_PARSE
-		if ( colm_log_parse ) {
-			cerr << "token: " << parser->tables->rtd->lelInfo[id].name << endl;
-		}
-		#endif
-
-		bool ctxDepParsing = prg->ctxDepParsing;
-		LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-
-		/* Make the token data. */
-		long length = p-tokstart;
-		Head *tokdata = string_alloc_const( prg, tokstart, length );
-		update_position( this, tokstart, length );
+	#endif
 
-		if ( ctxDepParsing && lelInfo[id].frameId >= 0 ) {
-			/* We don't want the generation actions to automatically consume text
-			 * so reset p since the scanner leaves it at tokend. */
-			p = tokstart;
-			tokstart = 0;
+	/* Make the token data. */
+	long length = p-tokstart;
+	Head *tokdata = string_alloc_const( prg, tokstart, length );
+	update_position( this, tokstart, length );
 
-			generationAction( id, tokdata, false, 0 );
-		}
-		else {
-			/* By default the match is consumed and this is what we need. Just
-			 * need to reset tokstart. */
-			tokstart = 0;
+	/* By default the match is consumed and this is what we need. Just
+	 * need to reset tokstart. */
+	tokstart = 0;
 
-			Kid *input = makeToken( id, tokdata, false, 0 );
-			send_handle_error( this, parser, input );
-		}
+	Kid *input = makeToken( id, tokdata, false, 0 );
+	send_handle_error( this, parser, input );
 
-		memset( mark_leave, 0, sizeof(mark_leave) );
-	}
+	memset( mark_leave, 0, sizeof(mark_leave) );
 }
 
 void FsmRun::emitToken( KlangEl *token )
 {
-	if ( token->ignore )
+	bool ctxDepParsing = prg->ctxDepParsing;
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+	if ( ctxDepParsing && lelInfo[token->id].frameId >= 0 )
+		execGen( token->id );
+	else if ( token->ignore )
 		sendIgnore( token->id );
 	else
 		sendToken( token->id );
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index a5a8b793..70a6b5b6 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -91,8 +91,8 @@ struct FsmRun
 	void sendNamedLangEl();
 	void sendEOF();
 	void sendIgnore( long id );
-	void sendCtxDep( long id );
 	void sendToken( long id );
+	void execGen( long id );
 
 	void sendBackIgnore( Kid *ignore );
 	void sendBack( Kid *input );
-- 
cgit v1.2.1


From 9093101090f41cebda94486a68afd50096236ee8 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 26 Feb 2009 01:53:10 +0000
Subject: removed some duplicate position updates

---
 colm/fsmrun.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index aa1f728f..ba803c96 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -623,7 +623,9 @@ void FsmRun::execGen( long id )
 	/* Make the token data. */
 	long length = p-tokstart;
 	Head *tokdata = string_alloc_const( prg, tokstart, length );
-	update_position( this, tokstart, length );
+
+	/* Note that we don't update the position now. It is done when the token
+	 * data is pulled from the stream. */
 
 	p = tokstart;
 	tokstart = 0;
@@ -656,7 +658,6 @@ void FsmRun::sendIgnore( long id )
 	parser->ignore( tree );
 
 	/* Prepare for more scanning. */
-	inputStream->position += length;
 	region = parser->getNextRegion();
 	cs = tables->entryByRegion[region];
 
-- 
cgit v1.2.1


From b591f8a623447b4fce22f53bc76a19a76810a89b Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 27 Feb 2009 01:45:48 +0000
Subject: Added a sync pattern.

---
 colm.vim | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/colm.vim b/colm.vim
index 40aef135..8b7b5799 100644
--- a/colm.vim
+++ b/colm.vim
@@ -72,6 +72,8 @@ syntax region defTypes matchgroup=defKeywords
 	\ start="\<rl\>" start="\<def\>" start="\<token\>" start="\<ignore\>"
 	\ matchgroup=Function end="[a-zA-Z_][a-zA-Z0-9_]*" end="/"me=e-1
 
+syntax sync match colmSyncPat grouphere NONE "([{}]|\<token\>|\<ignore\>|\<def\>)"
+
 "
 " Specifying Groups
 "
-- 
cgit v1.2.1


From 1b9131c53d32c10e2f69186f7795a5d764f2eab2 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 27 Feb 2009 01:49:00 +0000
Subject: Got trailing context working. The marks are not yet shifted along
 with the buffer contents.

---
 colm/fsmcodegen.cpp |   3 ++
 colm/fsmexec.cpp    |   3 ++
 colm/fsmrun.cpp     |  20 ++++++++-
 colm/fsmrun.h       |   1 +
 colm/keyops.h       |   4 +-
 colm/lmparse.kl     |  21 ++++++++-
 colm/parsedata.cpp  |   3 +-
 colm/parsedata.h    |   5 +++
 colm/parsetree.cpp  | 127 +++++++++-------------------------------------------
 colm/parsetree.h    |   6 +--
 colm/pdabuild.cpp   |   5 +++
 colm/pdacodegen.cpp |   4 +-
 colm/pdarun.h       |   1 +
 colm/redbuild.cpp   |   1 +
 colm/redfsm.h       |   6 ++-
 15 files changed, 94 insertions(+), 116 deletions(-)

diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
index 4955c930..6d819970 100644
--- a/colm/fsmcodegen.cpp
+++ b/colm/fsmcodegen.cpp
@@ -329,6 +329,9 @@ void FsmCodeGen::ACTION( ostream &ret, GenAction *action, int targState, bool in
 			ret << "mark_leave[" << field->offset << "] = " << P() << ";\n";
 	}
 
+	if ( action->markType == MarkMatchEnd )
+		ret << "mark_match_end[" << action->matchEndNum << "] = " << P() << ";\n";
+
 	ret << "}\n";
 
 }
diff --git a/colm/fsmexec.cpp b/colm/fsmexec.cpp
index 6f152d56..ea1af928 100644
--- a/colm/fsmexec.cpp
+++ b/colm/fsmexec.cpp
@@ -94,6 +94,9 @@ void FsmRun::execAction( GenAction *genAction )
 		else if ( genAction->markType == MarkLeave )
 			mark_leave[field->offset] = p;
 	}
+
+	if ( genAction->markType == MarkMatchEnd )
+		mark_match_end[genAction->matchEndNum] = p;
 }
 
 void FsmRun::execute()
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index ba803c96..bfbc898d 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -620,8 +620,12 @@ void FsmRun::execGen( long id )
 	}
 	#endif
 
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+	if ( lelInfo[id].matchEnd >= 0 )
+		p = mark_match_end[lelInfo[id].matchEnd];
+
 	/* Make the token data. */
-	long length = p-tokstart;
+	long length = p - tokstart;
 	Head *tokdata = string_alloc_const( prg, tokstart, length );
 
 	/* Note that we don't update the position now. It is done when the token
@@ -633,6 +637,7 @@ void FsmRun::execGen( long id )
 	generationAction( id, tokdata, false, 0 );
 
 	memset( mark_leave, 0, sizeof(mark_leave) );
+	memset( mark_match_end, 0, sizeof(mark_match_end) );
 }
 
 void FsmRun::sendIgnore( long id )
@@ -643,6 +648,10 @@ void FsmRun::sendIgnore( long id )
 	}
 	#endif
 
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+	if ( lelInfo[id].matchEnd >= 0 )
+		p = mark_match_end[lelInfo[id].matchEnd];
+
 	/* Make the ignore string. */
 	int length = p - tokstart;
 	Head *ignoreStr = string_alloc_const( prg, tokstart, length );
@@ -662,6 +671,7 @@ void FsmRun::sendIgnore( long id )
 	cs = tables->entryByRegion[region];
 
 	memset( mark_leave, 0, sizeof(mark_leave) );
+	memset( mark_match_end, 0, sizeof(mark_match_end) );
 }
 
 void FsmRun::sendToken( long id )
@@ -672,8 +682,12 @@ void FsmRun::sendToken( long id )
 	}
 	#endif
 
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+	if ( lelInfo[id].matchEnd >= 0 )
+		p = mark_match_end[lelInfo[id].matchEnd];
+
 	/* Make the token data. */
-	long length = p-tokstart;
+	long length = p - tokstart;
 	Head *tokdata = string_alloc_const( prg, tokstart, length );
 	update_position( this, tokstart, length );
 
@@ -685,6 +699,7 @@ void FsmRun::sendToken( long id )
 	send_handle_error( this, parser, input );
 
 	memset( mark_leave, 0, sizeof(mark_leave) );
+	memset( mark_match_end, 0, sizeof(mark_match_end) );
 }
 
 void FsmRun::emitToken( KlangEl *token )
@@ -836,6 +851,7 @@ long FsmRun::run( PdaRun *destParser )
 	region = parser->getNextRegion();
 	cs = tables->entryByRegion[region];
 	memset( mark_leave, 0, sizeof(mark_leave) );
+	memset( mark_match_end, 0, sizeof(mark_match_end) );
 
 	/* Start with the EOF test. The pattern and replacement input sources can
 	 * be EOF from the start. */
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 70a6b5b6..07930b49 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -124,6 +124,7 @@ struct FsmRun
 	bool gotoResume;
 	char *mark_enter[32];
 	char *mark_leave[32];
+	char *mark_match_end[32];
 };
 
 void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser );
diff --git a/colm/keyops.h b/colm/keyops.h
index 8fb9b86b..791495ee 100644
--- a/colm/keyops.h
+++ b/colm/keyops.h
@@ -27,8 +27,10 @@
 
 enum MarkType
 {
+	MarkNone,
 	MarkEnter,
-	MarkLeave
+	MarkLeave,
+	MarkMatchEnd
 };
 
 typedef unsigned long long Size;
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index ed9102cc..fa46c9fc 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -1490,19 +1490,32 @@ field_init: TK_Word ':' code_expr
 
 nonterm opt_rl_join uses rl_join;
 
-opt_rl_join: rl_join
+opt_rl_join: rl_join opt_context
 	final {
 		$$->join = $1->join;
+		$$->context = $2->context;
+
+		if ( $2->context != 0 ) {
+			/* Create the enter and leaving actions that will mark the substring. */
+			Action *mark = new Action( MarkMatchEnd, 0 );
+			mark->matchEndNum = pd->nextMatchEndNum++;
+			pd->actionList.append( mark );
+
+			$$->join->context = $2->context;
+			$$->join->mark = mark;
+		}
 	};
 
 opt_rl_join:
 	final {
 		$$->join = 0;
+		$$->context = 0;
 	};
 
 nonterm rl_join
 {
 	Join *join;
+	Join *context;
 };
 
 rl_join: 
@@ -1518,6 +1531,12 @@ rl_join:
 		$$->join = new Join( $1->expression );
 	};
 
+# Context at the end of a pattern that is not included in the match
+nonterm opt_context uses rl_join;
+
+opt_context: '@' rl_join final { $$->context = $2->join; };
+opt_context: final { $$->context = 0; };
+
 nonterm rl_expr
 {
 	Expression *expression;
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index b7b3e526..19599e6b 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -429,7 +429,8 @@ ParseData::ParseData( const String &fileName, const String &sectionName,
 	nextParserId(0),
 	nextLabelId(0),
 	revertOn(true),
-	predValue(0)
+	predValue(0),
+	nextMatchEndNum(0)
 {
 }
 
diff --git a/colm/parsedata.h b/colm/parsedata.h
index caf65e44..855855fd 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -297,7 +297,9 @@ public:
 	:
 		loc(loc),
 		name(name),
+		markType(MarkNone),
 		objField(0),
+		matchEndNum(0),
 		inlineList(inlineList), 
 		actionId(-1),
 		numTransRefs(0),
@@ -315,6 +317,7 @@ public:
 		name("mark"),
 		markType(markType),
 		objField(objField),
+		matchEndNum(0),
 		inlineList(new InlineList), 
 		actionId(-1),
 		numTransRefs(0),
@@ -336,6 +339,7 @@ public:
 	
 	MarkType markType;
 	ObjField *objField;
+	long matchEndNum;
 
 	InlineList *inlineList;
 	int actionId;
@@ -920,6 +924,7 @@ struct ParseData
 	PdaTables *pdaTables;
 
 	long predValue;
+	long nextMatchEndNum;
 };
 
 void afterOpMinimize( FsmGraph *fsm, bool lastInSeq = true );
diff --git a/colm/parsetree.cpp b/colm/parsetree.cpp
index 438193ee..5c951324 100644
--- a/colm/parsetree.cpp
+++ b/colm/parsetree.cpp
@@ -607,18 +607,11 @@ void JoinOrLm::resolveNameRefs( ParseData *pd )
 }
 
 
-/* Construct with a location and the first expression. */
-Join::Join( const InputLoc &loc, Expression *expr )
-:
-	loc(loc)
-{
-	exprList.append( expr );
-}
-
 /* Construct with a location and the first expression. */
 Join::Join( Expression *expr )
 :
-	loc(loc)
+	context(0),
+	mark(0)
 {
 	exprList.append( expr );
 }
@@ -626,122 +619,44 @@ Join::Join( Expression *expr )
 /* Walk an expression node. */
 FsmGraph *Join::walk( ParseData *pd )
 {
-	if ( exprList.length() > 1 )
-		return walkJoin( pd );
-	else
-		return exprList.head->walk( pd );
-}
+	assert( exprList.length() == 1 );
 
-/* There is a list of expressions to join. */
-FsmGraph *Join::walkJoin( ParseData *pd )
-{
-	/* We enter into a new name scope. */
-	NameFrame nameFrame = pd->enterNameScope( true, 1 );
-
-	/* Evaluate the machines. */
-	FsmGraph **fsms = new FsmGraph*[exprList.length()];
-	ExprList::Iter expr = exprList;
-	for ( int e = 0; e < exprList.length(); e++, expr++ )
-		fsms[e] = expr->walk( pd );
-	
-	/* Get the start and final names. Final is 
-	 * guaranteed to exist, start is not. */
-	NameInst *startName = pd->curNameInst->start;
-	NameInst *finalName = pd->curNameInst->final;
+	FsmGraph *retFsm = exprList.head->walk( pd );
 
-	int startId = -1;
-	if ( startName != 0 ) {
-		/* Take note that there was an implicit link to the start machine. */
-		pd->localNameScope->referencedNames.append( startName );
-		startId = startName->id;
+	/* Maybe the the context. */
+	if ( context != 0 ) {
+		retFsm->leaveFsmAction( pd->curActionOrd++, mark );
+		FsmGraph *contextGraph = context->walk( pd );
+		retFsm->concatOp( contextGraph );
 	}
 
-	/* A final id of -1 indicates there is no epsilon that references the
-	 * final state, therefor do not create one or set an entry point to it. */
-	int finalId = -1;
-	if ( finalName->numRefs > 0 )
-		finalId = finalName->id;
-
-	/* Join machines 1 and up onto machine 0. */
-	FsmGraph *retFsm = fsms[0];
-	retFsm->joinOp( startId, finalId, fsms+1, exprList.length()-1 );
-
-	/* We can now unset entry points that are not longer used. */
-	pd->unsetObsoleteEntries( retFsm );
-
-	/* Pop the name scope. */
-	pd->popNameScope( nameFrame );
-
-	delete[] fsms;
 	return retFsm;
 }
 
 void Join::makeNameTree( ParseData *pd )
 {
-	if ( exprList.length() > 1 ) {
-		/* Create the new anonymous scope. */
-		NameInst *prevNameInst = pd->curNameInst;
-		pd->curNameInst = pd->addNameInst( loc, 0, false );
+	assert( exprList.length() == 1 );
 
-		/* Join scopes need an implicit "final" target. */
-		pd->curNameInst->final = new NameInst( InputLoc(), pd->curNameInst, "final", 
-				pd->nextNameId++, false );
+	/* Recurse into the single expression. */
+	exprList.head->makeNameTree( pd );
 
-		/* Recurse into all expressions in the list. */
-		for ( ExprList::Iter expr = exprList; expr.lte(); expr++ )
-			expr->makeNameTree( pd );
-
-		/* The name scope ends, pop the name instantiation. */
-		pd->curNameInst = prevNameInst;
-	}
-	else {
-		/* Recurse into the single expression. */
-		exprList.head->makeNameTree( pd );
-	}
+	/* Maybe the the context. */
+	if ( context != 0 )
+		context->makeNameTree( pd );
 }
 
 
 void Join::resolveNameRefs( ParseData *pd )
 {
 	/* Branch on whether or not there is to be a join. */
-	if ( exprList.length() > 1 ) {
-		/* The variable definition enters a new scope. */
-		NameFrame nameFrame = pd->enterNameScope( true, 1 );
-
-		/* The join scope must contain a start label. */
-		NameSet resolved = pd->resolvePart( pd->localNameScope, "start", true );
-		if ( resolved.length() > 0 ) {
-			/* Take the first. */
-			pd->curNameInst->start = resolved[0];
-			if ( resolved.length() > 1 ) {
-				/* Complain about the multiple references. */
-				error(loc) << "multiple start labels" << endl;
-				errorStateLabels( resolved );
-			}
-		}
+	assert( exprList.length() == 1 );
 
-		/* Make sure there is a start label. */
-		if ( pd->curNameInst->start != 0 ) {
-			/* There is an implicit reference to start name. */
-			pd->curNameInst->start->numRefs += 1;
-		}
-		else {
-			/* No start label. Complain and recover by adding a label to the
-			 * adding one. Recover ignoring the problem. */
-			error(loc) << "no start label" << endl;
-		}
-
-		/* Recurse into all expressions in the list. */
-		for ( ExprList::Iter expr = exprList; expr.lte(); expr++ )
-			expr->resolveNameRefs( pd );
+	/* Recurse into the single expression. */
+	exprList.head->resolveNameRefs( pd );
 
-		/* The name scope ends, pop the name instantiation. */
-		pd->popNameScope( nameFrame );
-	}
-	else {
-		/* Recurse into the single expression. */
-		exprList.head->resolveNameRefs( pd );
-	}
+	/* Maybe the the context. */
+	if ( context != 0 )
+		context->resolveNameRefs( pd );
 }
 
 /* Clean up after an expression node. */
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 6de45be6..86324848 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -480,17 +480,17 @@ struct Join
 {
 	/* Construct with the first expression. */
 	Join( Expression *expr );
-	Join( const InputLoc &loc, Expression *expr );
 
 	/* Tree traversal. */
 	FsmGraph *walk( ParseData *pd );
-	FsmGraph *walkJoin( ParseData *pd );
 	void makeNameTree( ParseData *pd );
 	void resolveNameRefs( ParseData *pd );
 
 	/* Data. */
-	InputLoc loc;
 	ExprList exprList;
+
+	Join *context;
+	Action *mark;
 };
 
 /*
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index a616de1b..99c20bad 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1410,6 +1410,11 @@ void ParseData::makeRuntimeData()
 					lel->objectDef->size();
 			runtimeData->lelInfo[i].termDupId = lel->termDup == 0 ? 0 : lel->termDup->id;
 			runtimeData->lelInfo[i].genericId = lel->generic == 0 ? 0 : lel->generic->id;
+
+			if ( lel->tokenDef != 0 && lel->tokenDef->join != 0 && lel->tokenDef->join->context != 0 )
+				runtimeData->lelInfo[i].matchEnd = lel->tokenDef->join->mark->matchEndNum;
+			else
+				runtimeData->lelInfo[i].matchEnd = -1;
 		}
 		else {
 			memset(&runtimeData->lelInfo[i], 0, sizeof(LangElInfo) );
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index f5d6de5e..62a8b8df 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -191,7 +191,9 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTable
 
 		out << runtimeData->lelInfo[i].termDupId << ", ";
 
-		out << runtimeData->lelInfo[i].genericId;
+		out << runtimeData->lelInfo[i].genericId << ", ";
+
+		out << runtimeData->lelInfo[i].matchEnd;
 
 		out << " }";
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index b95d8806..a52edfbc 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -353,6 +353,7 @@ struct LangElInfo
 
 	long termDupId;
 	long genericId;
+	long matchEnd;
 };
 
 struct ObjFieldInfo
diff --git a/colm/redbuild.cpp b/colm/redbuild.cpp
index e7be055b..2df68aea 100644
--- a/colm/redbuild.cpp
+++ b/colm/redbuild.cpp
@@ -432,6 +432,7 @@ void RedFsmBuild::newAction( int anum, char *name, int line, int col, Action *ac
 	redFsm->allActions[anum].inlineList = action->inlineList;
 	redFsm->allActions[anum].objField = action->objField;
 	redFsm->allActions[anum].markType = action->markType;
+	redFsm->allActions[anum].matchEndNum = action->matchEndNum;
 }
 
 void RedFsmBuild::makeAction( Action *action )
diff --git a/colm/redfsm.h b/colm/redfsm.h
index d5d5a03f..4ddb0dbf 100644
--- a/colm/redfsm.h
+++ b/colm/redfsm.h
@@ -65,6 +65,9 @@ struct GenAction
 		name(0),
 		inlineList(0), 
 		actionId(0),
+		markType(MarkNone),
+		objField(0),
+		matchEndNum(0),
 		numTransRefs(0),
 		numToStateRefs(0),
 		numFromStateRefs(0),
@@ -77,8 +80,9 @@ struct GenAction
 	char *name;
 	InlineList *inlineList;
 	int actionId;
-	ObjField *objField;
 	MarkType markType;
+	ObjField *objField;
+	long matchEndNum;
 
 	string nameOrLoc();
 
-- 
cgit v1.2.1


From 2c21e2cd0340f2a777530da692bc0669bc8dc1bd Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Fri, 27 Feb 2009 03:42:08 +0000
Subject: Some work on unifying the marking facilities for trailing context and
 sub-regex capture. Now using the same marking array for the trailing context
 and the capture. The set markers are now shifted along with partial token
 matches. But not yet propagating the list of captures associated with a token
 to the runtime data.

---
 colm/fsmcodegen.cpp | 12 ++----------
 colm/fsmexec.cpp    | 12 ++----------
 colm/fsmrun.cpp     | 52 ++++++++++++++++++++++++++++------------------------
 colm/fsmrun.h       |  6 +++---
 colm/keyops.h       |  4 +---
 colm/lmparse.kh     |  1 +
 colm/lmparse.kl     | 15 +++++++++++----
 colm/parsedata.h    | 11 ++++++-----
 colm/parsetree.h    | 13 +++++++++++++
 colm/pdabuild.cpp   |  9 ++++++---
 colm/pdacodegen.cpp |  2 +-
 colm/pdarun.h       | 11 ++++++++++-
 colm/redbuild.cpp   |  2 +-
 colm/redfsm.h       |  4 ++--
 14 files changed, 87 insertions(+), 67 deletions(-)

diff --git a/colm/fsmcodegen.cpp b/colm/fsmcodegen.cpp
index 6d819970..fe5a6fb3 100644
--- a/colm/fsmcodegen.cpp
+++ b/colm/fsmcodegen.cpp
@@ -321,16 +321,8 @@ void FsmCodeGen::ACTION( ostream &ret, GenAction *action, int targState, bool in
 	ret << "\t{";
 	INLINE_LIST( ret, action->inlineList, targState, inFinish );
 
-	if ( action->objField ) {
-		ObjField *field = action->objField;
-		if ( action->markType == MarkEnter )
-			ret << "mark_enter[" << field->offset << "] = " << P() << ";\n";
-		else if ( action->markType == MarkLeave )
-			ret << "mark_leave[" << field->offset << "] = " << P() << ";\n";
-	}
-
-	if ( action->markType == MarkMatchEnd )
-		ret << "mark_match_end[" << action->matchEndNum << "] = " << P() << ";\n";
+	if ( action->markId >= 0 )
+		ret << "mark[" << action->markId << "] = " << P() << ";\n";
 
 	ret << "}\n";
 
diff --git a/colm/fsmexec.cpp b/colm/fsmexec.cpp
index ea1af928..8f5d7600 100644
--- a/colm/fsmexec.cpp
+++ b/colm/fsmexec.cpp
@@ -87,16 +87,8 @@ void FsmRun::execAction( GenAction *genAction )
 		}
 	}
 
-	if ( genAction->objField ) {
-		ObjField *field = genAction->objField;
-		if ( genAction->markType == MarkEnter )
-			mark_enter[field->offset] = p;
-		else if ( genAction->markType == MarkLeave )
-			mark_leave[field->offset] = p;
-	}
-
-	if ( genAction->markType == MarkMatchEnd )
-		mark_match_end[genAction->matchEndNum] = p;
+	if ( genAction->markType == MarkMark )
+		mark[genAction->markId] = p;
 }
 
 void FsmRun::execute()
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index bfbc898d..0f20b8cc 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -511,15 +511,15 @@ Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 	/* No children and ignores get added later. */
 	input->tree->child = attrs;
 
-	/* Set attributes for the labelled components. */
-	for ( int i = 0; i < 32; i++ ) {
-		if ( mark_leave[i] != 0 ) {
-			Head *data = string_alloc_new( prg, 
-					mark_enter[i], mark_leave[i] - mark_enter[i] );
-			set_attr( input->tree, i, construct_string( prg, data ) );
-			tree_upref( get_attr( input->tree, i ) );
-		}
-	}
+//	/* Set attributes for the labelled components. */
+//	for ( int i = 0; i < 32; i++ ) {
+//		if ( mark_leave[i] != 0 ) {
+//			Head *data = string_alloc_new( prg, 
+//					mark_enter[i], mark_leave[i] - mark_enter[i] );
+//			set_attr( input->tree, i, construct_string( prg, data ) );
+//			tree_upref( get_attr( input->tree, i ) );
+//		}
+//	}
 	
 	/* If the item is bound then store it in the bindings array. */
 	if ( bindId > 0 ) {
@@ -621,8 +621,8 @@ void FsmRun::execGen( long id )
 	#endif
 
 	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-	if ( lelInfo[id].matchEnd >= 0 )
-		p = mark_match_end[lelInfo[id].matchEnd];
+	if ( lelInfo[id].markId >= 0 )
+		p = mark[lelInfo[id].markId];
 
 	/* Make the token data. */
 	long length = p - tokstart;
@@ -636,8 +636,7 @@ void FsmRun::execGen( long id )
 
 	generationAction( id, tokdata, false, 0 );
 
-	memset( mark_leave, 0, sizeof(mark_leave) );
-	memset( mark_match_end, 0, sizeof(mark_match_end) );
+	memset( mark, 0, sizeof(mark) );
 }
 
 void FsmRun::sendIgnore( long id )
@@ -649,8 +648,8 @@ void FsmRun::sendIgnore( long id )
 	#endif
 
 	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-	if ( lelInfo[id].matchEnd >= 0 )
-		p = mark_match_end[lelInfo[id].matchEnd];
+	if ( lelInfo[id].markId >= 0 )
+		p = mark[lelInfo[id].markId];
 
 	/* Make the ignore string. */
 	int length = p - tokstart;
@@ -670,8 +669,7 @@ void FsmRun::sendIgnore( long id )
 	region = parser->getNextRegion();
 	cs = tables->entryByRegion[region];
 
-	memset( mark_leave, 0, sizeof(mark_leave) );
-	memset( mark_match_end, 0, sizeof(mark_match_end) );
+	memset( mark, 0, sizeof(mark) );
 }
 
 void FsmRun::sendToken( long id )
@@ -683,8 +681,8 @@ void FsmRun::sendToken( long id )
 	#endif
 
 	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
-	if ( lelInfo[id].matchEnd >= 0 )
-		p = mark_match_end[lelInfo[id].matchEnd];
+	if ( lelInfo[id].markId >= 0 )
+		p = mark[lelInfo[id].markId];
 
 	/* Make the token data. */
 	long length = p - tokstart;
@@ -698,8 +696,7 @@ void FsmRun::sendToken( long id )
 	Kid *input = makeToken( id, tokdata, false, 0 );
 	send_handle_error( this, parser, input );
 
-	memset( mark_leave, 0, sizeof(mark_leave) );
-	memset( mark_match_end, 0, sizeof(mark_match_end) );
+	memset( mark, 0, sizeof(mark) );
 }
 
 void FsmRun::emitToken( KlangEl *token )
@@ -850,8 +847,7 @@ long FsmRun::run( PdaRun *destParser )
 	tokend = 0;
 	region = parser->getNextRegion();
 	cs = tables->entryByRegion[region];
-	memset( mark_leave, 0, sizeof(mark_leave) );
-	memset( mark_match_end, 0, sizeof(mark_match_end) );
+	memset( mark, 0, sizeof(mark) );
 
 	/* Start with the EOF test. The pattern and replacement input sources can
 	 * be EOF from the start. */
@@ -998,8 +994,16 @@ long FsmRun::run( PdaRun *destParser )
 				runBuf->next->length = FSM_BUFSIZE - have;
 
 				/* Compute tokstart and tokend. */
-				tokend = runBuf->buf + (tokend - tokstart);
+				long dist = tokstart - runBuf->buf;
+
+				tokend -= dist;
 				tokstart = runBuf->buf;
+
+				/* Shift any markers. */
+				for ( int i = 0; i < MARK_SLOTS; i++ ) {
+					if ( mark[i] != 0 )
+						mark[i] -= dist;
+				}
 			}
 			p = pe = runBuf->buf + have;
 			peof = 0;
diff --git a/colm/fsmrun.h b/colm/fsmrun.h
index 07930b49..ed25c829 100644
--- a/colm/fsmrun.h
+++ b/colm/fsmrun.h
@@ -81,6 +81,8 @@ struct RunBuf
 	RunBuf *next;
 };
 
+#define MARK_SLOTS 32
+
 struct FsmRun
 {
 	FsmRun( Program *prg );
@@ -122,9 +124,7 @@ struct FsmRun
 	bool eofSent;
 	RunBuf *runBuf;
 	bool gotoResume;
-	char *mark_enter[32];
-	char *mark_leave[32];
-	char *mark_match_end[32];
+	char *mark[MARK_SLOTS];
 };
 
 void send_queued_tokens( FsmRun *fsmRun, PdaRun *parser );
diff --git a/colm/keyops.h b/colm/keyops.h
index 791495ee..b5af65e7 100644
--- a/colm/keyops.h
+++ b/colm/keyops.h
@@ -28,9 +28,7 @@
 enum MarkType
 {
 	MarkNone,
-	MarkEnter,
-	MarkLeave,
-	MarkMatchEnd
+	MarkMark
 };
 
 typedef unsigned long long Size;
diff --git a/colm/lmparse.kh b/colm/lmparse.kh
index b51d0e3d..2cc3e99a 100644
--- a/colm/lmparse.kh
+++ b/colm/lmparse.kh
@@ -103,6 +103,7 @@ struct Parser
 	ProdElList *curProdElList;
 
 	PredType predType;
+	ReCaptureVect reCaptureVect;
 };
 
 %% write token_defs;
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index fa46c9fc..b796318e 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -734,6 +734,9 @@ token_def:
 		region->tokenDefList.append( tokenDef );
 		tokEl->tokenDef = tokenDef;
 
+		tokenDef->reCaptureVect = reCaptureVect;
+		reCaptureVect.empty();
+
 		/* Create the object def for the token. */
 		ObjectDef *objectDef = new ObjectDef( ObjectDef::UserType, name, 
 				pd->objFieldMap, new ObjMethodMap(), pd->nextObjectId++ ); 
@@ -841,6 +844,9 @@ rl_def:
 		/* Generic creation of machine for instantiation and assignment. */
 		JoinOrLm *joinOrLm = new JoinOrLm( $4->join );
 		addRegularDef( $2->loc, namespaceStack.top(), $2->data, joinOrLm, false );
+
+		if ( reCaptureVect.length() > 0 )
+			error($1->loc) << "rl definitions cannot capture vars" << endl;
 	};
 
 type class token_data
@@ -1497,8 +1503,7 @@ opt_rl_join: rl_join opt_context
 
 		if ( $2->context != 0 ) {
 			/* Create the enter and leaving actions that will mark the substring. */
-			Action *mark = new Action( MarkMatchEnd, 0 );
-			mark->matchEndNum = pd->nextMatchEndNum++;
+			Action *mark = new Action( MarkMark, pd->nextMatchEndNum++ );
 			pd->actionList.append( mark );
 
 			$$->join->context = $2->context;
@@ -1636,14 +1641,16 @@ factor_with_label:
 		pd->objFieldMap->insert( $1->data, objField );
 
 		/* Create the enter and leaving actions that will mark the substring. */
-		Action *enter = new Action( MarkEnter, objField );
-		Action *leave = new Action( MarkLeave, objField );
+		Action *enter = new Action( MarkMark, pd->nextMatchEndNum++ );
+		Action *leave = new Action( MarkMark, pd->nextMatchEndNum++ );
 		pd->actionList.append( enter );
 		pd->actionList.append( leave );
 		
 		/* Add entering and leaving actions. */
 		$$->factorWithAug->actions.append( ParserAction( $1->loc, at_start, 0, enter ) );
 		$$->factorWithAug->actions.append( ParserAction( $1->loc, at_leave, 0, leave ) );
+
+		reCaptureVect.append( ReCapture( objField, enter, leave ) );
 	};
 
 nonterm factor_with_ep
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 855855fd..93fe2de0 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -279,6 +279,7 @@ struct PdaLiteral
 	long value;
 };
 
+
 /* Forwards. */
 using std::ostream;
 
@@ -299,7 +300,7 @@ public:
 		name(name),
 		markType(MarkNone),
 		objField(0),
-		matchEndNum(0),
+		markId(-1),
 		inlineList(inlineList), 
 		actionId(-1),
 		numTransRefs(0),
@@ -312,12 +313,12 @@ public:
 	{
 	}
 
-	Action( MarkType markType, ObjField *objField )
+	Action( MarkType markType, long markId )
 	:
 		name("mark"),
 		markType(markType),
-		objField(objField),
-		matchEndNum(0),
+		objField(0),
+		markId(markId),
 		inlineList(new InlineList), 
 		actionId(-1),
 		numTransRefs(0),
@@ -339,7 +340,7 @@ public:
 	
 	MarkType markType;
 	ObjField *objField;
-	long matchEndNum;
+	long markId;
 
 	InlineList *inlineList;
 	int actionId;
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 86324848..ece6ac5f 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -271,6 +271,18 @@ struct NamespaceQual
 	Namespace *getQual( ParseData *pd );
 };
 
+struct ReCapture
+{
+	ReCapture( ObjField *objField, Action *markEnter, Action *markLeave )
+		: objField(objField), markEnter(markEnter), markLeave(markLeave) {}
+
+	ObjField *objField;
+	Action *markEnter;
+	Action *markLeave;
+};
+
+typedef Vector<ReCapture> ReCaptureVect;
+
 struct TokenDef
 {
 	TokenDef( Join *join, KlangEl *token, InputLoc &semiLoc, 
@@ -295,6 +307,7 @@ struct TokenDef
 	bool inLmSelect;
 	Namespace *nspace;
 	TokenRegion *tokenRegion;
+	ReCaptureVect reCaptureVect;
 
 	TokenDef *prev, *next;
 };
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 99c20bad..07449330 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1411,10 +1411,11 @@ void ParseData::makeRuntimeData()
 			runtimeData->lelInfo[i].termDupId = lel->termDup == 0 ? 0 : lel->termDup->id;
 			runtimeData->lelInfo[i].genericId = lel->generic == 0 ? 0 : lel->generic->id;
 
-			if ( lel->tokenDef != 0 && lel->tokenDef->join != 0 && lel->tokenDef->join->context != 0 )
-				runtimeData->lelInfo[i].matchEnd = lel->tokenDef->join->mark->matchEndNum;
+			if ( lel->tokenDef != 0 && lel->tokenDef->join != 0 && 
+					lel->tokenDef->join->context != 0 )
+				runtimeData->lelInfo[i].markId = lel->tokenDef->join->mark->markId;
 			else
-				runtimeData->lelInfo[i].matchEnd = -1;
+				runtimeData->lelInfo[i].markId = -1;
 		}
 		else {
 			memset(&runtimeData->lelInfo[i], 0, sizeof(LangElInfo) );
@@ -1505,6 +1506,8 @@ void ParseData::makeRuntimeData()
 		runtimeData->litlen[el->value] = el->key.length();
 	}
 
+	/* FIXME: Captured attributes go here. */
+
 	runtimeData->fsmTables = fsmTables;
 	runtimeData->pdaTables = pdaTables;
 
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 62a8b8df..34d79061 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -193,7 +193,7 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTable
 
 		out << runtimeData->lelInfo[i].genericId << ", ";
 
-		out << runtimeData->lelInfo[i].matchEnd;
+		out << runtimeData->lelInfo[i].markId;
 
 		out << " }";
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index a52edfbc..528f7073 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -353,7 +353,7 @@ struct LangElInfo
 
 	long termDupId;
 	long genericId;
-	long matchEnd;
+	long markId;
 };
 
 struct ObjFieldInfo
@@ -387,6 +387,13 @@ struct RegionInfo
 	long eofFrameId;
 };
 
+struct CaptureAttr
+{
+	long mark_enter;
+	long mark_leave;
+	long offset;
+};
+
 struct RuntimeData
 {
 	LangElInfo *lelInfo;
@@ -421,6 +428,8 @@ struct RuntimeData
 	Head **literals;
 	long numLiterals;
 
+//	CaptureAttr *captureAttr;
+
 	FsmTables *fsmTables;
 	PdaTables *pdaTables;
 	int *startStates;
diff --git a/colm/redbuild.cpp b/colm/redbuild.cpp
index 2df68aea..47b8c60d 100644
--- a/colm/redbuild.cpp
+++ b/colm/redbuild.cpp
@@ -432,7 +432,7 @@ void RedFsmBuild::newAction( int anum, char *name, int line, int col, Action *ac
 	redFsm->allActions[anum].inlineList = action->inlineList;
 	redFsm->allActions[anum].objField = action->objField;
 	redFsm->allActions[anum].markType = action->markType;
-	redFsm->allActions[anum].matchEndNum = action->matchEndNum;
+	redFsm->allActions[anum].markId = action->markId;
 }
 
 void RedFsmBuild::makeAction( Action *action )
diff --git a/colm/redfsm.h b/colm/redfsm.h
index 4ddb0dbf..305b67f9 100644
--- a/colm/redfsm.h
+++ b/colm/redfsm.h
@@ -67,7 +67,7 @@ struct GenAction
 		actionId(0),
 		markType(MarkNone),
 		objField(0),
-		matchEndNum(0),
+		markId(-1),
 		numTransRefs(0),
 		numToStateRefs(0),
 		numFromStateRefs(0),
@@ -82,7 +82,7 @@ struct GenAction
 	int actionId;
 	MarkType markType;
 	ObjField *objField;
-	long matchEndNum;
+	long markId;
 
 	string nameOrLoc();
 
-- 
cgit v1.2.1


From 208a0090dd0f6c12776eeb032f4f06f25f630a79 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sat, 28 Feb 2009 04:18:09 +0000
Subject: Capture info now propagated to the runtime data. In make token, the
 LEL's list of captures is used to create the attributes. No longer relying on
 the end markers. That scheme was wrong since the index of the end marker
 can't correctly correspond to the attribute offset, otherwise there could be
 interference among tokens.

---
 colm/fsmrun.cpp     | 20 +++++++++++---------
 colm/lmparse.kl     |  2 +-
 colm/parsetree.h    |  6 +++---
 colm/pdabuild.cpp   | 25 +++++++++++++++++++++++--
 colm/pdacodegen.cpp | 19 ++++++++++++++++++-
 colm/pdarun.h       |  5 ++++-
 6 files changed, 60 insertions(+), 17 deletions(-)

diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 0f20b8cc..fc9c45d2 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -511,15 +511,17 @@ Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 	/* No children and ignores get added later. */
 	input->tree->child = attrs;
 
-//	/* Set attributes for the labelled components. */
-//	for ( int i = 0; i < 32; i++ ) {
-//		if ( mark_leave[i] != 0 ) {
-//			Head *data = string_alloc_new( prg, 
-//					mark_enter[i], mark_leave[i] - mark_enter[i] );
-//			set_attr( input->tree, i, construct_string( prg, data ) );
-//			tree_upref( get_attr( input->tree, i ) );
-//		}
-//	}
+	LangElInfo *lelInfo = parser->tables->rtd->lelInfo;
+	if ( lelInfo[id].numCaptureAttr > 0 ) {
+		for ( int i = 0; i < lelInfo[id].numCaptureAttr; i++ ) {
+			CaptureAttr *ca = &parser->tables->rtd->captureAttr[lelInfo[id].captureAttr + i];
+			Head *data = string_alloc_new( prg, 
+					mark[ca->mark_enter], mark[ca->mark_leave] - mark[ca->mark_enter] );
+			Tree *string = construct_string( prg, data );
+			set_attr( input->tree, ca->offset, string );
+			tree_upref( string );
+		}
+	}
 	
 	/* If the item is bound then store it in the bindings array. */
 	if ( bindId > 0 ) {
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index b796318e..04e64d65 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -1650,7 +1650,7 @@ factor_with_label:
 		$$->factorWithAug->actions.append( ParserAction( $1->loc, at_start, 0, enter ) );
 		$$->factorWithAug->actions.append( ParserAction( $1->loc, at_leave, 0, leave ) );
 
-		reCaptureVect.append( ReCapture( objField, enter, leave ) );
+		reCaptureVect.append( ReCapture( enter, leave, objField ) );
 	};
 
 nonterm factor_with_ep
diff --git a/colm/parsetree.h b/colm/parsetree.h
index ece6ac5f..86f81e7f 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -273,12 +273,12 @@ struct NamespaceQual
 
 struct ReCapture
 {
-	ReCapture( ObjField *objField, Action *markEnter, Action *markLeave )
-		: objField(objField), markEnter(markEnter), markLeave(markLeave) {}
+	ReCapture( Action *markEnter, Action *markLeave, ObjField *objField )
+		: markEnter(markEnter), markLeave(markLeave), objField(objField)  {}
 
-	ObjField *objField;
 	Action *markEnter;
 	Action *markLeave;
+	ObjField *objField;
 };
 
 typedef Vector<ReCapture> ReCaptureVect;
diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index 07449330..d824c7d5 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1506,7 +1506,29 @@ void ParseData::makeRuntimeData()
 		runtimeData->litlen[el->value] = el->key.length();
 	}
 
-	/* FIXME: Captured attributes go here. */
+	/* Captured attributes. Loop over tokens and count first. */
+	long numCapturedAttr = 0;
+	for ( RegionList::Iter reg = regionList; reg.lte(); reg++ ) {
+		for ( TokenDefList::Iter td = reg->tokenDefList; td.lte(); td++ )
+			numCapturedAttr += td->reCaptureVect.length();
+	}
+	runtimeData->captureAttr = new CaptureAttr[numCapturedAttr];
+	runtimeData->numCapturedAttr = numCapturedAttr;
+
+	count = 0;
+	for ( RegionList::Iter reg = regionList; reg.lte(); reg++ ) {
+		for ( TokenDefList::Iter td = reg->tokenDefList; td.lte(); td++ ) {
+			runtimeData->lelInfo[td->token->id].captureAttr = count;
+			runtimeData->lelInfo[td->token->id].numCaptureAttr = td->reCaptureVect.length();
+			for ( ReCaptureVect::Iter c = td->reCaptureVect; c.lte(); c++ ) {
+				runtimeData->captureAttr[count].mark_enter = c->markEnter->markId;
+				runtimeData->captureAttr[count].mark_leave = c->markLeave->markId;
+				runtimeData->captureAttr[count].offset = c->objField->offset;
+
+				count += 1;
+			}
+		}
+	}
 
 	runtimeData->fsmTables = fsmTables;
 	runtimeData->pdaTables = pdaTables;
@@ -1520,7 +1542,6 @@ void ParseData::makeRuntimeData()
 			runtimeData->eofLelIds[lel->parserId] = lel->eofLel->id;
 		}
 	}
-		
 
 	runtimeData->globalSize = globalObjectDef->size();
 
diff --git a/colm/pdacodegen.cpp b/colm/pdacodegen.cpp
index 34d79061..04a980ba 100644
--- a/colm/pdacodegen.cpp
+++ b/colm/pdacodegen.cpp
@@ -193,7 +193,11 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTable
 
 		out << runtimeData->lelInfo[i].genericId << ", ";
 
-		out << runtimeData->lelInfo[i].markId;
+		out << runtimeData->lelInfo[i].markId << ", ";
+
+		out << runtimeData->lelInfo[i].captureAttr << ", ";
+
+		out << runtimeData->lelInfo[i].numCaptureAttr;
 
 		out << " }";
 
@@ -370,6 +374,16 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTable
 	}
 	out << "};\n\n";
 
+	out << "CaptureAttr captureAttr[] = {\n";
+	for ( long i = 0; i < runtimeData->numCapturedAttr; i++ ) {
+		out << "\t{ " << 
+			runtimeData->captureAttr[i].mark_enter << ", " <<
+			runtimeData->captureAttr[i].mark_leave << ", " <<
+			runtimeData->captureAttr[i].offset  << " },\n";
+	}
+
+	out << "};\n\n";
+
 	out <<
 		"RuntimeData main_runtimeData = \n"
 		"{\n"
@@ -405,6 +419,9 @@ void PdaCodeGen::writeRuntimeData( RuntimeData *runtimeData, PdaTables *pdaTable
 		"	" << literals() << ",\n"
 		"	" << runtimeData->numLiterals << ",\n"
 		"\n"
+		"	captureAttr,\n"
+		"	" << runtimeData->numCapturedAttr << ",\n"
+		"\n"
 		"	&fsmTables_start,\n"
 		"	&pid_0_pdaTables,\n"
 		"	startStates, eofLelIds, " << runtimeData->numParsers << ",\n"
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 528f7073..30f5b0d2 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -354,6 +354,8 @@ struct LangElInfo
 	long termDupId;
 	long genericId;
 	long markId;
+	long captureAttr;
+	long numCaptureAttr;
 };
 
 struct ObjFieldInfo
@@ -428,7 +430,8 @@ struct RuntimeData
 	Head **literals;
 	long numLiterals;
 
-//	CaptureAttr *captureAttr;
+	CaptureAttr *captureAttr;
+	long numCapturedAttr;
 
 	FsmTables *fsmTables;
 	PdaTables *pdaTables;
-- 
cgit v1.2.1


From f067b4e5d7039c37e6cfb199d442862c0819b889 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 1 Mar 2009 02:42:25 +0000
Subject: Include captured attributes in constructor patterns and add them to
 the constructed tree at runtime.

---
 colm/pdabuild.cpp | 19 +++++++++++++++++++
 colm/tree.cpp     | 13 +++++++++++++
 2 files changed, 32 insertions(+)

diff --git a/colm/pdabuild.cpp b/colm/pdabuild.cpp
index d824c7d5..d22a7db3 100644
--- a/colm/pdabuild.cpp
+++ b/colm/pdabuild.cpp
@@ -1569,6 +1569,9 @@ void mapNodes( Program *prg, int &count, Kid *kid )
 			count += 1;
 			ignore = ignore->next;
 		}
+		
+		count += prg->rtd->lelInfo[kid->tree->id].numCaptureAttr;
+
 		mapNodes( prg, count, tree_child( prg, kid->tree ) );
 		mapNodes( prg, count, kid->next );
 	}
@@ -1590,6 +1593,7 @@ void fillNodes( Program *prg, Bindings &bindings, long &bindId,
 		node.length = string_length( kid->tree->tokdata );
 		node.data = string_data( kid->tree->tokdata );
 
+		/* Ignore items. */
 		Kid *ignore = tree_ignore( prg, kid->tree );
 		node.ignore = ignore == 0 ? -1 : ind;
 
@@ -1606,6 +1610,21 @@ void fillNodes( Program *prg, Bindings &bindings, long &bindId,
 			ignore = ignore->next;
 		}
 
+		/* The captured attributes. */
+		for ( int i = 0; i < prg->rtd->lelInfo[kid->tree->id].numCaptureAttr; i++ ) {
+			CaptureAttr *cap = prg->rtd->captureAttr + 
+					prg->rtd->lelInfo[kid->tree->id].captureAttr + i;
+
+			Tree *attr = get_attr( kid->tree, cap->offset );
+
+			PatReplNode &node = nodes[ind++];
+			memset( &node, 0, sizeof(PatReplNode) );
+
+			node.id = attr->id;
+			node.length = string_length( attr->tokdata );
+			node.data = string_data( attr->tokdata );
+		}
+
 		node.stop = kid->tree->flags & AF_TERM_DUP;
 
 		/* Recurse. */
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 42bcec9b..434a34f6 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -259,6 +259,19 @@ Tree *construct_replacement_tree( Tree **bindings, Program *prg, long pat )
 
 		tree->child = kid_list_concat( attrs, 
 				kid_list_concat( ignore, child ) );
+
+		for ( int i = 0; i < lelInfo[tree->id].numCaptureAttr; i++ ) {
+			long ci = pat+1+i;
+			CaptureAttr *ca = prg->rtd->captureAttr + lelInfo[tree->id].captureAttr + i;
+			Tree *attr = prg->treePool.allocate();
+			attr->id = nodes[ci].id;
+			attr->refs = 1;
+			attr->tokdata = nodes[ci].length == 0 ? 0 :
+					string_alloc_const( prg, 
+					nodes[ci].data, nodes[ci].length );
+
+			set_attr( tree, ca->offset, attr );
+		}
 	}
 
 	return tree;
-- 
cgit v1.2.1


From d7884f1080497f0432dbe7b6226c5294c5a98f9b Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Sun, 1 Mar 2009 03:44:49 +0000
Subject: Added objFieldList so that object attributes have their offsets
 ordered as they appear. Otherwise the args to make_token need to be sorted
 according to the alphabetical sort of the attribute names. Also, debugging
 gets harder with an alphabetical sort and this has caused me problems on more
 than one occasion.

---
 colm/compile.cpp | 34 ++++++++++++++++++++++++++--------
 colm/lmparse.kl  | 19 ++++++++++++++-----
 colm/parsedata.h |  1 +
 colm/parsetree.h |  9 +++++++--
 4 files changed, 48 insertions(+), 15 deletions(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index 2a9b810e..5fce43ce 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -1861,6 +1861,7 @@ void ParseData::addProdRedObjectVar( ObjectDef *localFrame, KlangEl *nonTerm )
 	initLocalInstructions( el );
 
 	localFrame->objFieldMap->insert( el->name, el );
+	localFrame->objFieldList->append( el );
 }
 
 void ParseData::addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList )
@@ -1884,6 +1885,7 @@ void ParseData::addProdRHSVars( ObjectDef *localFrame, ProdElList *prodElList )
 			el->inGetR = IN_GET_LOCAL_R;
 
 			localFrame->objFieldMap->insert( el->name, el );
+			localFrame->objFieldList->append( el );
 		}
 	}
 }
@@ -1901,6 +1903,7 @@ void ParseData::addMatchLength( ObjectDef *frame, KlangEl *lel )
 	el->useOffset = false;
 	el->inGetR    = IN_GET_MATCH_LENGTH_R;
 	frame->objFieldMap->insert( el->name, el );
+	frame->objFieldList->append( el );
 }
 
 void ParseData::addMatchText( ObjectDef *frame, KlangEl *lel )
@@ -1916,6 +1919,7 @@ void ParseData::addMatchText( ObjectDef *frame, KlangEl *lel )
 	el->useOffset = false;
 	el->inGetR    = IN_GET_MATCH_TEXT_R;
 	frame->objFieldMap->insert( el->name, el );
+	frame->objFieldList->append( el );
 }
 
 void ParseData::initFieldInstructions( ObjField *el )
@@ -1944,9 +1948,10 @@ void ParseData::initLocalRefInstructions( ObjField *el )
 void ParseData::initIntObject( )
 {
 	ObjFieldMap *fieldMap = new ObjFieldMap;
+	ObjFieldList *fieldList = new ObjFieldList;
 	ObjMethodMap *methodMap = new ObjMethodMap;
 	intObj = new ObjectDef( ObjectDef::BuiltinType, "int", 
-			fieldMap, methodMap, nextObjectId++ );
+			fieldMap, fieldList, methodMap, nextObjectId++ );
 	intKlangEl->objectDef = intObj;
 
 	initFunction( uniqueTypeStr, intObj, "to_string", IN_INT_TO_STR, IN_INT_TO_STR, true );
@@ -1966,14 +1971,16 @@ void ParseData::addLengthField( ObjectDef *objDef, Code getLength )
 	el->inGetR = getLength;
 
 	objDef->objFieldMap->insert( el->name, el );
+	objDef->objFieldList->append( el );
 }
 
 void ParseData::initStrObject( )
 {
 	ObjFieldMap *fieldMap = new ObjFieldMap;
+	ObjFieldList *fieldList = new ObjFieldList;
 	ObjMethodMap *methodMap = new ObjMethodMap;
 	strObj = new ObjectDef( ObjectDef::BuiltinType, "str", 
-			fieldMap, methodMap, nextObjectId++ );
+			fieldMap, fieldList, methodMap, nextObjectId++ );
 	strKlangEl->objectDef = strObj;
 
 	initFunction( uniqueTypeInt, strObj, "atoi",   IN_STR_ATOI, IN_STR_ATOI, true );
@@ -1989,9 +1996,10 @@ void ParseData::initStrObject( )
 void ParseData::initStreamObject( )
 {
 	ObjFieldMap *fieldMap = new ObjFieldMap;
+	ObjFieldList *fieldList = new ObjFieldList;
 	ObjMethodMap *methodMap = new ObjMethodMap;
 	streamObj = new ObjectDef( ObjectDef::BuiltinType, "stream", 
-			fieldMap, methodMap, nextObjectId++ );
+			fieldMap, fieldList, methodMap, nextObjectId++ );
 	streamKlangEl->objectDef = streamObj;
 
 //	initFunction( uniqueTypeInt, strObj, "atoi",   IN_STR_ATOI, IN_STR_ATOI, true );
@@ -2043,15 +2051,18 @@ void ParseData::initTokenObjects( )
 {
 	/* Make a default object Definition. */
 	ObjFieldMap *fieldMap = new ObjFieldMap;
+	ObjFieldList *fieldList = new ObjFieldList;
 	ObjMethodMap *methodMap = new ObjMethodMap;
-	tokenObj = new ObjectDef( ObjectDef::BuiltinType, "token", fieldMap, 
+	tokenObj = new ObjectDef( ObjectDef::BuiltinType, "token", fieldMap, fieldList,
 			methodMap, nextObjectId++ );
 
 	ObjField *dataEl = makeDataEl();
 	tokenObj->objFieldMap->insert( dataEl->name, dataEl );
+	tokenObj->objFieldList->append( dataEl );
 
 	ObjField *posEl = makePosEl();
 	tokenObj->objFieldMap->insert( posEl->name, posEl );
+	tokenObj->objFieldList->append( posEl );
 
 
 	/* Give all user terminals the token object type. */
@@ -2063,10 +2074,12 @@ void ParseData::initTokenObjects( )
 				/* Create the "data" field. */
 				ObjField *dataEl = makeDataEl();
 				lel->objectDef->objFieldMap->insert( dataEl->name, dataEl );
+				lel->objectDef->objFieldList->append( dataEl );
 
 				/* Create the "pos" field. */
 				ObjField *posEl = makePosEl();
 				lel->objectDef->objFieldMap->insert( posEl->name, posEl );
+				lel->objectDef->objFieldList->append( posEl );
 			}
 		}
 	}
@@ -2305,13 +2318,13 @@ void ParseData::initAllLanguageObjects()
 		ObjectDef *obj = lel->objectDef;
 		if ( obj != 0 ) {
 			/* Init all fields of the object. */
-			for ( ObjFieldMap::Iter f = *obj->objFieldMap; f.lte(); f++ )
+			for ( ObjFieldList::Iter f = *obj->objFieldList; f.lte(); f++ )
 				obj->initField( this, f->value );
 		}
 	}
 
 	/* Init all fields of the global object. */
-	for ( ObjFieldMap::Iter f = *globalObjectDef->objFieldMap; f.lte(); f++ )
+	for ( ObjFieldList::Iter f = *globalObjectDef->objFieldList; f.lte(); f++ )
 		globalObjectDef->initField( this, f->value );
 }
 
@@ -2356,6 +2369,7 @@ void ParseData::initListField( GenericType *gen, const char *name, int offset )
 	el->inSetWV = IN_SET_LIST_MEM_WV;
 
 	gen->objDef->objFieldMap->insert( el->name, el );
+	gen->objDef->objFieldList->append( el );
 
 	el->useOffset = true;
 	el->beenReferenced = true;
@@ -2391,9 +2405,10 @@ void ParseData::resolveGenericTypes()
 				gen->keyUT = gen->keyTypeArg->lookupType( this );
 
 			ObjFieldMap *fieldMap = new ObjFieldMap;
+			ObjFieldList *fieldList = new ObjFieldList;
 			ObjMethodMap *methodMap = new ObjMethodMap;
 			gen->objDef = new ObjectDef( ObjectDef::BuiltinType, 
-					gen->name, fieldMap, methodMap, nextObjectId++ );
+					gen->name, fieldMap, fieldList, methodMap, nextObjectId++ );
 
 			switch ( gen->typeId ) {
 				case GEN_MAP: 
@@ -2429,6 +2444,7 @@ void ParseData::makeFuncVisible( Function *func, bool isUserIter )
 			error(param->loc) << "parameter " << param->name << " redeclared" << endp;
 
 		func->localFrame->objFieldMap->insert( param->name, param );
+		func->localFrame->objFieldList->append( param );
 		param->beenInitialized = true;
 		param->pos = paramPos;
 
@@ -2447,7 +2463,6 @@ void ParseData::makeFuncVisible( Function *func, bool isUserIter )
 	 * words containing the args. */
 	long paramOffset = 0;
 	for ( ParameterList::Iter param = *func->paramList; param.lte(); param++ ) {
-
 		/* Moving downward, and need the offset to point to the lower half of
 		 * the argument. */
 		paramOffset -= sizeOfField( paramUTs[param->pos] );
@@ -2649,6 +2664,7 @@ void ParseData::addStdin()
 	el->useOffset = false;
 	el->inGetR    = IN_GET_STDIN;
 	globalObjectDef->objFieldMap->insert( el->name, el );
+	globalObjectDef->objFieldList->append( el );
 }
 
 void ParseData::addStdout()
@@ -2664,6 +2680,7 @@ void ParseData::addStdout()
 	el->useOffset = false;
 	el->inGetR    = IN_GET_STDOUT;
 	globalObjectDef->objFieldMap->insert( el->name, el );
+	globalObjectDef->objFieldList->append( el );
 }
 
 void ParseData::addStderr()
@@ -2679,6 +2696,7 @@ void ParseData::addStderr()
 	el->useOffset = false;
 	el->inGetR    = IN_GET_STDERR;
 	globalObjectDef->objFieldMap->insert( el->name, el );
+	globalObjectDef->objFieldList->append( el );
 }
 
 void ParseData::initGlobalFunctions()
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 04e64d65..6f974c21 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -88,7 +88,8 @@ block_open: '{'
 	final {
 		/* Init the object representing the local frame. */
 		$$->localFrame = new ObjectDef( ObjectDef::FrameType, 
-				"local", new ObjFieldMap(), new ObjMethodMap(), pd->nextObjectId++ );
+				"local", new ObjFieldMap(), new ObjFieldList, 
+				new ObjMethodMap(), pd->nextObjectId++ );
 		pd->curLocalFrame = $$->localFrame;
 	};
 
@@ -239,6 +240,7 @@ global_def: KW_Global var_def opt_def_init
 			error($2->objField->loc) << "object field renamed" << endp;
 
 		globalObj->objFieldMap->insert( $2->objField->name, $2->objField );
+		globalObj->objFieldList->append( $2->objField );
 
 		if ( $3->expr != 0 ) {
 			LangVarRef *varRef = new LangVarRef( $2->objField->loc, 
@@ -296,7 +298,7 @@ cfl_def: cfl_def_head obj_var_list properties_list cfl_prod_list
 
 		/* Make a new object definition. */
 		ObjectDef *objectDef = new ObjectDef( ObjectDef::UserType, curDefineId, 
-				pd->objFieldMap, new ObjMethodMap(), pd->nextObjectId++ ); 
+				pd->objFieldMap, pd->objFieldList, new ObjMethodMap(), pd->nextObjectId++ ); 
 
 		langEl->objectDef = objectDef;
 	};
@@ -360,11 +362,13 @@ obj_var_list: obj_var_list var_def
 			error() << "object field renamed" << endp;
 
 		pd->objFieldMap->insert( $2->objField->name, $2->objField );
+		pd->objFieldList->append( $2->objField );
 	};
 
 obj_var_list:
 	final {
 		pd->objFieldMap = new ObjFieldMap;
+		pd->objFieldList = new ObjFieldList;
 	};
 
 
@@ -487,6 +491,7 @@ pattern_el: opt_label pattern_el_type_or_lit
 
 			/* Insert it into the field map. */
 			pd->curLocalFrame->objFieldMap->insert( $1->varRef->name, objField );
+			pd->curLocalFrame->objFieldList->append( objField );
 		}
 	};
 
@@ -739,7 +744,7 @@ token_def:
 
 		/* Create the object def for the token. */
 		ObjectDef *objectDef = new ObjectDef( ObjectDef::UserType, name, 
-				pd->objFieldMap, new ObjMethodMap(), pd->nextObjectId++ ); 
+				pd->objFieldMap, pd->objFieldList, new ObjMethodMap(), pd->nextObjectId++ ); 
 
 		tokEl->objectDef = objectDef;
 
@@ -973,6 +978,7 @@ statement: var_def opt_def_init
 
 		/* Insert it into the field map. */
 		pd->curLocalFrame->objFieldMap->insert( $1->objField->name, $1->objField );
+		pd->curLocalFrame->objFieldList->append( $1->objField );
 
 		if ( $2->expr != 0 ) {
 			LangVarRef *varRef = new LangVarRef( $1->objField->loc, 
@@ -1025,6 +1031,7 @@ statement: KW_For TK_Word ':' type_ref KW_In iter_call block_or_single
 		 * to the iterator that is called. This lookup is done at compile time. */
 		ObjField *iterField = new ObjField( $2->loc, (TypeRef*)0, $2->data );
 		pd->curLocalFrame->objFieldMap->insert( $2->data, iterField );
+		pd->curLocalFrame->objFieldList->append( iterField );
 
 		$$->stmt = new LangStmt( $1->loc, LangStmt::ForIterType, 
 				iterField, $4->typeRef, $6->langTerm, $7->stmtList );
@@ -1639,6 +1646,7 @@ factor_with_label:
 
 		/* Insert it into the map. */
 		pd->objFieldMap->insert( $1->data, objField );
+		pd->objFieldList->append( objField );
 
 		/* Create the enter and leaving actions that will mark the substring. */
 		Action *enter = new Action( MarkMark, pd->nextMatchEndNum++ );
@@ -2001,8 +2009,9 @@ void Parser::init()
 	/* Set up the global object. */
 	String global = "global";
 	ObjFieldMap *objFieldMap = new ObjFieldMap;
+	ObjFieldList *objFieldList = new ObjFieldList;
 	pd->globalObjectDef = new ObjectDef( ObjectDef::UserType, global, 
-			objFieldMap, new ObjMethodMap(), pd->nextObjectId++ ); 
+			objFieldMap, objFieldList, new ObjMethodMap(), pd->nextObjectId++ ); 
 	
 	/* The eofTokenRegion defaults to the root region. */
 	pd->eofTokenRegion = rootRegion;
@@ -2014,7 +2023,7 @@ void Parser::init()
 	pd->initGraphDict();
 
 	pd->rootLocalFrame = new ObjectDef( ObjectDef::FrameType, 
-				"local", new ObjFieldMap(), new ObjMethodMap(), 
+				"local", new ObjFieldMap(), new ObjFieldList(), new ObjMethodMap(), 
 				pd->nextObjectId++ );
 	pd->curLocalFrame = pd->rootLocalFrame;
 
diff --git a/colm/parsedata.h b/colm/parsedata.h
index 93fe2de0..8d4dcb23 100644
--- a/colm/parsedata.h
+++ b/colm/parsedata.h
@@ -916,6 +916,7 @@ struct ParseData
 
 	long nextLabelId;
 	ObjFieldMap *objFieldMap;
+	ObjFieldList *objFieldList;
 
 	bool revertOn;
 
diff --git a/colm/parsetree.h b/colm/parsetree.h
index 86f81e7f..87880364 100644
--- a/colm/parsetree.h
+++ b/colm/parsetree.h
@@ -30,6 +30,7 @@
 #include "bstset.h"
 #include "vector.h"
 #include "dlist.h"
+#include "dlistval.h"
 #include "astring.h"
 #include "bytecode.h"
 #include "avlbasic.h"
@@ -1247,6 +1248,8 @@ struct ObjField
 typedef AvlMap<String, ObjField*, CmpStr> ObjFieldMap;
 typedef AvlMapEl<String, ObjField*> ObjFieldMapEl;
 
+typedef DListVal<ObjField*> ObjFieldList;
+
 typedef DList<ObjField> ParameterList; 
 
 struct TemplateType;
@@ -1261,14 +1264,16 @@ struct ObjectDef
 	};
 
 	ObjectDef( Type type, String name, 
-			ObjFieldMap *objFieldMap, ObjMethodMap *objMethodMap, int id )
+			ObjFieldMap *objFieldMap, ObjFieldList *objFieldList, 
+			ObjMethodMap *objMethodMap, int id )
 	:
-		type(type), name(name), objFieldMap(objFieldMap), 
+		type(type), name(name), objFieldMap(objFieldMap), objFieldList(objFieldList),
 		objMethodMap(objMethodMap), id(id), nextOffset(0) {}
 
 	Type type;
 	String name;
 	ObjFieldMap *objFieldMap;	
+	ObjFieldList *objFieldList;
 	ObjMethodMap *objMethodMap;	
 
 	long id;
-- 
cgit v1.2.1


From db51647c541b6a0827d2791e82232a55dc140aed Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Mon, 2 Mar 2009 03:46:28 +0000
Subject: Regex subexpression captures are now bound as local variables in
 token generation actions.

---
 colm/bytecode.cpp | 30 ++++++++++++++++++++++++++++--
 colm/bytecode.h   |  5 ++++-
 colm/compile.cpp  |  9 +++++++++
 colm/fsmrun.cpp   | 14 +++++++-------
 colm/lmparse.kl   | 15 ++++++++++++++-
 colm/pdarun.cpp   |  4 ++--
 6 files changed, 64 insertions(+), 13 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 08a1ac98..75417880 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -402,7 +402,7 @@ void Program::run()
 
 	if ( rtd->rootCodeLen > 0 ) {
 		CodeVect reverseCode;
-		Execution execution( this, reverseCode, 0, rtd->rootCode, 0, 0 );
+		Execution execution( this, reverseCode, 0, rtd->rootCode, 0, 0, 0 );
 		execution.execute( root );
 
 		/* Pull out the reverse code and free it. */
@@ -422,7 +422,7 @@ void Program::run()
 }
 
 Execution::Execution( Program *prg, CodeVect &reverseCode,
-		PdaRun *parser, Code *code, Tree *lhs, Head *matchText )
+		PdaRun *parser, Code *code, Tree *lhs, long genId, Head *matchText )
 : 
 	prg(prg), 
 	parser(parser), 
@@ -430,6 +430,7 @@ Execution::Execution( Program *prg, CodeVect &reverseCode,
 	frame(0), iframe(0),
 	lhs(lhs),
 	parsed(0),
+	genId(genId),
 	matchText(matchText),
 	reject(false), 
 	reverseCode(reverseCode),
@@ -945,6 +946,31 @@ again:
 			push( prg->global );
 			break;
 		}
+		case IN_INIT_CAPTURES: {
+			uchar ncaps;
+			read_byte( ncaps );
+
+			#ifdef COLM_LOG_BYTECODE
+			if ( colm_log_bytecode ) {
+				cerr << "IN_INIT_CAPTURES " << ncaps << endl;
+			}
+			#endif
+
+			/* If there are captures (this is a translate block) then copy them into
+			 * the local frame now. */
+			LangElInfo *lelInfo = prg->rtd->lelInfo;
+			char **mark = parser->fsmRun->mark;
+
+			for ( int i = 0; i < lelInfo[genId].numCaptureAttr; i++ ) {
+				CaptureAttr *ca = &prg->rtd->captureAttr[lelInfo[genId].captureAttr + i];
+				Head *data = string_alloc_new( prg, 
+						mark[ca->mark_enter], mark[ca->mark_leave] - mark[ca->mark_enter] );
+				Tree *string = construct_string( prg, data );
+				tree_upref( string );
+				set_local( frame, -1 - i, string );
+			}
+			break;
+		}
 		case IN_INIT_RHS_EL: {
 			Half position;
 			short field;
diff --git a/colm/bytecode.h b/colm/bytecode.h
index 1b3eb02a..d7dc0d00 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -110,6 +110,7 @@ typedef unsigned char uchar;
 #define IN_GET_TOKEN_POS_R       0x35
 
 #define IN_INIT_RHS_EL           0x3b
+#define IN_INIT_CAPTURES         0xaa
 
 #define IN_TRITER_FROM_REF       0x3c
 #define IN_TRITER_ADVANCE        0x3d
@@ -688,7 +689,8 @@ struct Program
 struct Execution
 {
 	Execution( Program *prg, CodeVect &reverseCode,
-			PdaRun *parser, Code *code, Tree *lhs, Head *matchText );
+			PdaRun *parser, Code *code, Tree *lhs,
+			long genId, Head *matchText );
 
 	Program *prg;
 	PdaTables *pdaTables;
@@ -702,6 +704,7 @@ struct Execution
 	Tree *lhs;
 	Tree *parsed;
 
+	long genId;
 	Head *matchText;
 	bool reject;
 
diff --git a/colm/compile.cpp b/colm/compile.cpp
index 5fce43ce..d4d2f503 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -2208,6 +2208,15 @@ void ParseData::compileTranslateBlock( KlangEl *langEl )
 	code.append( IN_INIT_LOCALS );
 	code.appendHalf( 0 );
 
+	if ( langEl->tokenDef->reCaptureVect.length() > 0 ) {
+		code.append( IN_INIT_CAPTURES );
+		code.append( langEl->tokenDef->reCaptureVect.length() );
+
+		ObjFieldList::Iter f = *curLocalFrame->objFieldList;
+		for ( int i = 0; i < langEl->tokenDef->reCaptureVect.length(); i++, f++ )
+			curLocalFrame->referenceField( this, f->value );
+	}
+
 	/* Set the local frame and compile the reduce block. */
 	block->compile( this, code );
 
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index fc9c45d2..6f184b35 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -265,7 +265,7 @@ void FsmRun::sendBackIgnore( Kid *ignore )
 		/* Check for reverse code. */
 		if ( ignore->tree->flags & AF_HAS_RCODE ) {
 			Execution execution( prg, parser->reverseCode, 
-					parser, 0, 0, 0 );
+					parser, 0, 0, 0, 0 );
 
 			/* Do the reverse exeuction. */
 			execution.rexecute( parser->root, parser->allReverseCode );
@@ -307,7 +307,7 @@ void FsmRun::sendBack( Kid *input )
 	/* Check for reverse code. */
 	if ( input->tree->flags & AF_HAS_RCODE ) {
 		Execution execution( prg, parser->reverseCode, 
-				parser, 0, 0, 0 );
+				parser, 0, 0, 0, 0 );
 
 		/* Do the reverse exeuction. */
 		execution.rexecute( parser->root, parser->allReverseCode );
@@ -441,10 +441,10 @@ void FsmRun::sendNamedLangEl()
 	send_handle_error( this, parser, input );
 }
 
-void execute_generation_action( Program *prg, PdaRun *parser, Code *code, Head *tokdata )
+void execute_generation_action( Program *prg, PdaRun *parser, Code *code, long id, Head *tokdata )
 {
 	/* Execute the translation. */
-	Execution execution( prg, parser->reverseCode, parser, code, 0, tokdata );
+	Execution execution( prg, parser->reverseCode, parser, code, 0, id, tokdata );
 	execution.execute( parser->root );
 
 	/* If there is revese code but nothing generated we need a noToken. */
@@ -481,7 +481,7 @@ void FsmRun::generationAction( int id, Head *tokdata, bool namedLangEl, int bind
 			parser->tables->rtd->lelInfo[id].frameId].codeWV;
 
 	/* Execute the action and process the queue. */
-	execute_generation_action( prg, parser, code, tokdata );
+	execute_generation_action( prg, parser, code, id, tokdata );
 
 	/* Finished with the match text. */
 	string_free( prg, tokdata );
@@ -518,8 +518,8 @@ Kid *FsmRun::makeToken( int id, Head *tokdata, bool namedLangEl, int bindId )
 			Head *data = string_alloc_new( prg, 
 					mark[ca->mark_enter], mark[ca->mark_leave] - mark[ca->mark_enter] );
 			Tree *string = construct_string( prg, data );
-			set_attr( input->tree, ca->offset, string );
 			tree_upref( string );
+			set_attr( input->tree, ca->offset, string );
 		}
 	}
 	
@@ -772,7 +772,7 @@ void FsmRun::sendEOF( )
 		Code *code = parser->tables->rtd->frameInfo[frameId].codeWV;
 
 		/* Execute the action and process the queue. */
-		execute_generation_action( prg, parser, code, 0 );
+		execute_generation_action( prg, parser, code, input->tree->id, 0 );
 
 		/* Send the generated tokens. */
 		send_queued_tokens( this, parser );
diff --git a/colm/lmparse.kl b/colm/lmparse.kl
index 6f974c21..d4618c00 100644
--- a/colm/lmparse.kl
+++ b/colm/lmparse.kl
@@ -91,6 +91,20 @@ block_open: '{'
 				"local", new ObjFieldMap(), new ObjFieldList, 
 				new ObjMethodMap(), pd->nextObjectId++ );
 		pd->curLocalFrame = $$->localFrame;
+
+		/* Add captures to the local frame. We Depend on these becoming the
+		 * first local variables so we can compute their location. */
+
+		/* Make local variables corresponding to the local capture vector. */
+		for ( ReCaptureVect::Iter c = reCaptureVect; c.lte(); c++ )
+		{
+			ObjField *objField = new ObjField( c->objField->loc,
+					c->objField->typeRef, c->objField->name );
+
+			/* Insert it into the field map. */
+			pd->curLocalFrame->objFieldMap->insert( objField->name, objField );
+			pd->curLocalFrame->objFieldList->append( objField );
+		}
 	};
 
 block_close: '}' 
@@ -1987,7 +2001,6 @@ opt_commit: KW_Commit final { $$->commit = true; };
 
 void Parser::init()
 {
-
 	/* Set up the root namespace. */
 	const char *rootNamespaceName = "___ROOT_NAMESPACE";
 	Namespace *rootNamespace = new Namespace( InputLoc(), 
diff --git a/colm/pdarun.cpp b/colm/pdarun.cpp
index 07bd8d09..b85a32c0 100644
--- a/colm/pdarun.cpp
+++ b/colm/pdarun.cpp
@@ -463,7 +463,7 @@ again:
 
 			/* Execution environment for the reduction code. */
 			Execution execution( prg, reverseCode, 
-					this, fi->codeWV, redLel->tree, 0 );
+					this, fi->codeWV, redLel->tree, 0, 0 );
 
 			/* Execute it. */
 			execution.execute( root );
@@ -629,7 +629,7 @@ parseError:
 
 			/* Check for an execution environment. */
 			if ( undoLel->tree->flags & AF_HAS_RCODE ) {
-				Execution execution( prg, reverseCode, this, 0, 0, 0 );
+				Execution execution( prg, reverseCode, this, 0, 0, 0, 0 );
 
 				/* Do the reverse exeuction. */
 				execution.rexecute( root, allReverseCode );
-- 
cgit v1.2.1


From 82123d34d3bc28bce9e75be756acc016e6560561 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 4 Mar 2009 04:14:46 +0000
Subject: Bug fix: match_text was getting into the list of locals. It is loaded
 with a special bytecode and is not on the stack.

---
 colm/compile.cpp | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/colm/compile.cpp b/colm/compile.cpp
index d4d2f503..19f42293 100644
--- a/colm/compile.cpp
+++ b/colm/compile.cpp
@@ -2091,7 +2091,9 @@ void ParseData::findLocalTrees( CharSet &trees )
 	 * the frame is is cleaned and so it must survive. */
 	for ( ObjFieldMap::Iter of = *curLocalFrame->objFieldMap; of.lte(); of++ ) {
 		ObjField *el = of->value;
-		if ( !el->isLhsEl && el->beenReferenced ) {
+		/* FIXME: This test needs to be improved. Match_text was getting
+		 * through before useOffset was tested. What will? */
+		if ( el->useOffset && !el->isLhsEl && el->beenReferenced ) {
 			UniqueType *ut = el->typeRef->lookupType( this );
 			if ( ut->typeId == TYPE_TREE || ut->typeId == TYPE_PTR )
 				trees.insert( el->offset );
-- 
cgit v1.2.1


From a38bc6696d82b082d48125fb42340b4e8fc635da Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Wed, 4 Mar 2009 04:17:27 +0000
Subject: Eliminated PdaRun::run(). We should be pulling tokens from scanner
 and pushing them to the parser, rather than calling the scanner and pushing
 to the parser from there. This is a small start on that.

---
 colm/bytecode.cpp  | 2 +-
 colm/fsmrun.cpp    | 9 ++-------
 colm/parsedata.cpp | 4 ++--
 colm/pdarun.h      | 1 -
 4 files changed, 5 insertions(+), 11 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 75417880..7030d3a5 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -133,7 +133,7 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 {
 	PdaTables *tables = prg->rtd->pdaTables;
 	PdaRun parser( sp, prg, tables, parserId, stream->scanner, stopId, revertOn );
-	parser.run();
+	stream->scanner->run( &parser );
 	commit_full( &parser, 0 );
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
 	tree_upref( tree );
diff --git a/colm/fsmrun.cpp b/colm/fsmrun.cpp
index 6f184b35..7281c76b 100644
--- a/colm/fsmrun.cpp
+++ b/colm/fsmrun.cpp
@@ -805,13 +805,6 @@ void FsmRun::attachInputStream( InputStream *in )
 	inputStream->position = 0;
 }
 
-long PdaRun::run()
-{
-	/* PDA must be init first to set next region. */
-	init();
-	return fsmRun->run( this );
-}
-
 long PdaRun::undoParse( Tree *tree, CodeVect *rev )
 {
 	/* PDA must be init first to set next region. */
@@ -844,6 +837,8 @@ long FsmRun::run( PdaRun *destParser )
 	PdaRun *prevParser = parser;
 	parser = destParser;
 
+	parser->init();
+
 	act = 0;
 	tokstart = 0;
 	tokend = 0;
diff --git a/colm/parsedata.cpp b/colm/parsedata.cpp
index 19599e6b..32da2e5c 100644
--- a/colm/parsedata.cpp
+++ b/colm/parsedata.cpp
@@ -1698,7 +1698,7 @@ void ParseData::parsePatterns()
 
 		repl->pdaRun = new PdaRun( root, &program,
 				pdaTables, repl->langEl->parserId, &fsmRun, 0, false );
-		repl->pdaRun->run();
+		fsmRun.run( repl->pdaRun );
 
 			//#ifdef COLM_LOG_COMPILE
 			//if ( colm_log_compile ) {
@@ -1714,7 +1714,7 @@ void ParseData::parsePatterns()
 
 		pat->pdaRun = new PdaRun( root, &program,
 				pdaTables, pat->langEl->parserId, &fsmRun, 0, false );
-		pat->pdaRun->run();
+		fsmRun.run( pat->pdaRun );
 
 			//#ifdef COLM_LOG_COMPILE
 			//if ( colm_log_compile ) {
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 30f5b0d2..9baa5edb 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -524,7 +524,6 @@ struct PdaRun
 	void parseToken( Kid *input );
 	bool isParserStopFinished();
 	void match( Kid *tree, Kid *pattern );
-	long run();
 	long undoParse( Tree *tree, CodeVect *rev );
 
 	void send( Kid *kid );
-- 
cgit v1.2.1


From 70445937dd29d7f74e8a6dd82474f61fdb53b462 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 5 Mar 2009 02:50:16 +0000
Subject: Fixed open_file().

---
 colm/bytecode.cpp | 14 +++++++-------
 colm/bytecode.h   |  2 +-
 colm/pdarun.h     |  2 +-
 colm/tree.cpp     | 23 +++++++----------------
 4 files changed, 16 insertions(+), 25 deletions(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 7030d3a5..6a2816d8 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -132,7 +132,7 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 		long parserId, long stopId, CodeVect *&cv, bool revertOn )
 {
 	PdaTables *tables = prg->rtd->pdaTables;
-	PdaRun parser( sp, prg, tables, parserId, stream->scanner, stopId, revertOn );
+	PdaRun parser( sp, prg, tables, parserId, stream->fsmRun, stopId, revertOn );
 	stream->scanner->run( &parser );
 	commit_full( &parser, 0 );
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
@@ -157,14 +157,14 @@ void undo_parse( Tree **&sp, Program *prg, Stream *stream,
 		long parserId, Tree *tree, CodeVect *rev )
 {
 	PdaTables *tables = prg->rtd->pdaTables;
-	PdaRun parser( sp, prg, tables, parserId, stream->scanner, 0, false );
+	PdaRun parser( sp, prg, tables, parserId, stream->fsmRun, 0, false );
 	parser.undoParse( tree, rev );
 }
 
 Tree *stream_pull( Program *prg, Stream *stream, Tree *length )
 {
 	long len = ((Int*)length)->value;
-	Head *tokdata = stream->scanner->extractToken( len );
+	Head *tokdata = stream->fsmRun->extractToken( len );
 	return construct_string( prg, tokdata );
 }
 
@@ -172,20 +172,20 @@ void undo_pull( Program *prg, Stream *stream, Tree *str )
 {
 	const char *data = string_data( ( (Str*)str )->value );
 	long length = string_length( ( (Str*)str )->value );
-	stream->scanner->sendBackText( data, length );
+	stream->fsmRun->sendBackText( data, length );
 }
 
 Word stream_push( Tree **&sp, Program *prg, Stream *stream, Tree *any )
 {
 	std::stringstream ss;
 	print_tree( ss, sp, prg, any );
-	stream->scanner->streamPush( ss.str().c_str(), ss.str().size());
+	stream->fsmRun->streamPush( ss.str().c_str(), ss.str().size());
 	return ss.str().size();
 }
 
 void undo_stream_push( Tree **&sp, Program *prg, Stream *stream, Word len )
 {
-	stream->scanner->undoStreamPush( len );
+	stream->fsmRun->undoStreamPush( len );
 }
 
 void set_local( Tree **frame, long field, Tree *tree )
@@ -3196,7 +3196,7 @@ again:
 			#endif
 
 			Tree *name = pop();
-			Tree *res = open_file( prg, name );
+			Tree *res = (Tree*)open_file( prg, name );
 			tree_upref( res );
 			push( res );
 			tree_downref( prg, sp, name );
diff --git a/colm/bytecode.h b/colm/bytecode.h
index d7dc0d00..fc326906 100644
--- a/colm/bytecode.h
+++ b/colm/bytecode.h
@@ -465,7 +465,7 @@ Tree *construct_term( Program *prg, Word id, Head *tokdata );
 Tree *construct_replacement_tree( Tree **bindings, Program *prg, long pat );
 Tree *create_generic( Program *prg, long genericId );
 
-Tree *open_file( Program *prg, Tree *name );
+Stream *open_file( Program *prg, Tree *name );
 Stream *open_stream_fd( Program *prg, long fd );
 Stream *open_stream( Program *prg, FILE *file );
 
diff --git a/colm/pdarun.h b/colm/pdarun.h
index 9baa5edb..240d97a4 100644
--- a/colm/pdarun.h
+++ b/colm/pdarun.h
@@ -259,7 +259,7 @@ struct Stream
 
 	FILE *file;
 	InputStream *in;
-	FsmRun *scanner;
+	FsmRun *fsmRun;
 };
 
 /*
diff --git a/colm/tree.cpp b/colm/tree.cpp
index 434a34f6..f856ad3a 100644
--- a/colm/tree.cpp
+++ b/colm/tree.cpp
@@ -114,8 +114,8 @@ Stream *open_stream_file( Program *prg, FILE *file )
 	res->id = LEL_ID_STREAM;
 	res->file = file;
 	res->in = new InputStreamFile( file );
-	res->scanner = new FsmRun( prg );
-	res->scanner->attachInputStream( res->in );
+	res->fsmRun = new FsmRun( prg );
+	res->fsmRun->attachInputStream( res->in );
 	return res;
 }
 
@@ -124,25 +124,16 @@ Stream *open_stream_fd( Program *prg, long fd )
 	Stream *res = (Stream*)prg->mapElPool.allocate();
 	res->id = LEL_ID_STREAM;
 	res->in = new InputStreamFD( fd );
-	res->scanner = new FsmRun( prg );
-	res->scanner->attachInputStream( res->in );
+	res->fsmRun = new FsmRun( prg );
+	res->fsmRun->attachInputStream( res->in );
 	return res;
 }
 
-Tree *open_file( Program *prg, Tree *name )
+Stream *open_file( Program *prg, Tree *name )
 {
 	Head *head = ((Str*)name)->value;
 	FILE *file = fopen( string_data(head), "rb" );
-	Tree *res = 0;
-
-	if ( file != 0 ) {
-		res = (Tree*) open_stream_file( prg, file );
-		res = prg->treePool.allocate();
-		res->id = LEL_ID_STREAM;
-		((Stream *)res)->file = file;
-	}
-
-	return res;
+	return open_stream_file( prg, file );
 }
 
 Tree *construct_integer( Program *prg, long i )
@@ -647,7 +638,7 @@ void print_xml_tree( Tree **&sp, Program *prg, Tree *tree, bool commAttr )
 
 void stream_free( Program *prg, Stream *s )
 {
-	delete s->scanner;
+	delete s->fsmRun;
 	delete s->in;
 	if ( s->file != 0 )
 		fclose( s->file );
-- 
cgit v1.2.1


From a56c3a5d4b9b2139fb203b6adf93b93c88b75f52 Mon Sep 17 00:00:00 2001
From: Adrian Thurston <thurston@complang.org>
Date: Thu, 5 Mar 2009 03:34:39 +0000
Subject: Fixed broken build from last commit.

---
 colm/bytecode.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/colm/bytecode.cpp b/colm/bytecode.cpp
index 6a2816d8..03474e73 100644
--- a/colm/bytecode.cpp
+++ b/colm/bytecode.cpp
@@ -133,7 +133,7 @@ Tree *call_parser( Tree **&sp, Program *prg, Stream *stream,
 {
 	PdaTables *tables = prg->rtd->pdaTables;
 	PdaRun parser( sp, prg, tables, parserId, stream->fsmRun, stopId, revertOn );
-	stream->scanner->run( &parser );
+	stream->fsmRun->run( &parser );
 	commit_full( &parser, 0 );
 	Tree *tree = parser.getParsedRoot( stopId > 0 );
 	tree_upref( tree );
-- 
cgit v1.2.1