--- yapps2-2.1.1.orig/changelog
+++ yapps2-2.1.1/changelog
@@ -1,3 +1,304 @@
+ChangeSet
+  1.38 05/01/22 19:36:32 smurf@smurf.noris.de +2 -0
+  Add option to limit backtrace depth on syntax errors.
+
+  yapps/runtime.py
+    1.15 05/01/22 19:36:31 smurf@smurf.noris.de +5 -1
+    Add option to limit backtrace depth on syntax errors.
+
+  debian/changelog
+    1.20 05/01/22 19:36:31 smurf@smurf.noris.de +2 -1
+    Add option to limit backtrace depth on syntax errors.
+
+ChangeSet
+  1.37 05/01/22 03:39:56 smurf@smurf.noris.de +2 -0
+  Fix recursive includes.
+
+  yapps/runtime.py
+    1.14 05/01/22 03:39:54 smurf@smurf.noris.de +395 -381
+    Fix recursive includes.
+
+  debian/changelog
+    1.19 05/01/22 03:39:54 smurf@smurf.noris.de +6 -0
+    Fix recursive includes.
+
+ChangeSet
+  1.36 04/12/23 23:49:52 smurf@smurf.noris.de +1 -0
+  Brown paper bag -- fix Python 2.4 stuff.
+
+  debian/changelog
+    1.18 04/12/23 23:49:52 smurf@smurf.noris.de +6 -0
+    Brown paper bag -- fix Python 2.4 stuff.
+
+ChangeSet
+  1.35 04/12/23 21:00:34 smurf@smurf.noris.de +1 -0
+  typo
+
+  debian/control
+    1.10 04/12/23 21:00:33 smurf@smurf.noris.de +1 -1
+    typo
+
+ChangeSet
+  1.34 04/12/12 20:22:54 smurf@smurf.noris.de +2 -0
+  Add support for Python 2.4
+
+  debian/control
+    1.9 04/12/12 20:22:52 smurf@smurf.noris.de +1 -1
+    Add support for Python 2.4
+
+  debian/changelog
+    1.17 04/12/12 20:22:52 smurf@smurf.noris.de +6 -0
+    Add support for Python 2.4
+
+ChangeSet
+  1.33 04/09/23 11:24:16 smurf@smurf.noris.de +3 -0
+  update documentation:
+  - toss hyphens
+  - document extensions
+
+  doc/yapps2.tex
+    1.3 04/09/23 11:24:16 smurf@smurf.noris.de +21 -0
+    add a Debian Extensions section
+
+  debian/yapps.1
+    1.2 04/09/23 11:24:16 smurf@smurf.noris.de +14 -9
+    escape more hyphens (i.e., all the rest)
+
+  debian/changelog
+    1.16 04/09/23 11:24:16 smurf@smurf.noris.de +2 -0
+    update documentation:
+    - toss hyphens
+    - document extensions
+
+ChangeSet
+  1.32 04/09/23 11:23:24 smurf@smurf.noris.de +2 -0
+  turn off triggers
+
+  BitKeeper/triggers/pre-commit.upversion
+    1.2 04/09/23 11:23:24 smurf@smurf.noris.de +2 -0
+    off
+
+  BitKeeper/triggers/post-commit.changelog
+    1.2 04/09/23 11:23:24 smurf@smurf.noris.de +2 -0
+    off
+
+ChangeSet
+  1.31 04/09/23 10:55:24 smurf@smurf.noris.de +1 -0
+  ignore new package's files
+
+  BitKeeper/etc/ignore
+    1.17 04/09/23 10:55:23 smurf@smurf.noris.de +1 -0
+    added debian/yapps2-runtime/*
+
+  debian/yapps2-runtime.README
+    1.1 04/09/23 10:50:33 smurf@smurf.noris.de +11 -0
+
+ChangeSet
+  1.30 04/09/23 10:50:33 smurf@smurf.noris.de +8 -0
+  split off runtime to its own package
+  document the fact that I can't use the original runtime
+
+  debian/yapps2-runtime.dirs
+    1.6 04/09/23 10:50:33 smurf@smurf.noris.de +2 -4
+    split off runtime
+
+  debian/yapps2-runtime.README
+    1.0 04/09/23 10:50:33 smurf@smurf.noris.de +0 -0
+    BitKeeper file /daten/src/debian/python_yapps/debian/yapps2-runtime.README
+
+  debian/rules
+    1.5 04/09/23 10:50:33 smurf@smurf.noris.de +4 -1
+    move runtime files to their own package
+
+  debian/control
+    1.8 04/09/23 10:50:33 smurf@smurf.noris.de +14 -1
+    split off runtime to its own package
+
+  debian/changelog
+    1.15 04/09/23 10:50:33 smurf@smurf.noris.de +9 -0
+    document package split
+
+  debian/README
+    1.2 04/09/23 10:50:33 smurf@smurf.noris.de +21 -4
+    Updated for package split
+
+  debian/yapps2.docs
+    1.3 04/09/23 10:31:15 smurf@smurf.noris.de +0 -0
+    Rename: debian/docs -> debian/yapps2.docs
+
+  debian/yapps2-runtime.dirs
+    1.5 04/09/23 10:30:48 smurf@smurf.noris.de +0 -0
+    bk cp yapps2.dirs yapps2-runtime.dirs
+
+  debian/yapps2.dirs
+    1.4 04/09/23 10:30:42 smurf@smurf.noris.de +0 -0
+    Rename: debian/dirs -> debian/yapps2.dirs
+
+  debian/yapps2.dirs
+    1.4 04/09/23 10:30:42 smurf@smurf.noris.de +0 -0
+    Rename: debian/dirs -> debian/yapps2.dirs
+
+ChangeSet
+  1.29 04/07/19 09:30:22 smurf@smurf.noris.de +5 -0
+  latex2html => hevea
+
+  debian/yapps2.doc-base
+    1.2 04/07/19 09:30:21 smurf@smurf.noris.de +2 -2
+    latex2html => hevea
+
+  debian/rules
+    1.4 04/07/19 09:30:21 smurf@smurf.noris.de +4 -2
+    latex2html => hevea
+
+  debian/control
+    1.7 04/07/19 09:30:21 smurf@smurf.noris.de +1 -1
+    latex2html => hevea
+
+  debian/changelog
+    1.14 04/07/19 09:30:21 smurf@smurf.noris.de +6 -0
+    latex2html => hevea
+
+  BitKeeper/etc/ignore
+    1.16 04/07/19 09:30:06 smurf@smurf.noris.de +1 -0
+    added doc/yapps2.haux
+
+  BitKeeper/etc/ignore
+    1.15 04/07/19 09:29:55 smurf@smurf.noris.de +1 -0
+    added doc/yapps2.ht*
+
+ChangeSet
+  1.28 04/07/12 09:35:59 smurf@smurf.noris.de +2 -0
+  Build-Depend on python.
+
+  debian/control
+    1.6 04/07/12 09:35:58 smurf@smurf.noris.de +1 -1
+    Build-Depend on python.
+
+  debian/changelog
+    1.13 04/07/12 09:35:58 smurf@smurf.noris.de +6 -0
+    doc
+
+ChangeSet
+  1.27 04/05/16 22:02:40 smurf@smurf.noris.de +2 -0
+  ship "empty" file
+
+  yapps/__init__.py
+    1.2 04/05/16 22:02:39 smurf@smurf.noris.de +1 -0
+    ship "empty" file
+
+  debian/changelog
+    1.12 04/05/16 22:02:39 smurf@smurf.noris.de +2 -1
+    doc
+
+ChangeSet
+  1.26 04/05/16 22:01:42 smurf@smurf.noris.de +2 -0
+  Typo (made large file handling slow)
+
+  yapps/runtime.py
+    1.13 04/05/16 22:01:42 smurf@smurf.noris.de +1 -1
+    Typo
+
+  debian/changelog
+    1.11 04/05/16 22:01:42 smurf@smurf.noris.de +6 -0
+    Version 2.1.1-11
+
+ChangeSet
+  1.25 04/05/14 12:25:51 smurf@smurf.noris.de +1 -0
+  exporter: test was in wrong dir
+
+  debian/exporter
+    1.3 04/05/14 12:25:51 smurf@smurf.noris.de +1 -0
+    wrong dir
+
+ChangeSet
+  1.24 04/05/14 12:20:04 smurf@smurf.noris.de +1 -0
+  Clean up external source before generating a diff
+
+  debian/exporter
+    1.2 04/05/14 12:20:04 smurf@smurf.noris.de +7 -0
+    Clean up external source before generating a diff
+
+ChangeSet
+  1.23 04/05/14 12:14:34 smurf@linux.smurf.noris.de +13 -0
+  Documentation update:
+   build and install HTML documentation from LaTex source
+
+  debian/changelog
+    1.10 04/05/14 12:14:33 smurf@linux.smurf.noris.de +7 -0
+    Version 2.1.1-10
+
+  debian/yapps2.doc-base
+    1.1 04/05/14 12:14:32 smurf@smurf.noris.de +13 -0
+
+  yapps_grammar.g
+    1.5 04/05/14 12:14:31 smurf@smurf.noris.de +1 -0
+    add my copyright notice
+
+  yapps/runtime.py
+    1.12 04/05/14 12:14:31 smurf@smurf.noris.de +1 -0
+    add my copyright notice
+
+  debian/yapps2.doc-base
+    1.0 04/05/14 12:14:31 smurf@smurf.noris.de +0 -0
+    BitKeeper file /usr/local/src/misc/yapps/debian/yapps2.doc-base
+
+  debian/rules
+    1.3 04/05/14 12:14:31 smurf@smurf.noris.de +5 -5
+    gernerate and install html documentation
+    don't install LICENSE file
+
+  debian/yapps2-runtime.dirs
+    1.3 04/05/14 12:14:30 smurf@smurf.noris.de +1 -2
+    drop overrides
+    add doc dir +html
+
+  debian/docs
+    1.2 04/05/14 12:14:30 smurf@smurf.noris.de +1 -1
+    install latex documentation
+
+  debian/dirs
+    1.3 04/05/14 12:14:30 smurf@smurf.noris.de +1 -2
+    drop overrides
+    add doc dir +html
+
+  debian/copyright
+    1.3 04/05/14 12:14:30 smurf@smurf.noris.de +21 -3
+    include license here instead of installing a LICENSE file
+
+  debian/control
+    1.5 04/05/14 12:14:30 smurf@smurf.noris.de +6 -6
+    Dep on latex2html
+    indent list
+
+  BitKeeper/etc/ignore
+    1.14 04/05/14 12:06:12 smurf@smurf.noris.de +1 -0
+    added doc/yapps2/*
+
+  BitKeeper/etc/ignore
+    1.13 04/05/14 12:06:07 smurf@smurf.noris.de +3 -0
+    added debian/yapps2/* debian/*.substvars debian/*.debhelper
+
+  BitKeeper/deleted/.del-overrides.lintian~19711613dc4ce90f
+    1.3 04/05/14 11:51:33 smurf@smurf.noris.de +0 -0
+    Delete: debian/overrides.lintian
+
+  BitKeeper/deleted/.del-overrides.linda~b0c6fa08da170a16
+    1.2 04/05/14 11:51:33 smurf@smurf.noris.de +0 -0
+    Delete: debian/overrides.linda
+
+  doc/yapps2.tex
+    1.2 04/05/14 11:34:34 smurf@smurf.noris.de +0 -0
+    Rename: yapps2.tex -> doc/yapps2.tex
+
+ChangeSet
+  1.22 04/05/14 11:33:27 smurf@smurf.noris.de +1 -0
+  Merge bk://server/public/python_yapps
+  into smurf.noris.de:/usr/local/src/misc/yapps
+
+  BitKeeper/deleted/.del-logging_ok~530b65bc14e5cc7c
+    1.2 04/05/14 11:33:26 smurf@smurf.noris.de +0 -0
+    'Auto converge rename'
+
   BitKeeper/etc/logging_ok
     1.1 04/05/14 11:33:13 smurf@smurf.noris.de +1 -0
 
@@ -25,6 +326,10 @@
     Fixed name
     Updated long description
 
+  debian/yapps2-runtime.dirs
+    1.2 04/05/14 11:31:17 smurf@smurf.noris.de +1 -1
+    rename: python-yapps => yapps2
+
   debian/rules
     1.2 04/05/14 11:31:17 smurf@smurf.noris.de +8 -8
     rename: python-yapps => yapps2
@@ -170,6 +475,9 @@
     1.0 03/12/30 11:51:25 smurf@smurf.noris.de +0 -0
     BitKeeper file /usr/local/src/misc/yapps/setup.py
 
+  debian/yapps2-runtime.dirs
+    1.1 03/12/30 11:51:24 smurf@smurf.noris.de +5 -0
+
   debian/yapps.1
     1.0 03/12/30 11:51:25 smurf@smurf.noris.de +0 -0
     BitKeeper file /usr/local/src/misc/yapps/debian/yapps.1
@@ -226,6 +534,10 @@
     1.10 03/12/30 11:51:24 smurf@smurf.noris.de +0 -2
     Drop shebang line, this is not a program.
 
+  debian/yapps2-runtime.dirs
+    1.0 03/12/30 11:51:24 smurf@smurf.noris.de +0 -0
+    BitKeeper file /usr/local/src/misc/yapps/debian/dirs
+
   debian/overrides.linda
     1.0 03/12/30 11:51:24 smurf@smurf.noris.de +0 -0
     BitKeeper file /usr/local/src/misc/yapps/debian/overrides.linda
--- yapps2-2.1.1.orig/debian/README
+++ yapps2-2.1.1/debian/README
@@ -0,0 +1,23 @@
+The Debian Package yapps2
+-------------------------
+
+This package contains several upward-compatible enhancements to the
+original YAPPS source:
+- Handle stacked input ("include files")
+- augmented ignore-able patterns
+  (this means that yapps2 now can parse things like multi-line C comments)
+- better error reporting
+- read input incrementally
+
+Traditionally, the yapps runtime is called yappsrt.py and it was
+installed with the binary that uses the parser. However, as soon as
+there is more than one of those, this method breaks.
+
+Therefore, and because the new runtime isn't entirely compatible with the
+old yappsrt.py, I decided to rename the runtime module to
+yapps/runtime.py. It is provided by the yapps2-runtime package.
+You need to depend on this package if you Debianize Python programs that
+use yapps2-generated parsers.
+
+-- 
+Matthias Urlichs
--- yapps2-2.1.1.orig/debian/changelog
+++ yapps2-2.1.1/debian/changelog
@@ -0,0 +1,157 @@
+yapps2 (2.1.1-17.5) unstable; urgency=medium
+
+  * Non-maintainer upload.
+  * Move binary-arch rule to binary-indep, since all our binary packages are
+    Architecture: all.
+
+ -- Colin Watson <cjwatson@debian.org>  Tue, 08 Nov 2016 19:48:31 +0000
+
+yapps2 (2.1.1-17.4) unstable; urgency=medium
+
+  * Non-maintainer upload.
+  * Bump to debhelper compat level 9 (closes: #817771).
+  * Use ${binary:Version} rather than ${Source-Version} (closes: #833233).
+
+ -- Colin Watson <cjwatson@debian.org>  Sun, 06 Nov 2016 17:11:44 +0000
+
+yapps2 (2.1.1-17.3) unstable; urgency=medium
+
+  * Non-maintainer upload.
+  * Build using dh-python. Closes: #786242.
+
+ -- Matthias Klose <doko@debian.org>  Sat, 22 Aug 2015 15:10:19 +0200
+
+yapps2 (2.1.1-17.2) unstable; urgency=low
+
+  * Non-maintainer upload.
+  * Python 2.6 transition (closes: #547877):
+    + debian/control:
+      - Bump python-dev to >= 2.5.4-1~.
+    + debian/rules:
+      - Use macros provided by /usr/share/python/python.mk to install
+        files in correct locations for every supported Python version.
+
+ -- Luca Falavigna <dktrkranz@debian.org>  Wed, 14 Oct 2009 23:05:28 +0200
+
+yapps2 (2.1.1-17.1) unstable; urgency=low
+
+  * Non-maintainer upload.
+  * Update package to the last python policy (Closes: 380992).
+  * Bump Standards-Version to 3.7.2.
+  * Move debhelper to Build-Depends.
+
+ -- Pierre Habouzit <madcoder@debian.org>  Sun,  3 Sep 2006 23:51:24 +0200
+
+yapps2 (2.1.1-17) unstable; urgency=medium
+
+  * Fix recursive includes.
+  * Add option to limit backtrace depth on syntax errors.
+
+ -- Matthias Urlichs <smurf@debian.org>  Sat, 22 Jan 2005 04:10:33 +0100
+
+yapps2 (2.1.1-16) unstable; urgency=medium
+
+  * Brown paper bag -- fix Python 2.4 stuff.
+
+ -- Matthias Urlichs <smurf@debian.org>  Thu, 23 Dec 2004 23:48:58 +0100
+
+yapps2 (2.1.1-15) unstable; urgency=medium
+
+  * Add support for Python 2.4.
+
+ -- Matthias Urlichs <smurf@debian.org>  Sun, 12 Dec 2004 20:20:18 +0100
+
+yapps2 (2.1.1-14) unstable; urgency=medium
+
+  * Split off the Python parser runtime into its own package
+    + sort-of Closes: #272738: Generated python files import yapps.runtime
+                               instead of yappsrt
+      - can't use yappsrt; it's not downward-compatible
+  * too many (i.e. more than zero) unquoted hyphens in the manpage
+  * update documentation that this is an enhanced version
+
+ -- Matthias Urlichs <smurf@debian.org>  Thu, 23 Sep 2004 10:44:41 +0200
+
+yapps2 (2.1.1-13) unstable; urgency=low
+
+  * latex2html => hevea
+
+ -- Matthias Urlichs <smurf@debian.org>  Mon, 19 Jul 2004 09:29:17 +0200
+
+yapps2 (2.1.1-12) unstable; urgency=low
+
+  * Build-Depend on python.
+
+ -- Matthias Urlichs <smurf@debian.org>  Mon, 12 Jul 2004 09:35:29 +0200
+
+yapps2 (2.1.1-11) unstable; urgency=low
+
+  * Typo (made large file handling slow)
+  * installation problem (new zero-sized file)
+
+ -- Matthias Urlichs <smurf@debian.org>  Sun, 16 May 2004 22:01:53 +0200
+
+yapps2 (2.1.1-10) unstable; urgency=low
+
+  * Documentation update:
+    build and install HTML documentation from LaTex source
+
+ -- Matthias Urlichs <smurf@debian.org>  Fri, 14 May 2004 12:14:33 +0200
+
+yapps2 (2.1.1-9) unstable; urgency=low
+
+  * Renamed the package to "yapps2".
+  * Submit to Debian. Closes: #201568.
+  * Fix minor problem with setup.py.
+
+ -- Matthias Urlichs <smurf@debian.org>  Fri, 14 May 2004 11:17:20 +0200
+
+yapps (2.1.1-8) unstable; urgency=low
+
+  * require python-dev because of distutils.
+
+ -- Matthias Urlichs <smurf@debian.org>  Wed, 31 Dec 2003 14:00:42 +0100
+
+yapps (2.1.1-7) unstable; urgency=low
+
+  * Change yapps.py to exit with 1 if there was a parser failure.
+
+ -- Matthias Urlichs <smurf@debian.org>  Wed, 31 Dec 2003 13:57:38 +0100
+
+yapps (2.1.1-6) unstable; urgency=low
+
+  * Update to 3.6.1, use build-depends-indep.
+
+ -- Matthias Urlichs <smurf@debian.org>  Tue, 30 Dec 2003 15:36:56 +0100
+
+yapps (2.1.1-5) unstable; urgency=low
+
+  * Add some notes.
+
+ -- Matthias Urlichs <smurf@debian.org>  Tue, 30 Dec 2003 15:33:19 +0100
+
+yapps (2.1.1-4) unstable; urgency=low
+
+  * Correctly report syntax errors if there are no line numbers.
+
+ -- Matthias Urlichs <smurf@debian.org>  Tue, 30 Dec 2003 15:30:05 +0100
+
+yapps (2.1.1-3) unstable; urgency=low
+
+  * Repair ignored-pattern upcall.
+
+ -- Matthias Urlichs <smurf@debian.org>  Tue, 30 Dec 2003 14:02:37 +0100
+
+yapps (2.1.1-2) unstable; urgency=low
+
+  * runtime: fix error reporting.
+
+ -- Matthias Urlichs <smurf@debian.org>  Tue, 30 Dec 2003 13:30:14 +0100
+
+yapps (2.1.1-1) unstable; urgency=low
+
+  * Initial Debian packaging.
+    - Added a manpage.
+
+ -- Matthias Urlichs <smurf@debian.org>  Mon, 29 Dec 2003 17:13:59 +0100
+
--- yapps2-2.1.1.orig/debian/compat
+++ yapps2-2.1.1/debian/compat
@@ -0,0 +1 @@
+9
--- yapps2-2.1.1.orig/debian/control
+++ yapps2-2.1.1/debian/control
@@ -0,0 +1,41 @@
+Source: yapps2
+Section: python
+Priority: optional
+Maintainer: Matthias Urlichs <smurf@debian.org>
+Build-Depends: debhelper (>= 9~)
+Build-Depends-Indep: python-dev (>= 2.5.4-1~), hevea, dh-python
+Standards-Version: 3.7.2
+
+Package: yapps2
+Architecture: all
+Depends: ${python:Depends}, yapps2-runtime (= ${binary:Version})
+Description: Yet Another Python Parser System
+ YAPPS is an easy to use parser generator that is written in Python and
+ generates Python code.  There are several parser generator systems
+ already available for Python, but this parser has different goals:
+ Yapps is simple, very easy to use, and produces human-readable parsers.
+ .
+ It is not the fastest or most powerful parser.  Yapps is designed to be
+ used when regular expressions are not enough and other parser systems
+ are too much: situations where you might otherwise write your own
+ recursive descent parser.
+ .
+ This package contains several upward-compatible enhancements to the
+ original YAPPS source:
+ .
+     - handles recursive input ("include files")
+     - better error reporting
+     - reads input incrementally
+
+Package: yapps2-runtime
+Architecture: all
+Depends: ${python:Depends}
+Description: Yet Another Python Parser System (runtime support)
+ YAPPS is an easy to use parser generator that is written in Python and
+ generates Python code.  There are several parser generator systems
+ already available for Python, but this parser has different goals:
+ Yapps is simple, very easy to use, and produces human-readable parsers.
+ .
+ This package contains the Python runtime support for parsers generated
+ with yapps2.
+
--- yapps2-2.1.1.orig/debian/copyright
+++ yapps2-2.1.1/debian/copyright
@@ -0,0 +1,41 @@
+This is yapps2, Yet Another Python Parser System,
+written by Amit J. Patel <amitp@theory.stanford.edu>.
+
+It was packaged for Debian by Matthias Urlichs <smurf@debian.org>
+on Fri, 14 May 2004.
+
+The original source can be found at:
+    http://theory.stanford.edu/~amitp/yapps/yapps2.1.1.zip
+
+The original copyright notice states:
+
+# Yapps 2 - yet another python parser system
+# Copyright 1999-2003 by Amit J. Patel <amitp@cs.stanford.edu>
+#
+# This version of Yapps 2 can be distributed under the
+# terms of the MIT open source license, either found in the LICENSE file
+# included with the Yapps distribution
+# <http://theory.stanford.edu/~amitp/yapps/> or at
+# <http://www.opensource.org/licenses/mit-license.php>
+
+The LICENSE file states:
+  <http://www.opensource.org/licenses/mit-license.php>
+
+  Permission is hereby granted, free of charge, to any person obtaining 
+  a copy of this software and associated documentation files (the 
+  "Software"), to deal in the Software without restriction, including 
+  without limitation the rights to use, copy, modify, merge, publish, 
+  distribute, sublicense, and/or sell copies of the Software, and to 
+  permit persons to whom the Software is furnished to do so, subject to 
+  the following conditions: 
+
+  The above copyright notice and this permission notice shall be included 
+  in all copies or substantial portions of the Software. 
+
+  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 
+  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 
+  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
+  IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY 
+  CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, 
+  TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE 
+  SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
--- yapps2-2.1.1.orig/debian/exporter
+++ yapps2-2.1.1/debian/exporter
@@ -0,0 +1,18 @@
+#!/bin/sh
+# Usage: exporter DESTDIR [REV] -- REV defaults to "+" when omitted.
+set -e
+# Require DESTDIR and reject a third argument (exit status 1, as before).
+test -n "$1" || { echo "usage: $0 DESTDIR [REV]" >&2; exit 1; }
+test -z "$3" || { echo "usage: $0 DESTDIR [REV]" >&2; exit 1; }
+if test -z "$2" ; then T="+"; else T="$2"; fi
+D="$1"
+# Write the BitKeeper history from 1.0 up to REV into DESTDIR/changelog.
+bk changes -v -r1.0.."$T" > "$D"/changelog
+cd "$D"
+if test ! -d doc ; then
+	mkdir doc yapps
+	mv yapps2.tex doc
+	mv yappsrt.py yapps/runtime.py
+	mv parsetree.py grammar.py yapps/
+	rm yapps_grammar.py
+fi
--- yapps2-2.1.1.orig/debian/pyversions
+++ yapps2-2.1.1/debian/pyversions
@@ -0,0 +1 @@
+2.2-
--- yapps2-2.1.1.orig/debian/rules
+++ yapps2-2.1.1/debian/rules
@@ -0,0 +1,100 @@
+#!/usr/bin/make -f
+# -*- makefile -*-
+# Sample debian/rules that uses debhelper.
+# GNU copyright 1997 to 1999 by Joey Hess.
+
+# Uncomment this to turn on verbose mode.
+#export DH_VERBOSE=1
+
+include /usr/share/python/python.mk
+
+PWD=$(shell pwd)
+PYVER=$(shell pyversions -d)
+
+CFLAGS = -Wall -g
+
+ifneq (,$(findstring noopt,$(DEB_BUILD_OPTIONS)))
+	CFLAGS += -O0
+else
+	CFLAGS += -O2
+endif
+ifeq (,$(findstring nostrip,$(DEB_BUILD_OPTIONS)))
+	INSTALL_PROGRAM += -s
+endif
+
+configure: configure-stamp
+configure-stamp:
+	dh_testdir
+	# Nothing to configure; the stamp only satisfies build-stamp's prerequisite.
+
+	touch configure-stamp
+
+
+build: build-stamp
+
+build-stamp: configure-stamp 
+	dh_testdir
+
+	# Build the Python modules, then render the manual to HTML with hevea.
+	python setup.py build
+	#/usr/bin/docbook-to-man debian/yapps2.sgml > yapps.1
+	#cd doc && latex2html yapps2.tex
+	cd doc && hevea yapps2.tex
+	cd doc && hevea yapps2.tex # twice because of TOC
+
+	touch build-stamp
+
+clean:
+	dh_testdir
+	dh_testroot
+	rm -f build-stamp configure-stamp
+	# Also remove hevea output so generated docs do not leak into the source diff.
+	rm -rf build debian/yapps2 doc/yapps2
+	rm -f doc/yapps2.haux doc/yapps2.ht*
+	test -f changelog || bk changes > changelog
+	dh_clean
+
+install: build
+	dh_testdir
+	dh_testroot
+	dh_prep
+	dh_installdirs
+	dh_installdirs -pyapps2-runtime usr/lib/$(PYVER)/${call py_sitename, ${PYVER}}/yapps
+	# dh_prep (above) replaces the deprecated "dh_clean -k".
+	# Install into debian/yapps2, then move the runtime files to debian/yapps2-runtime.
+	python setup.py install --root=$(PWD)/debian/yapps2 --no-compile ${py_setup_install_args}
+	install -m 755 yapps2.py debian/yapps2/usr/bin/yapps
+	install -m 644 doc/yapps2.html debian/yapps2/usr/share/doc/yapps2/
+	set -e; \
+	for f in runtime.py __init__.py; do \
+	    mv $(PWD)/debian/yapps2/usr/lib/$(PYVER)/${call py_sitename, ${PYVER}}/yapps/$$f \
+	        $(PWD)/debian/yapps2-runtime/usr/lib/$(PYVER)/${call py_sitename, ${PYVER}}/yapps/; \
+	done
+
+# Build architecture-independent files here; both binary packages are Architecture: all.
+binary-indep: build install
+	dh_testdir
+	dh_testroot
+	dh_installchangelogs 
+	dh_installdocs 
+	dh_installexamples examples/* test yapps_grammar.g
+	dh_installman debian/yapps.1
+	find debian/yapps2/usr/share -name SCCS -print0 | xargs -0r rm -rf
+	dh_compress
+	dh_compress usr/share/doc/yapps2/NOTES
+	dh_fixperms
+#	dh_perl
+	dh_python2
+#	dh_makeshlibs
+	dh_installdeb
+	dh_shlibdeps
+	dh_gencontrol
+	dh_md5sums
+	dh_builddeb
+
+# Build architecture-dependent files here.
+binary-arch: build install
+# Nothing to do: this source builds no architecture-dependent packages.
+
+binary: binary-indep binary-arch
+.PHONY: build clean binary-indep binary-arch binary install configure
--- yapps2-2.1.1.orig/debian/yapps.1
+++ yapps2-2.1.1/debian/yapps.1
@@ -0,0 +1,63 @@
+.\" $Revision: 1.5 $
+.TH YAPPS 1
+.SH NAME
+yapps \- create a Python module from a grammar file
+.SH SYNOPSIS
+.B yapps 
+[
+.B \-\-dump
+]
+[
+.B \-\-use\-devel\-grammar
+]
+[
+.B \-fcontext\-insensitive\-scanner
+]
+[
+.BI \-p
+.BI " pid"
+]
+[
+.BI \-f
+]
+input.g
+[
+.BI output.py
+]
+.BI " name"
+.SH DESCRIPTION
+
+  \-\-dump                           Dump out grammar information
+  \-\-use\-devel\-grammar              Use the devel grammar parser from
+      yapps_grammar.py instead of the stable grammar from grammar.py
+  \-fcontext\-insensitive\-scanner    Scan all tokens (see docs)
+
+.I yapps
+generates a Python module that parses input according to a given grammar.
+.PP
+.SH OPTIONS
+.TP
+.B \-\-dump
+Dump the grammar information to stdout.
+.TP
+.B \-\-use\-devel\-grammar
+Use the grammar file in ./yapps_grammar.py instead of yapps/grammar.py.
+.br
+This option is useful for testing new grammar parsers. (Yes, yapps'
+parser is itself written with yapps...)
+.TP
+.B \-fcontext\-insensitive\-scanner
+Set the option to use the non\-context\-sensitive scanner.
+.SH CAVEATS
+.I yapps
+generates recursive\-descent parsers.
+.SH HISTORY
+Written by Amit J. Patel <amitp@cs.stanford.edu>.
+.br
+This version was enhanced by Matthias Urlichs <smurf@debian.org>.
+It is
+.B not
+downwards-compatible with the original yapps2 (yet) and uses a different
+runtime library.
+.br
+See the change log for details.
--- yapps2-2.1.1.orig/debian/yapps2-runtime.README
+++ yapps2-2.1.1/debian/yapps2-runtime.README
@@ -0,0 +1,11 @@
+The Debian Package yapps2-runtime
+---------------------------------
+
+This package contains the new runtime Python code for the augmented
+yapps2 parser which is included in Debian.
+
+You need to depend on this package if you Debianize Python programs that
+contain a yapps2-built parser.
+
+-- 
+Matthias Urlichs
--- yapps2-2.1.1.orig/debian/yapps2-runtime.dirs
+++ yapps2-2.1.1/debian/yapps2-runtime.dirs
@@ -0,0 +1 @@
+usr/share/doc/yapps2-runtime
--- yapps2-2.1.1.orig/debian/yapps2.dirs
+++ yapps2-2.1.1/debian/yapps2.dirs
@@ -0,0 +1,3 @@
+usr/bin
+usr/share/doc/yapps2
+usr/share/doc/yapps2/html/
--- yapps2-2.1.1.orig/debian/yapps2.doc-base
+++ yapps2-2.1.1/debian/yapps2.doc-base
@@ -0,0 +1,13 @@
+Document: yapps2
+Title: Debian yapps Manual
+Author: Amit J. Patel <amitp@theory.stanford.edu>
+Abstract: This manual describes the YAPPS parser generator.
+Section: python
+
+Format: latex
+Files: /usr/share/doc/yapps2/yapps2.tex.gz
+
+Format: HTML
+Index: /usr/share/doc/yapps2/yapps2.html
+Files: /usr/share/doc/yapps2/yapps2.html
+
--- yapps2-2.1.1.orig/debian/yapps2.docs
+++ yapps2-2.1.1/debian/yapps2.docs
@@ -0,0 +1,3 @@
+NOTES
+changelog
+doc/yapps2.tex
--- yapps2-2.1.1.orig/doc/yapps2.haux
+++ yapps2-2.1.1/doc/yapps2.haux
@@ -0,0 +1,31 @@
+\@@addtocsec{htoc}{sec1}{0}{\@print{1}\quad{}Introduction{}}
+\@@addtocsec{htoc}{sec2}{0}{\@print{2}\quad{}Examples{}}
+\@@addtocsec{htoc}{sec3}{1}{\@print{2.1}\quad{}Introduction to Grammars{}}
+\@@addtocsec{htoc}{sec4}{1}{\@print{2.2}\quad{}Lisp Expressions{}}
+\@@addtocsec{htoc}{sec7}{1}{\@print{2.3}\quad{}Calculator{}}
+\@@addtocsec{htoc}{sec8}{1}{\@print{2.4}\quad{}Calculator with Memory{}}
+\@@addtocsec{htoc}{sec9}{0}{\@print{3}\quad{}Grammars{}}
+\@@addtocsec{htoc}{sec10}{1}{\@print{3.1}\quad{}Left Factoring{}}
+\newlabel{sec:Left-Factoring}{{3.1}{X}}
+\@@addtocsec{htoc}{sec11}{1}{\@print{3.2}\quad{}Left Recursion{}}
+\@@addtocsec{htoc}{sec12}{1}{\@print{3.3}\quad{}Ambiguous Grammars{}}
+\newlabel{sec:Ambiguous-Grammars}{{3.3}{X}}
+\@@addtocsec{htoc}{sec13}{0}{\@print{4}\quad{}Customization{}}
+\@@addtocsec{htoc}{sec14}{1}{\@print{4.1}\quad{}Customizing Parsers{}}
+\@@addtocsec{htoc}{sec15}{1}{\@print{4.2}\quad{}Customizing Scanners{}}
+\@@addtocsec{htoc}{sec16}{0}{\@print{5}\quad{}Parser Mechanics{}}
+\@@addtocsec{htoc}{sec17}{1}{\@print{5.1}\quad{}Parser Objects{}}
+\newlabel{sec:Parser-Objects}{{5.1}{X}}
+\@@addtocsec{htoc}{sec18}{1}{\@print{5.2}\quad{}Context Sensitive Scanner{}}
+\@@addtocsec{htoc}{sec19}{1}{\@print{5.3}\quad{}Internal Variables{}}
+\@@addtocsec{htoc}{sec20}{1}{\@print{5.4}\quad{}Pre- and Post-Parser Code{}}
+\@@addtocsec{htoc}{sec21}{1}{\@print{5.5}\quad{}Representation of Grammars{}}
+\@@addtocsec{htoc}{sec22}{0}{\@print{A}\quad{}Grammar for Parsers{}}
+\@@addtocsec{htoc}{sec23}{0}{\@print{B}\quad{}Upgrading{}}
+\@@addtocsec{htoc}{sec24}{0}{\@print{C}\quad{}Troubleshooting{}}
+\@@addtocsec{htoc}{sec25}{0}{\@print{D}\quad{}History{}}
+\@@addtocsec{htoc}{sec26}{0}{\@print{E}\quad{}Debian Extensions{}}
+\newlabel{sec:debian}{{E}{X}}
+\@@addtocsec{htoc}{sec27}{0}{\@print{F}\quad{}Future Extensions{}}
+\newlabel{sec:future}{{F}{X}}
+\@@addtocsec{htoc}{sec28}{0}{\@print{G}\quad{}References{}}
--- yapps2-2.1.1.orig/doc/yapps2.html
+++ yapps2-2.1.1/doc/yapps2.html
@@ -0,0 +1,871 @@
+<!DOCTYPE html>
+<html >
+<head>
+<meta http-equiv="Content-Type" content="text/html; charset=US-ASCII">
+<meta name="generator" content="hevea 2.23">
+<style type="text/css">
+.li-itemize{margin:1ex 0ex;}
+.li-enumerate{margin:1ex 0ex;}
+.dd-description{margin:0ex 0ex 1ex 4ex;}
+.dt-description{margin:0ex;}
+.toc{list-style:none;}
+.footnotetext{margin:0ex; padding:0ex;}
+div.footnotetext P{margin:0px; text-indent:1em;}
+.thefootnotes{text-align:left;margin:0ex;}
+.dt-thefootnotes{margin:0em;}
+.dd-thefootnotes{margin:0em 0em 0em 2em;}
+.footnoterule{margin:1em auto 1em 0px;width:50%;}
+.caption{padding-left:2ex; padding-right:2ex; margin-left:auto; margin-right:auto}
+.title{margin:2ex auto;text-align:center}
+.titlemain{margin:1ex 2ex 2ex 1ex;}
+.titlerest{margin:0ex 2ex;}
+.center{text-align:center;margin-left:auto;margin-right:auto;}
+.flushleft{text-align:left;margin-left:0ex;margin-right:auto;}
+.flushright{text-align:right;margin-left:auto;margin-right:0ex;}
+div table{margin-left:inherit;margin-right:inherit;margin-bottom:2px;margin-top:2px}
+td table{margin:auto;}
+table{border-collapse:collapse;}
+td{padding:0;}
+.cellpadding0 tr td{padding:0;}
+.cellpadding1 tr td{padding:1px;}
+pre{text-align:left;margin-left:0ex;margin-right:auto;}
+blockquote{margin-left:4ex;margin-right:4ex;text-align:left;}
+td p{margin:0px;}
+.boxed{border:1px solid black}
+.textboxed{border:1px solid black}
+.vbar{border:none;width:2px;background-color:black;}
+.hbar{border:none;height:2px;width:100%;background-color:black;}
+.hfill{border:none;height:1px;width:200%;background-color:black;}
+.vdisplay{border-collapse:separate;border-spacing:2px;width:auto; empty-cells:show; border:2px solid red;}
+.vdcell{white-space:nowrap;padding:0px; border:2px solid green;}
+.display{border-collapse:separate;border-spacing:2px;width:auto; border:none;}
+.dcell{white-space:nowrap;padding:0px; border:none;}
+.dcenter{margin:0ex auto;}
+.vdcenter{border:solid #FF8000 2px; margin:0ex auto;}
+.minipage{text-align:left; margin-left:0em; margin-right:auto;}
+.marginpar{border:solid thin black; width:20%; text-align:left;}
+.marginparleft{float:left; margin-left:0ex; margin-right:1ex;}
+.marginparright{float:right; margin-left:1ex; margin-right:0ex;}
+.theorem{text-align:left;margin:1ex auto 1ex 0ex;}
+.part{margin:2ex auto;text-align:center}
+</style>
+<title>yapps2</title>
+</head>
+<body >
+<!--HEVEA command line is: /usr/bin/hevea yapps2.tex -->
+<!--CUT STYLE article--><!--CUT DEF section 1 --><div class="center">
+<table style="border-spacing:6px;border-collapse:separate;" class="cellpadding0"><tr><td style="text-align:center;white-space:nowrap" ><span style="font-size:x-large">The </span><span style="font-size:x-large"><em>Yapps</em></span><span style="font-size:x-large"> Parser Generator System</span></td></tr>
+<tr><td style="text-align:center;white-space:nowrap" ><code>http://theory.stanford.edu/~amitp/Yapps/</code></td></tr>
+<tr><td style="text-align:center;white-space:nowrap" > Version 2</td></tr>
+<tr><td style="text-align:center;white-space:nowrap" >&nbsp;</td></tr>
+<tr><td style="text-align:center;white-space:nowrap" >Amit J. Patel</td></tr>
+<tr><td style="text-align:center;white-space:nowrap" >http://www-cs-students.stanford.edu/~amitp/
+http://www-cs-students.stanford.edu/~amitp/ </td></tr>
+</table> <hr style="height:2px">
+</div>
+<!--TOC section id="sec1" Introduction-->
+<h2 id="sec1" class="section">1&#XA0;&#XA0;Introduction</h2><!--SEC END --><p><em>Yapps</em> (<U>Y</U>et <U>A</U>nother <U>P</U>ython
+<U>P</U>arser <U>S</U>ystem) is an easy to use parser
+generator that is written in Python and generates Python code. There
+are several parser generator systems already available for Python,
+including <span style="font-family:monospace">PyLR, kjParsing, PyBison,</span> and <span style="font-family:monospace">mcf.pars,</span>
+but I had different goals for my parser. Yapps is simple, is easy to
+use, and produces human-readable parsers. It is not the fastest or
+most powerful parser. Yapps is designed to be used when regular
+expressions are not enough and other parser systems are too much:
+situations where you may write your own recursive descent parser.</p><p>Some unusual features of Yapps that may be of interest are:</p><ol class="enumerate" type=1><li class="li-enumerate">Yapps produces recursive descent parsers that are readable by
+humans, as opposed to table-driven parsers that are difficult to
+read. A Yapps parser for a simple calculator looks similar to the
+one that Mark Lutz wrote by hand for <em>Programming Python.</em></li><li class="li-enumerate">Yapps also allows for rules that accept parameters and pass
+arguments to be used while parsing subexpressions. Grammars that
+allow for arguments to be passed to subrules and for values to be
+passed back are often called <em>attribute grammars.</em> In many
+cases parameterized rules can be used to perform actions at &#X201C;parse
+time&#X201D; that are usually delayed until later. For example,
+information about variable declarations can be passed into the
+rules that parse a procedure body, so that undefined variables can
+be detected at parse time. The types of defined variables can be
+used in parsing as well&#X2014;for example, if the type of <span style="font-family:monospace">X</span> is
+known, we can determine whether <span style="font-family:monospace">X(1)</span> is an array reference or 
+a function call.</li><li class="li-enumerate">Yapps grammars are fairly easy to write, although there are
+some inconveniences having to do with ELL(1) parsing that have to be
+worked around. For example, rules have to be left factored and
+rules may not be left recursive. However, neither limitation seems 
+to be a problem in practice. <p>Yapps grammars look similar to the notation used in the Python
+reference manual, with operators like <code>*</code>, <code>+</code>, <code>|</code>,
+<code>[]</code>, and <code>()</code> for patterns, names (<span style="font-family:monospace">tim</span>) for rules,
+regular expressions (<code>"[a-z]+"</code>) for tokens, and <code>#</code> for
+comments.</p></li><li class="li-enumerate">The Yapps parser generator is written as a single Python module
+with no C extensions. Yapps produces parsers that are written
+entirely in Python, and require only the Yapps run-time module (5k)
+for support.</li><li class="li-enumerate">Yapps&#X2019;s scanner is context-sensitive, picking tokens based on
+the types of the tokens accepted by the parser. This can be
+helpful when implementing certain kinds of parsers, such as for a
+preprocessor.</li></ol><p>There are several disadvantages of using Yapps over another parser system:</p><ol class="enumerate" type=1><li class="li-enumerate">Yapps parsers are <span style="font-family:monospace">ELL(1)</span> (Extended LL(1)), which is
+less powerful than <span style="font-family:monospace">LALR</span> (used by <span style="font-family:monospace">PyLR</span>) or
+<span style="font-family:monospace">SLR</span> (used by <span style="font-family:monospace">kjParsing</span>), so Yapps would not be a
+good choice for parsing complex languages. For example, allowing
+both <span style="font-family:monospace">x := 5;</span> and <span style="font-family:monospace">x;</span> as statements is difficult
+because we must distinguish based on only one token of lookahead.
+Seeing only <span style="font-family:monospace">x</span>, we cannot decide whether we have an
+assignment statement or an expression statement. (Note however
+that this kind of grammar can be matched with backtracking; see
+section <a href="#sec%3Afuture">F</a>.)</li><li class="li-enumerate">The scanner that Yapps provides can only read from strings, not
+files, so an entire file has to be read in before scanning can
+begin. It is possible to build a custom scanner, though, so in
+cases where stream input is needed (from the console, a network, or
+a large file are examples), the Yapps parser can be given a custom
+scanner that reads from a stream instead of a string.</li><li class="li-enumerate">Yapps is not designed with efficiency in mind.</li></ol><p>Yapps provides an easy to use parser generator that produces parsers
+similar to what you might write by hand. It is not meant to be a
+solution for all parsing problems, but instead an aid for those times
+you would write a parser by hand rather than using one of the more
+powerful parsing packages available.</p><p>Yapps 2.0 is easier to use than Yapps 1.0. New features include a
+less restrictive input syntax, which allows mixing of sequences,
+choices, terminals, and nonterminals; optional matching; the ability
+to insert single-line statements into the generated parser; and
+looping constructs <code>*</code> and <code>+</code> similar to the repetitive
+matching constructs in regular expressions. Unfortunately, the
+addition of these constructs has made Yapps 2.0 incompatible with
+Yapps 1.0, so grammars will have to be rewritten. See section
+<a href="#sec23">B</a> for tips on changing Yapps 1.0 grammars for use
+with Yapps 2.0.</p>
+<!--TOC section id="sec2" Examples-->
+<h2 id="sec2" class="section">2&#XA0;&#XA0;Examples</h2><!--SEC END --><p>In this section are several examples that show the use of Yapps.
+First, an introduction shows how to construct grammars and write them
+in Yapps form. This example can be skipped by someone familiar with
+grammars and parsing. Next is a Lisp expression grammar that produces
+a parse tree as output. This example demonstrates the use of tokens
+and rules, as well as returning values from rules. The third example
+is an expression evaluation grammar that evaluates during parsing
+(instead of producing a parse tree).</p>
+<!--TOC subsection id="sec3" Introduction to Grammars-->
+<h3 id="sec3" class="subsection">2.1&#XA0;&#XA0;Introduction to Grammars</h3><!--SEC END --><p>A <em>grammar</em> for a natural language specifies how words can be put
+together to form large structures, such as phrases and sentences. A
+grammar for a computer language is similar in that it specifies how
+small components (called <em>tokens</em>) can be put together to form
+larger structures. In this section we will write a grammar for a tiny
+subset of English.</p><p>Simple English sentences can be described as being a noun phrase
+followed by a verb followed by a noun phrase. For example, in the
+sentence, &#X201C;Jack sank the blue ship,&#X201D; the word &#X201C;Jack&#X201D; is the first
+noun phrase, &#X201C;sank&#X201D; is the verb, and &#X201C;the blue ship&#X201D; is the second
+noun phrase. In addition we should say what a noun phrase is; for
+this example we shall say that a noun phrase is an optional article
+(a, an, the) followed by any number of adjectives followed by a noun.
+The tokens in our language are the articles, nouns, verbs, and
+adjectives. The <em>rules</em> in our language will tell us how to
+combine the tokens together to form lists of adjectives, noun phrases,
+and sentences:</p><ul class="itemize"><li class="li-itemize">
+<span style="font-family:monospace">sentence: noun_phrase verb noun_phrase</span>
+</li><li class="li-itemize"><span style="font-family:monospace">noun_phrase: [article] adjective* noun</span>
+</li></ul><p>Notice that some things that we said easily in English, such as
+&#X201C;optional article,&#X201D; are expressed using special syntax, such as
+brackets. When we said, &#X201C;any number of adjectives,&#X201D; we wrote
+<span style="font-family:monospace">adjective*</span>, where the <span style="font-family:monospace">*</span> means &#X201C;zero or more of the
+preceding pattern&#X201D;.</p><p>The grammar given above is close to a Yapps grammar. We also have to
+specify what the tokens are, and what to do when a pattern is matched.
+For this example, we will do nothing when patterns are matched; the
+next example will explain how to perform match actions.</p><pre class="verbatim">parser TinyEnglish:
+  ignore:          "\\W+"
+  token noun:      "(Jack|spam|ship)"
+  token verb:      "(sank|threw)"
+  token article:   "(a|an|the)"
+  token adjective: "(blue|red|green)"
+
+  rule sentence:       noun_phrase verb noun_phrase
+  rule noun_phrase:    [article] adjective* noun
+</pre><p>The tokens are specified as Python <em>regular expressions</em>. Since
+Yapps produces Python code, you can write any regular expression that
+would be accepted by Python. (<em>Note:</em> These are Python 1.5
+regular expressions from the <span style="font-family:monospace">re</span> module, not Python 1.4
+regular expressions from the <span style="font-family:monospace">regex</span> module.) In addition to
+tokens that you want to see (which are given names), you can also
+specify tokens to ignore, marked by the <span style="font-family:monospace">ignore</span> keyword. In
+this parser we want to ignore whitespace.</p><p>The TinyEnglish grammar shows how you define tokens and rules, but it
+does not specify what should happen once we&#X2019;ve matched the rules. In
+the next example, we will take a grammar and produce a <em>parse
+tree</em> from it.</p>
+<!--TOC subsection id="sec4" Lisp Expressions-->
+<h3 id="sec4" class="subsection">2.2&#XA0;&#XA0;Lisp Expressions</h3><!--SEC END --><p>Lisp syntax, although hated by many, has a redeeming quality: it is
+simple to parse. In this section we will construct a Yapps grammar to
+parse Lisp expressions and produce a parse tree as output.</p><!--TOC subsubsection id="sec5" Defining the Grammar-->
+<h4 id="sec5" class="subsubsection">Defining the Grammar</h4><!--SEC END --><p>The syntax of Lisp is simple. It has expressions, which are
+identifiers, strings, numbers, and lists. A list is a left
+parenthesis followed by some number of expressions (separated by
+spaces) followed by a right parenthesis. For example, <code>5</code>,
+<code>"ni"</code>, and <code>(print "1+2 = " (+ 1 2))</code> are Lisp expressions.
+Written as a grammar,</p><pre class="verbatim">    expr:   ID | STR | NUM | list
+    list:   ( expr* )  
+</pre><p>In addition to having a grammar, we need to specify what to do every
+time something is matched. For the tokens, which are strings, we just
+want to get the &#X201C;value&#X201D; of the token, attach its type (identifier,
+string, or number) in some way, and return it. For the lists, we want
+to construct and return a Python list.</p><p>Once some pattern is matched, we add a return statement enclosed
+in <code>{{...}}</code>. The braces allow us to insert any one-line
+statement into the parser. Within this statement, we can refer to the
+values returned by matching each part of the rule. After matching a
+token such as <span style="font-family:monospace">ID</span>, &#X201C;ID&#X201D; will be bound to the text of the
+matched token. Let&#X2019;s take a look at the rule:</p><pre class="verbatim">    rule expr: ID   {{ return ('id', ID) }}
+      ...
+</pre><p>In a rule, tokens return the text that was matched. For identifiers,
+we just return the identifier, along with a &#X201C;tag&#X201D; telling us that
+this is an identifier and not a string or some other value. Sometimes
+we may need to convert this text to a different form. For example, if
+a string is matched, we want to remove quotes and handle special forms
+like <code>\n</code>. If a number is matched, we want to convert it into a
+number. Let&#X2019;s look at the return values for the other tokens:</p><pre class="verbatim">      ...
+             | STR  {{ return ('str', eval(STR)) }}
+             | NUM  {{ return ('num', atoi(NUM)) }}
+      ...
+</pre><p>If we get a string, we want to remove the quotes and process any
+special backslash codes, so we run <span style="font-family:monospace">eval</span> on the quoted string.
+If we get a number, we convert it to an integer with <span style="font-family:monospace">atoi</span> and
+then return the number along with its type tag.</p><p>For matching a list, we need to do something slightly more
+complicated. If we match a Lisp list of expressions, we want to
+create a Python list with those values.</p><pre class="verbatim">    rule list: "\\("                 # Match the opening parenthesis
+               {{ result = [] }}     # Create a Python list
+               ( 
+                  expr               # When we match an expression,
+                  {{ result.append(expr) }}   # add it to the list
+               )*                    # * means repeat this if needed
+               "\\)"                 # Match the closing parenthesis
+               {{ return result }}   # Return the Python list
+</pre><p>In this rule we first match the opening parenthesis, then go into a
+loop. In this loop we match expressions and add them to the list.
+When there are no more expressions to match, we match the closing
+parenthesis and return the resulting list. Note that <code>#</code> is used for
+comments, just as in Python.</p><p>The complete grammar is specified as follows:
+</p><pre class="verbatim">parser Lisp:
+    ignore:      '\\s+'
+    token NUM:   '[0-9]+'
+    token ID:    '[-+*/!@%^&amp;=.a-zA-Z0-9_]+' 
+    token STR:   '"([^\\"]+|\\\\.)*"'
+
+    rule expr:   ID     {{ return ('id', ID) }}
+               | STR    {{ return ('str', eval(STR)) }}
+               | NUM    {{ return ('num', atoi(NUM)) }}
+               | list   {{ return list }}
+    rule list: "\\("    {{ result = [] }} 
+               ( expr   {{ result.append(expr) }}
+               )*  
+               "\\)"    {{ return result }} 
+</pre><p>One thing you may have noticed is that <code>"\\("</code> and <code>"\\)"</code>
+appear in the <span style="font-family:monospace">list</span> rule. These are <em>inline tokens</em>:
+they appear in the rules without being given a name with the
+<span style="font-family:monospace">token</span> keyword. Inline tokens are more convenient to use, but
+since they do not have a name, the text that is matched cannot be used
+in the return value. They are best used for short simple patterns
+(usually punctuation or keywords).</p><p>Another thing to notice is that the number and identifier tokens
+overlap. For example, &#X201C;487&#X201D; matches both NUM and ID. In Yapps, the
+scanner only tries to match tokens that are acceptable to the parser.
+This rule doesn&#X2019;t help here, since both NUM and ID can appear in the
+same place in the grammar. There are two rules used to pick tokens if
+more than one matches. One is that the <em>longest</em> match is
+preferred. For example, &#X201C;487x&#X201D; will match as an ID (487x) rather
+than as a NUM (487) followed by an ID (x). The second rule is that if
+the two matches are the same length, the <em>first</em> one listed in
+the grammar is preferred. For example, &#X201C;487&#X201D; will match as a NUM
+rather than an ID because NUM is listed first in the grammar. Inline
+tokens have preference over any tokens you have listed.</p><p>Now that our grammar is defined, we can run Yapps to produce a parser,
+and then run the parser to produce a parse tree.</p><!--TOC subsubsection id="sec6" Running Yapps-->
+<h4 id="sec6" class="subsubsection">Running Yapps</h4><!--SEC END --><p>In the Yapps module is a function <span style="font-family:monospace">generate</span> that takes an
+input filename and writes a parser to another file. We can use this
+function to generate the Lisp parser, which is assumed to be in
+<span style="font-family:monospace">lisp.g</span>.</p><pre class="verbatim">% python
+Python 1.5.1 (#1, Sep  3 1998, 22:51:17)  [GCC 2.7.2.3] on linux-i386
+Copyright 1991-1995 Stichting Mathematisch Centrum, Amsterdam
+&gt;&gt;&gt; import yapps
+&gt;&gt;&gt; yapps.generate('lisp.g')
+</pre><p>At this point, Yapps has written a file <span style="font-family:monospace">lisp.py</span> that contains
+the parser. In that file are two classes (one scanner and one parser)
+and a function (called <span style="font-family:monospace">parse</span>) that puts things together for
+you.</p><p>Alternatively, we can run Yapps from the command line to generate the
+parser file:</p><pre class="verbatim">% python yapps.py lisp.g
+</pre><p>After running Yapps either from within Python or from the command
+line, we can use the Lisp parser by calling the <span style="font-family:monospace">parse</span>
+function. The first parameter should be the rule we want to match,
+and the second parameter should be the string to parse.</p><pre class="verbatim">&gt;&gt;&gt; import lisp
+&gt;&gt;&gt; lisp.parse('expr', '(+ 3 4)')
+[('id', '+'), ('num', 3), ('num', 4)]
+&gt;&gt;&gt; lisp.parse('expr', '(print "3 = " (+ 1 2))')
+[('id', 'print'), ('str', '3 = '), [('id', '+'), ('num', 1), ('num', 2)]]
+</pre><p>The <span style="font-family:monospace">parse</span> function is not the only way to use the parser;
+section <a href="#sec%3AParser-Objects">5.1</a> describes how to access parser objects
+directly.</p><p>We&#X2019;ve now gone through the steps in creating a grammar, writing a
+grammar file for Yapps, producing a parser, and using the parser. In
+the next example we&#X2019;ll see how rules can take parameters and also how
+to do computations instead of just returning a parse tree.</p>
+<!--TOC subsection id="sec7" Calculator-->
+<h3 id="sec7" class="subsection">2.3&#XA0;&#XA0;Calculator</h3><!--SEC END --><p>A common example parser given in many textbooks is that for simple
+expressions, with numbers, addition, subtraction, multiplication,
+division, and parenthesization of subexpressions. We&#X2019;ll write this
+example in Yapps, evaluating the expression as we parse.</p><p>Unlike <span style="font-family:monospace">yacc</span>, Yapps does not have any way to specify
+precedence rules, so we have to do it ourselves. We say that an
+expression is the sum of factors, and that a factor is the product of
+terms, and that a term is a number or a parenthesized expression:</p><pre class="verbatim">    expr:           factor ( ("+"|"-") factor )*
+    factor:         term   ( ("*"|"/") term )*
+    term:           NUM | "(" expr ")"
+</pre><p>In order to evaluate the expression as we go, we should carry along an
+accumulator while evaluating the lists of terms or factors. Just as
+we kept a &#X201C;result&#X201D; variable to build a parse tree for Lisp
+expressions, we will use a variable to evaluate numerical
+expressions. The full grammar is given below:</p><pre class="verbatim">parser Calculator:
+    token END: "$"         # $ means end of string
+    token NUM: "[0-9]+"
+
+    rule goal:           expr END         {{ return expr }}
+
+    # An expression is the sum and difference of factors
+    rule expr:           factor           {{ v = factor }}
+                       ( "[+]" factor       {{ v = v+factor }}
+                       |  "-"  factor       {{ v = v-factor }}
+                       )*                 {{ return v }}
+
+    # A factor is the product and division of terms
+    rule factor:         term             {{ v = term }}
+                       ( "[*]" term         {{ v = v*term }}
+                       |  "/"  term         {{ v = v/term }}
+                       )*                 {{ return v }}
+
+    # A term is either a number or an expression surrounded by parentheses
+    rule term:           NUM              {{ return atoi(NUM) }}
+                       | "\\(" expr "\\)" {{ return expr }}
+</pre><p>The top-level rule is <em>goal</em>, which says that we are looking for
+an expression followed by the end of the string. The <span style="font-family:monospace">END</span>
+token is needed because without it, it isn&#X2019;t clear when to stop
+parsing. For example, the string &#X201C;1+3&#X201D; could be parsed either as
+the expression &#X201C;1&#X201D; followed by the string &#X201C;+3&#X201D; or it could be
+parsed as the expression &#X201C;1+3&#X201D;. By requiring expressions to end
+with <span style="font-family:monospace">END</span>, the parser is forced to take &#X201C;1+3&#X201D;.</p><p>In the two rules with repetition, the accumulator is named <span style="font-family:monospace">v</span>.
+After reading in one expression, we initialize the accumulator. Each
+time through the loop, we modify the accumulator by adding,
+subtracting, multiplying by, or dividing the previous accumulator by
+the expression that has been parsed. At the end of the rule, we
+return the accumulator.</p><p>The calculator example shows how to process lists of elements using
+loops, as well as how to handle precedence of operators.</p><p><em>Note:</em> It&#X2019;s often important to put the <span style="font-family:monospace">END</span> token in, so 
+put it in unless you are sure that your grammar has some other
+non-ambiguous token marking the end of the program.</p>
+<!--TOC subsection id="sec8" Calculator with Memory-->
+<h3 id="sec8" class="subsection">2.4&#XA0;&#XA0;Calculator with Memory</h3><!--SEC END --><p>In the previous example we learned how to write a calculator that
+evaluates simple numerical expressions. In this section we will
+extend the example to support both local and global variables.</p><p>To support global variables, we will add assignment statements to the
+&#X201C;goal&#X201D; rule.</p><pre class="verbatim">    rule goal:           expr END         {{ return expr }}
+              | 'set' ID expr END         {{ global_vars[ID] = expr }}
+                                          {{ return expr }}   
+</pre><p>To use these variables, we need a new kind of terminal:</p><pre class="verbatim">    rule term: ... | ID {{ return global_vars[ID] }} 
+</pre><p>So far, these changes are straightforward. We simply have a global
+dictionary <span style="font-family:monospace">global_vars</span> that stores the variables and values, 
+we modify it when there is an assignment statement, and we look up
+variables in it when we see a variable name.</p><p>To support local variables, we will add variable declarations to the
+set of allowed expressions.</p><pre class="verbatim">    rule term: ... | 'let' VAR '=' expr 'in' expr ...
+</pre><p>This is where it becomes tricky. Local variables should be stored in
+a local dictionary, not in the global one. One trick would be to save 
+a copy of the global dictionary, modify it, and then restore it
+later. In this example we will instead use <em>attributes</em> to
+create local information and pass it to subrules.</p><p>A rule can optionally take parameters. When we invoke the rule, we
+must pass in arguments. For local variables, let&#X2019;s use a single
+parameter, <span style="font-family:monospace">local_vars</span>:</p><pre class="verbatim">    rule expr&lt;&lt;local_vars&gt;&gt;:   ...
+    rule factor&lt;&lt;local_vars&gt;&gt;: ...
+    rule term&lt;&lt;local_vars&gt;&gt;:   ...
+</pre><p>Each time we want to match <span style="font-family:monospace">expr</span>, <span style="font-family:monospace">factor</span>, or
+<span style="font-family:monospace">term</span>, we will pass the local variables in the current rule to
+the subrule. One interesting case is when we pass as an argument
+something <em>other</em> than <span style="font-family:monospace">local_vars</span>:</p><pre class="verbatim">   rule term&lt;&lt;local_vars&gt;&gt;: ...
+                | 'let' VAR '=' expr&lt;&lt;local_vars&gt;&gt;
+                  {{ local_vars = [(VAR, expr)] + local_vars }}
+                  'in' expr&lt;&lt;local_vars&gt;&gt;
+                  {{ return expr }}
+</pre><p>Note that the assignment to the local variables list does not modify
+the original list. This is important to keep local variables from
+being seen outside the &#X201C;let&#X201D;.</p><p>The other interesting case is when we find a variable:</p><pre class="verbatim">global_vars = {}
+
+def lookup(map, name):
+    for x,v in map:  if x==name: return v
+    return global_vars[name]
+%%
+   ...
+   rule term&lt;&lt;local_vars&gt;&gt;: ...
+                | VAR {{ return lookup(local_vars, VAR) }}
+</pre><p>The lookup function will search through the local variable list, and
+if it cannot find the name there, it will look it up in the global
+variable dictionary.</p><p>A complete grammar for this example, including a read-eval-print loop
+for interacting with the calculator, can be found in the examples
+subdirectory included with Yapps.</p><p>In this section we saw how to insert code before the parser. We also
+saw how to use attributes to transmit local information from one rule
+to its subrules.</p>
+<!--TOC section id="sec9" Grammars-->
+<h2 id="sec9" class="section">3&#XA0;&#XA0;Grammars</h2><!--SEC END --><p>Each Yapps grammar has a name, a list of tokens, and a set of
+production rules. A grammar named <span style="font-family:monospace">X</span> will be used to produce
+a parser named <span style="font-family:monospace">X</span> and a scanner named <span style="font-family:monospace">XScanner</span>. As
+in Python, names are case sensitive, start with a letter, and contain
+letters, numbers, and underscores (_).</p><p>There are three kinds of tokens in Yapps: named, inline, and ignored.
+As their name implies, named tokens are given a name, using the token
+construct: <span style="font-family:monospace">token </span><span style="font-family:monospace"><em>name</em></span><span style="font-family:monospace"> : </span><span style="font-family:monospace"><em>regexp</em></span>. In a rule, the
+token can be matched by using the name. Inline tokens are regular
+expressions that are used in rules without being declared. Ignored
+tokens are declared using the ignore construct: <span style="font-family:monospace">ignore:
+</span><span style="font-family:monospace"><em>regexp</em></span>. These tokens are ignored by the scanner, and are
+not seen by the parser. Often whitespace is an ignored token. The
+regular expressions used to define tokens should use the syntax
+defined in the <span style="font-family:monospace">re</span> module, so some symbols may have to be
+backslashed.</p><p>Production rules in Yapps have a name and a pattern to match. If the
+rule is parameterized, the name should be followed by a list of
+parameter names in <code>&lt;&lt;...&gt;&gt;</code>. A pattern can be a simple pattern
+or a compound pattern. Simple patterns are the name of a named token,
+a regular expression in quotes (inline token), the name of a
+production rule (followed by arguments in <code>&lt;&lt;...&gt;&gt;</code>, if the rule
+has parameters), and single line Python statements (<code>{{...}}</code>).
+Compound patterns are sequences (<code>A B C ...</code>), choices (
+<code>A | B | C | ...</code>), options (<code>[...]</code>), zero-or-more repetitions
+(<code>...*</code>), and one-or-more repetitions (<code>...+</code>). Like
+regular expressions, repetition operators have a higher precedence
+than sequences, and sequences have a higher precedence than choices.</p><p>Whenever <code>{{...}}</code> is used, a legal one-line Python statement
+should be put inside the braces. The token <code>}}</code> should not
+appear within the <code>{{...}}</code> section, even within a string, since
+Yapps does not attempt to parse the Python statement. A workaround
+for strings is to put two strings together (<code>"}" "}"</code>), or to use
+backslashes (<code>"}\}"</code>). At the end of a rule you should use a
+<code>{{ return X }}</code> statement to return a value. However, you
+should <em>not</em> use any control statements (<span style="font-family:monospace">return</span>,
+<span style="font-family:monospace">continue</span>, <span style="font-family:monospace">break</span>) in the middle of a rule. Yapps
+needs to make assumptions about the control flow to generate a parser,
+and any changes to the control flow will confuse Yapps.</p><p>The <code>&lt;&lt;...&gt;&gt;</code> form can occur in two places: to define parameters
+to a rule and to give arguments when matching a rule. Parameters use
+the syntax used for Python functions, so they can include default
+arguments and the special forms (<code>*args</code> and <code>**kwargs</code>).
+Arguments use the syntax for Python function call arguments, so they
+can include normal arguments and keyword arguments. The token
+<code>&gt;&gt;</code> should not appear within the <code>&lt;&lt;...&gt;&gt;</code> section.</p><p>In both the statements and rule arguments, you can use names defined
+by the parser to refer to matched patterns. You can refer to the text
+matched by a named token by using the token name. You can use the
+value returned by a production rule by using the name of that rule.
+If a name <span style="font-family:monospace">X</span> is matched more than once (such as in loops), you
+will have to save the earlier value(s) in a temporary variable, and
+then use that temporary variable in the return value. The next
+section has an example of a name that occurs more than once.</p>
+<!--TOC subsection id="sec10" Left Factoring-->
+<h3 id="sec10" class="subsection">3.1&#XA0;&#XA0;Left Factoring</h3><!--SEC END --><p>
+<a id="sec:Left-Factoring"></a></p><p>Yapps produces ELL(1) parsers, which determine which clause to match
+based on the first token available. Sometimes the leftmost tokens of
+several clauses may be the same. The classic example is the
+<em>if/then/else</em> construct in Pascal:</p><pre class="verbatim">rule stmt:  "if" expr "then" stmt {{ then_part = stmt }} 
+                      "else" stmt {{ return ('If',expr,then_part,stmt) }}
+          | "if" expr "then" stmt {{ return ('If',expr,stmt,[]) }}
+</pre><p>(Note that we have to save the first <span style="font-family:monospace">stmt</span> into a variable
+because there is another <span style="font-family:monospace">stmt</span> that will be matched.) The
+left portions of the two clauses are the same, which presents a
+problem for the parser. The solution is <em>left-factoring</em>: the
+common parts are put together, and <em>then</em> a choice is made about
+the remaining part:</p><pre class="verbatim">rule stmt:  "if" expr 
+              "then" stmt {{ then_part = stmt }}
+              {{ else_part = [] }}
+              [ "else" stmt {{ else_part = stmt }} ]
+            {{ return ('If', expr, then_part, else_part) }}
+</pre><p>Unfortunately, the classic <em>if/then/else</em> situation is
+<em>still</em> ambiguous when you left-factor. Yapps can deal with this
+situation, but will report a warning; see section
+<a href="#sec%3AAmbiguous-Grammars">3.3</a> for details.</p><p>In general, replace rules of the form:</p><pre class="verbatim">rule A:   a b1 {{ return E1 }}
+        | a b2 {{ return E2 }}
+        | c3   {{ return E3 }}
+        | c4   {{ return E4 }}
+</pre><p>with rules of the form:</p><pre class="verbatim">rule A:   a ( b1 {{ return E1 }}
+            | b2 {{ return E2 }}
+            )
+        | c3   {{ return E3 }}
+        | c4   {{ return E4 }}
+</pre>
+<!--TOC subsection id="sec11" Left Recursion-->
+<h3 id="sec11" class="subsection">3.2&#XA0;&#XA0;Left Recursion</h3><!--SEC END --><p>A common construct in grammars is for matching a list of patterns,
+sometimes separated with delimiters such as commas or semicolons. In
+LR-based parser systems, we can parse a list with something like this:</p><pre class="verbatim">rule sum:  NUM             {{ return NUM }}
+         | sum "+" NUM     {{ return (sum, NUM) }}
+</pre><p>Parsing <span style="font-family:monospace">1+2+3+4</span> would produce the output
+<span style="font-family:monospace">(((1,2),3),4)</span>, which is what we want from a left-associative
+addition operator. Unfortunately, this grammar is <em>left
+recursive,</em> because the <span style="font-family:monospace">sum</span> rule contains a clause that
+begins with <span style="font-family:monospace">sum</span>. (The recursion occurs at the left side of
+the clause.)</p><p>We must restructure this grammar to be <em>right recursive</em> instead:</p><pre class="verbatim">rule sum:  NUM             {{ return NUM }}
+         | NUM "+" sum     {{ return (NUM, sum) }}
+</pre><p>Unfortunately, using this grammar, <span style="font-family:monospace">1+2+3+4</span> would be parsed as
+<span style="font-family:monospace">(1,(2,(3,4)))</span>, which no longer follows left associativity.
+The rule also needs to be left-factored. Instead, we write the
+pattern as a loop:</p><pre class="verbatim">rule sum:       NUM {{ v = NUM }}
+                ( "[+]" NUM {{ v = (v,NUM) }} )*
+                {{ return v }}
+</pre><p>In general, replace rules of the form:</p><pre class="verbatim">rule A:  A a1 -&gt; &lt;&lt; E1 &gt;&gt; 
+       | A a2 -&gt; &lt;&lt; E2 &gt;&gt;
+       | b3   -&gt; &lt;&lt; E3 &gt;&gt;
+       | b4   -&gt; &lt;&lt; E4 &gt;&gt;
+</pre><p>with rules of the form:</p><pre class="verbatim">rule A:  ( b3 {{ A = E3 }} 
+         | b4 {{ A = E4 }} )
+         ( a1 {{ A = E1 }}
+         | a2 {{ A = E2 }} )*
+         {{ return A }}
+</pre><p>We have taken a rule that proved problematic with recursion and
+turned it into a rule that works well with looping constructs.</p>
+<!--TOC subsection id="sec12" Ambiguous Grammars-->
+<h3 id="sec12" class="subsection">3.3&#XA0;&#XA0;Ambiguous Grammars</h3><!--SEC END --><p>
+<a id="sec:Ambiguous-Grammars"></a></p><p>In section <a href="#sec%3ALeft-Factoring">3.1</a> we saw the classic if/then/else
+ambiguity, which occurs because the &#X201C;else &#X2026;&#X201D; portion of an &#X201C;if
+&#X2026;then &#X2026;else &#X2026;&#X201D; construct is optional. Programs with 
+nested if/then/else constructs can be ambiguous when one of the else
+clauses is missing:
+</p><pre class="verbatim">if 1 then            if 1 then
+    if 5 then            if 5 then
+        x := 1;              x := 1;
+    else             else
+        y := 9;          y := 9;
+</pre><p>The indentation shows that the program can be parsed in two different
+ways. (Of course, if we all would adopt Python&#X2019;s indentation-based
+structuring, this would never happen!) Usually we want the parsing on
+the left: the &#X201C;else&#X201D; should be associated with the closest &#X201C;if&#X201D;
+statement. In section <a href="#sec%3ALeft-Factoring">3.1</a> we &#X201C;solved&#X201D; the
+problem by using the following grammar:</p><pre class="verbatim">rule stmt:  "if" expr 
+              "then" stmt {{ then_part = stmt }}
+              {{ else_part = [] }}
+              [ "else" stmt {{ else_part = stmt }} ]
+            {{ return ('If', expr, then_part, else_part) }}
+</pre><p>Here, we have an optional match of &#X201C;else&#X201D; followed by a statement.
+The ambiguity is that if an &#X201C;else&#X201D; is present, it is not clear
+whether you want it parsed immediately or if you want it to be parsed
+by the outer &#X201C;if&#X201D;.</p><p>Yapps will deal with the situation by matching the else pattern
+when it can. The parser will work in this case because it prefers the
+<em>first</em> matching clause, which tells Yapps to parse the &#X201C;else&#X201D;.
+That is exactly what we want!</p><p>For ambiguity cases with choices, Yapps will choose the <em>first</em>
+matching choice. However, remember that Yapps only looks at the first 
+token to determine its decision, so <span style="font-family:monospace">(a b | a c)</span> will result in
+Yapps choosing <span style="font-family:monospace">a b</span> even when the input is <span style="font-family:monospace">a c</span>. It only
+looks at the first token, <span style="font-family:monospace">a</span>, to make its decision.</p>
+<!--TOC section id="sec13" Customization-->
+<h2 id="sec13" class="section">4&#XA0;&#XA0;Customization</h2><!--SEC END --><p>Both the parsers and the scanners can be customized. The parser is
+usually extended by subclassing, and the scanner can either be
+subclassed or completely replaced.</p>
+<!--TOC subsection id="sec14" Customizing Parsers-->
+<h3 id="sec14" class="subsection">4.1&#XA0;&#XA0;Customizing Parsers</h3><!--SEC END --><p>If additional fields and methods are needed in order for a parser to
+work, Python subclassing can be used. (This is unlike parser classes
+written in static languages, in which these fields and methods must be
+defined in the generated parser class.) We simply subclass the
+generated parser, and add any fields or methods required. Expressions
+in the grammar can call methods of the subclass to perform any actions
+that cannot be expressed as a simple expression. For example,
+consider this simple grammar:</p><pre class="verbatim">parser X:
+    rule goal:  "something"  {{ self.printmsg() }}
+</pre><p>The <span style="font-family:monospace">printmsg</span> function need not be implemented in the parser
+class <span style="font-family:monospace">X</span>; it can be implemented in a subclass:</p><pre class="verbatim">import Xparser
+
+class MyX(Xparser.X):
+    def printmsg(self):
+        print "Hello!"
+</pre>
+<!--TOC subsection id="sec15" Customizing Scanners-->
+<h3 id="sec15" class="subsection">4.2&#XA0;&#XA0;Customizing Scanners</h3><!--SEC END --><p>The generated parser class is not dependent on the generated scanner
+class. A scanner object is passed to the parser object&#X2019;s constructor
+in the <span style="font-family:monospace">parse</span> function. To use a different scanner, write
+your own function to construct parser objects, with an instance of a
+different scanner. Scanner objects must have a <span style="font-family:monospace">token</span> method
+that accepts an integer <span style="font-family:monospace">N</span> as well as a list of allowed token
+types, and returns the Nth token, as a tuple. The default scanner
+raises <span style="font-family:monospace">NoMoreTokens</span> if no tokens are available, and
+<span style="font-family:monospace">SyntaxError</span> if no token could be matched. However, the
+parser does not rely on these exceptions; only the <span style="font-family:monospace">parse</span>
+convenience function (which calls <span style="font-family:monospace">wrap_error_reporter</span>) and
+the <span style="font-family:monospace">print_error</span> error display function use those exceptions.</p><p>The tuples representing tokens have four elements. The first two are
+the beginning and ending indices of the matched text in the input
+string. The third element is the type tag, matching either the name
+of a named token or the quoted regexp of an inline or ignored token.
+The fourth element of the token tuple is the matched text. If the
+input string is <span style="font-family:monospace">s</span>, and the token tuple is
+<span style="font-family:monospace">(b,e,type,val)</span>, then <span style="font-family:monospace">val</span> should be equal to
+<span style="font-family:monospace">s[b:e]</span>.</p><p>The generated parsers do not use the beginning or ending index. They use
+only the token type and value. However, the default error reporter
+uses the beginning and ending index to show the user where the error
+is.</p>
+<!--TOC section id="sec16" Parser Mechanics-->
+<h2 id="sec16" class="section">5&#XA0;&#XA0;Parser Mechanics</h2><!--SEC END --><p>The base parser class (Parser) defines two methods, <span style="font-family:monospace">_scan</span>
+and <span style="font-family:monospace">_peek</span>, and two fields, <span style="font-family:monospace">_pos</span> and
+<span style="font-family:monospace">_scanner</span>. The generated parser inherits from the base
+parser, and contains one method for each rule in the grammar. To
+avoid name clashes, do not use names that begin with an underscore
+(<span style="font-family:monospace">_</span>).</p>
+<!--TOC subsection id="sec17" Parser Objects-->
+<h3 id="sec17" class="subsection">5.1&#XA0;&#XA0;Parser Objects</h3><!--SEC END --><p>
+<a id="sec:Parser-Objects"></a></p><p>Yapps produces as output two exception classes, a scanner class, a
+parser class, and a function <span style="font-family:monospace">parse</span> that puts everything
+together. The <span style="font-family:monospace">parse</span> function does not have to be used;
+instead, one can create a parser and scanner object and use them
+together for parsing.</p><pre class="verbatim">    def parse(rule, text):
+        P = X(XScanner(text))
+        return wrap_error_reporter(P, rule)
+</pre><p>The <span style="font-family:monospace">parse</span> function takes a name of a rule and an input string
+as input. It creates a scanner and parser object, then calls
+<span style="font-family:monospace">wrap_error_reporter</span> to execute the method in the parser
+object named <span style="font-family:monospace">rule</span>. The wrapper function will call the
+appropriate parser rule and report any parsing errors to standard
+output.</p><p>There are several situations in which the <span style="font-family:monospace">parse</span> function
+would not be useful. If a different parser or scanner is being used,
+or exceptions are to be handled differently, a new <span style="font-family:monospace">parse</span>
+function would be required. The supplied <span style="font-family:monospace">parse</span> function can
+be used as a template for writing a function for your own needs. An
+example of a custom parse function is the <span style="font-family:monospace">generate</span> function
+in <span style="font-family:monospace">Yapps.py</span>.</p>
+<!--TOC subsection id="sec18" Context Sensitive Scanner-->
+<h3 id="sec18" class="subsection">5.2&#XA0;&#XA0;Context Sensitive Scanner</h3><!--SEC END --><p>Unlike most scanners, the scanner produced by Yapps can take into
+account the context in which tokens are needed, and try to match only
+good tokens. For example, in the grammar:</p><pre class="verbatim">parser IniFile:
+   token ID:   "[a-zA-Z_0-9]+"
+   token VAL:  ".*"
+
+   rule pair:  ID "[ \t]*=[ \t]*" VAL "\n"
+</pre><p>we would like to scan lines of text and pick out a name/value pair.
+In a conventional scanner, the input string <span style="font-family:monospace">shell=progman.exe</span>
+would be turned into a single token of type <span style="font-family:monospace">VAL</span>. The Yapps
+scanner, however, knows that at the beginning of the line, an
+<span style="font-family:monospace">ID</span> is expected, so it will return <span style="font-family:monospace">"shell"</span> as a token
+of type <span style="font-family:monospace">ID</span>. Later, it will return <span style="font-family:monospace">"progman.exe"</span> as
+a token of type <span style="font-family:monospace">VAL</span>.</p><p>Context sensitivity decreases the separation between scanner and
+parser, but it is useful in parsers like <span style="font-family:monospace">IniFile</span>, where the
+tokens themselves are not unambiguous, but <em>are</em> unambiguous
+given a particular stage in the parsing process.</p><p>Unfortunately, context sensitivity can make it more difficult to
+detect errors in the input. For example, in parsing a Pascal-like
+language with &#X201C;begin&#X201D; and &#X201C;end&#X201D; as keywords, a context sensitive
+scanner would only match &#X201C;end&#X201D; as the END token if the parser is in
+a place that will accept the END token. If not, then the scanner
+would match &#X201C;end&#X201D; as an identifier. To disable the context
+sensitive scanner in Yapps, add the
+<span style="font-family:monospace">context-insensitive-scanner</span> option to the grammar:</p><pre class="verbatim">parser X:
+    option:  "context-insensitive-scanner"
+</pre><p>Context-insensitive scanning makes the parser look cleaner as well.</p>
+<!--TOC subsection id="sec19" Internal Variables-->
+<h3 id="sec19" class="subsection">5.3&#XA0;&#XA0;Internal Variables</h3><!--SEC END --><p>There are two internal fields that may be of use. The parser object
+has two fields, <span style="font-family:monospace">_pos</span>, which is the index of the current
+token being matched, and <span style="font-family:monospace">_scanner</span>, which is the scanner
+object. The token itself can be retrieved by accessing the scanner
+object and calling the <span style="font-family:monospace">token</span> method with the token index. However, if you call <span style="font-family:monospace">token</span> before the token has been requested by the parser, it may mess up a context-sensitive scanner.<sup><a id="text1" href="#note1">1</a></sup> A
+potentially useful combination of these fields is to extract the
+portion of the input matched by the current rule. To do this, just save the scanner state (<span style="font-family:monospace">_scanner.pos</span>) before the text is matched and then again after the text is matched:</p><pre class="verbatim">  rule R: 
+      {{ start = self._scanner.pos }}
+      a b c 
+      {{ end = self._scanner.pos }}
+      {{ print 'Text is', self._scanner.input[start:end] }}
+</pre>
+<!--TOC subsection id="sec20" Pre- and Post-Parser Code-->
+<h3 id="sec20" class="subsection">5.4&#XA0;&#XA0;Pre- and Post-Parser Code</h3><!--SEC END --><p>Sometimes the parser code needs to rely on helper variables,
+functions, and classes. A Yapps grammar can optionally be surrounded
+by double percent signs, to separate the grammar from Python code.</p><pre class="verbatim">... Python code ...
+%%
+... Yapps grammar ...
+%%
+... Python code ...
+</pre><p>The second <code>%%</code> can be omitted if there is no Python code at the
+end, and the first <code>%%</code> can be omitted if there is no extra
+Python code at all. (To have code only at the end, both separators
+are required.)</p><p>If the second <code>%%</code> is omitted, Yapps will insert testing code
+that allows you to use the generated parser to parse a file.</p><p>The extended calculator example in the Yapps examples subdirectory
+includes both pre-parser and post-parser code.</p>
+<!--TOC subsection id="sec21" Representation of Grammars-->
+<h3 id="sec21" class="subsection">5.5&#XA0;&#XA0;Representation of Grammars</h3><!--SEC END --><p>For each kind of pattern there is a class derived from Pattern. Yapps 
+has classes for Terminal, NonTerminal, Sequence, Choice, Option, Plus, 
+Star, and Eval. Each of these classes has the following interface:</p><ul class="itemize"><li class="li-itemize">
+setup(<em>gen</em>) Set accepts-&#X454;, and call
+<em>gen.changed()</em> if it changed. This function can change the
+flag from false to true but <em>not</em> from true to false.
+</li><li class="li-itemize">update(<em>gen</em>) Set <span style="font-variant:small-caps">first</span> and <span style="font-variant:small-caps">follow</span>, and call
+<em>gen.changed()</em> if either changed. This function can add to
+the sets but <em>not</em> remove from them.
+</li><li class="li-itemize">output(<em>gen</em>, <em>indent</em>) Generate code for matching
+this rule, using <em>indent</em> as the current indentation level.
+Writes are performed using <em>gen.write</em>.
+</li><li class="li-itemize">used(<em>vars</em>) Given a list of variables <em>vars</em>,
+return two lists: one containing the variables that are used, and
+one containing the variables that are assigned. This function is
+used for optimizing the resulting code.
+</li></ul><p>Both <em>setup</em> and <em>update</em> monotonically increase the
+variables they modify. Since the variables can only increase a finite
+number of times, we can repeatedly call the function until the
+variable stabilizes. The <em>used</em> function is not currently
+implemented.</p><p>With each pattern in the grammar Yapps associates three pieces of
+information: the <span style="font-variant:small-caps">first</span> set, the <span style="font-variant:small-caps">follow</span> set, and the
+accepts-&#X454; flag.</p><p>The <span style="font-variant:small-caps">first</span> set contains the tokens that can appear as we start
+matching the pattern. The <span style="font-variant:small-caps">follow</span> set contains the tokens that can
+appear immediately after we match the pattern. The accepts-&#X454; 
+flag is true if the pattern can match no tokens. In this case, <span style="font-variant:small-caps">first</span> will contain all the elements in <span style="font-variant:small-caps">follow</span>. The <span style="font-variant:small-caps">follow</span> set is not
+needed when accepts-&#X454; is false, and may not be accurate in
+those cases.</p><p>Yapps does not compute these sets precisely. Its approximation can
+miss certain cases, such as this one:</p><pre class="verbatim">  rule C: ( A* | B )
+  rule B: C [A]
+</pre><p>Yapps will calculate <span style="font-family:monospace">C</span>&#X2019;s <span style="font-variant:small-caps">follow</span> set to include <span style="font-family:monospace">A</span>.
+However, <span style="font-family:monospace">C</span> will always match all the <span style="font-family:monospace">A</span>&#X2019;s, so <span style="font-family:monospace">A</span> will
+never follow it. Yapps 2.0 does not properly handle this construct,
+but if it seems important, I may add support for it in a future
+version.</p><p>Yapps also cannot handle constructs that depend on the calling
+sequence. For example:</p><pre class="verbatim">  rule R: U | 'b'
+  rule S:   | 'c'
+  rule T: S 'b'
+  rule U: S 'a'
+</pre><p>The <span style="font-variant:small-caps">follow</span> set for <span style="font-family:monospace">S</span> includes <span style="font-family:monospace">a</span> and <span style="font-family:monospace">b</span>. Since <span style="font-family:monospace">S</span> can be empty, the <span style="font-variant:small-caps">first</span> set for <span style="font-family:monospace">S</span> should include <span style="font-family:monospace">a</span>,
+<span style="font-family:monospace">b</span>, and <span style="font-family:monospace">c</span>. However, when parsing <span style="font-family:monospace">R</span>, if the lookahead
+is <span style="font-family:monospace">b</span> we should <em>not</em> parse <span style="font-family:monospace">U</span>. That&#X2019;s because in <span style="font-family:monospace">U</span>, <span style="font-family:monospace">S</span> is followed by <span style="font-family:monospace">a</span> and not <span style="font-family:monospace">b</span>. Therefore in
+<span style="font-family:monospace">R</span>, we should choose rule <span style="font-family:monospace">U</span> only if there is an <span style="font-family:monospace">a</span> or
+<span style="font-family:monospace">c</span>, but not if there is a <span style="font-family:monospace">b</span>. Yapps and many other LL(1)
+systems do not distinguish <span style="font-family:monospace">S b</span> and <span style="font-family:monospace">S a</span>, making <span style="font-family:monospace">S</span>&#X2019;s <span style="font-variant:small-caps">follow</span> set <span style="font-family:monospace">a, b</span>, and making <span style="font-family:monospace">R</span> always try to match
+<span style="font-family:monospace">U</span>. In this case we can solve the problem by changing <span style="font-family:monospace">R</span> to 
+<code>'b' | U</code> but it may not always be possible to solve all such
+problems in this way.</p>
+<!--TOC section id="sec22" Grammar for Parsers-->
+<h2 id="sec22" class="section">A&#XA0;&#XA0;Grammar for Parsers</h2><!--SEC END --><p>This is the grammar for parsers, without any Python code mixed in.
+The complete grammar can be found in <span style="font-family:monospace">parsedesc.g</span> in the Yapps
+distribution.</p><pre class="verbatim">parser ParserDescription:
+    ignore:      "\\s+"
+    ignore:      "#.*?\r?\n"
+    token END:   "$"  # $ means end of string
+    token ATTR:  "&lt;&lt;.+?&gt;&gt;"
+    token STMT:  "{{.+?}}"
+    token ID:    '[a-zA-Z_][a-zA-Z_0-9]*'
+    token STR:   '[rR]?\'([^\\n\'\\\\]|\\\\.)*\'|[rR]?"([^\\n"\\\\]|\\\\.)*"'
+
+    rule Parser: "parser" ID ":"
+                   Options
+                   Tokens
+                   Rules
+                 END 
+
+    rule Options:  ( "option" ":" STR )*
+    rule Tokens:   ( "token" ID ":" STR | "ignore"   ":" STR )*
+    rule Rules:    ( "rule" ID OptParam ":" ClauseA )*
+
+    rule ClauseA:  ClauseB ( '[|]' ClauseB )*
+    rule ClauseB:  ClauseC*
+    rule ClauseC:  ClauseD [ '[+]' | '[*]' ]
+    rule ClauseD:  STR | ID [ATTR] | STMT
+                 | '\\(' ClauseA '\\)' | '\\[' ClauseA '\\]'
+</pre>
+<!--TOC section id="sec23" Upgrading-->
+<h2 id="sec23" class="section">B&#XA0;&#XA0;Upgrading</h2><!--SEC END --><p>Yapps 2.0 is not backwards compatible with Yapps 1.0. In this section 
+are some tips for upgrading:</p><ol class="enumerate" type=1><li class="li-enumerate">
+Yapps 1.0 was distributed as a single file. Yapps 2.0 is
+instead distributed as two Python files: a <em>parser generator</em>
+(26k) and a <em>parser runtime</em> (5k). You need both files to
+create parsers, but you need only the runtime (<span style="font-family:monospace">yappsrt.py</span>)
+to use the parsers.</li><li class="li-enumerate">Yapps 1.0 supported Python 1.4 regular expressions from the
+<span style="font-family:monospace">regex</span> module. Yapps 2.0 uses Python 1.5 regular
+expressions from the <span style="font-family:monospace">re</span> module. <em>The new syntax for
+regular expressions is not compatible with the old syntax.</em>
+Andrew Kuchling has a
+<a href="http://www.python.org/doc/howto/regex-to-re/">guide to converting
+regular expressions</a> on his
+web page.</li><li class="li-enumerate">Yapps 1.0 wants a pattern and then a return value in <code>-&gt;</code>
+<code>&lt;&lt;...&gt;&gt;</code>. Yapps 2.0 allows patterns and Python statements to
+be mixed. To convert a rule like this:<pre class="verbatim">rule R: A B C -&gt; &lt;&lt; E1 &gt;&gt;
+      | X Y Z -&gt; &lt;&lt; E2 &gt;&gt;
+</pre><p>to Yapps 2.0 form, replace the return value specifiers with return
+statements:</p><pre class="verbatim">rule R: A B C {{ return E1 }}
+      | X Y Z {{ return E2 }}
+</pre></li><li class="li-enumerate">Yapps 2.0 does not perform tail recursion elimination. This
+means any recursive rules you write will be turned into recursive
+methods in the parser. The parser will work, but may be slower.
+It can be made faster by rewriting recursive rules, using instead
+the looping operators <code>*</code> and <code>+</code> provided in Yapps 2.0.</li></ol>
+<!--TOC section id="sec24" Troubleshooting-->
+<h2 id="sec24" class="section">C&#XA0;&#XA0;Troubleshooting</h2><!--SEC END --><ul class="itemize"><li class="li-itemize">
+A common error is to write a grammar that doesn&#X2019;t have an END
+token. End tokens are needed when it is not clear when to stop
+parsing. For example, when parsing the expression <span style="font-family:monospace">3+5</span>, it is 
+not clear after reading <span style="font-family:monospace">3</span> whether to treat it as a complete
+expression or whether the parser should continue reading.
+Therefore the grammar for numeric expressions should include an end 
+token. Another example is the grammar for Lisp expressions. In
+Lisp, it is always clear when you should stop parsing, so you do
+<em>not</em> need an end token. In fact, it may be more useful not
+to have an end token, so that you can read in several Lisp expressions.
+</li><li class="li-itemize">If there is a chance of ambiguity, make sure to put the choices 
+in the order you want them checked. Usually the most specific
+choice should be first. Empty sequences should usually be last.
+</li><li class="li-itemize">The context sensitive scanner is not appropriate for all
+grammars. You might try using the insensitive scanner with the
+<span style="font-family:monospace">context-insensitive-scanner</span> option in the grammar.
+</li><li class="li-itemize">If performance turns out to be a problem, try writing a custom
+scanner. The Yapps scanner is rather slow (but flexible and easy
+to understand).
+</li></ul>
+<!--TOC section id="sec25" History-->
+<h2 id="sec25" class="section">D&#XA0;&#XA0;History</h2><!--SEC END --><p>Yapps 1 had several limitations that bothered me while writing
+parsers:</p><ol class="enumerate" type=1><li class="li-enumerate">
+It was not possible to insert statements into the generated
+parser. A common workaround was to write an auxiliary function
+that executed those statements, and to call that function as part
+of the return value calculation. For example, several of my
+parsers had an &#X201C;append(x,y)&#X201D; function that existed solely to call 
+&#X201C;x.append(y)&#X201D;.
+</li><li class="li-enumerate">The way in which grammars were specified was rather
+restrictive: a rule was a choice of clauses. Each clause was a
+sequence of tokens and rule names, followed by a return value.
+</li><li class="li-enumerate">Optional matching had to be put into a separate rule because
+choices were only made at the beginning of a rule.
+</li><li class="li-enumerate">Repetition had to be specified in terms of recursion. Not only 
+was this awkward (sometimes requiring additional rules), I had to
+add a tail recursion optimization to Yapps to transform the
+recursion back into a loop.
+</li></ol><p>Yapps 2 addresses each of these limitations.</p><ol class="enumerate" type=1><li class="li-enumerate">
+Statements can occur anywhere within a rule. (However, only
+one-line statements are allowed; multiline blocks marked by
+indentation are not.)
+</li><li class="li-enumerate">Grammars can be specified using any mix of sequences, choices,
+tokens, and rule names. To allow for complex structures,
+parentheses can be used for grouping.
+</li><li class="li-enumerate">Given choices and parenthesization, optional matching can be
+expressed as a choice between some pattern and nothing. In
+addition, Yapps 2 has the convenience syntax <code>[A B ...]</code> for
+matching <code>A B ...</code> optionally.
+</li><li class="li-enumerate">Repetition operators <code>*</code> for zero or more and <code>+</code> for 
+one or more make it easy to specify repeating patterns.
+</li></ol><p>It is my hope that Yapps 2 will be flexible enough to meet my needs
+for another year, yet simple enough that I do not hesitate to use it.</p>
+<!--TOC section id="sec26" Debian Extensions-->
+<h2 id="sec26" class="section">E&#XA0;&#XA0;Debian Extensions</h2><!--SEC END --><p>
+<a id="sec:debian"></a></p><p>The Debian version adds the following enhancements to the original
+Yapps code. They were written by Matthias Urlichs.</p><ol class="enumerate" type=1><li class="li-enumerate">
+Yapps can stack input sources ("include files"). A usage example
+is supplied with the calc.g sample program.
+</li><li class="li-enumerate">Yapps now understands augmented ignore-able patterns.
+This means that Yapps can parse multi-line C comments; this wasn&#X2019;t
+possible before.
+</li><li class="li-enumerate">Better error reporting.
+</li><li class="li-enumerate">Yapps now reads its input incrementally.
+</li></ol><p>The parser runtime (formerly <span style="font-family:monospace">yappsrt.py</span>) has been renamed to <span style="font-family:monospace">yapps/runtime.py</span>.
+In Debian, this file is provided by the <span style="font-family:monospace">yapps2-runtime</span> package.
+You need to depend on it if you Debianize Python programs which use
+yapps.</p>
+<!--TOC section id="sec27" Future Extensions-->
+<h2 id="sec27" class="section">F&#XA0;&#XA0;Future Extensions</h2><!--SEC END --><p>
+<a id="sec:future"></a></p><p>I am still investigating the possibility of LL(2) and higher
+lookahead. However, it looks like the resulting parsers will be
+somewhat ugly. </p><p>It would be nice to control choices with user-defined predicates.</p><p>The most likely future extension is backtracking. A grammar pattern
+like <code>(VAR ':=' expr)? {{ return Assign(VAR,expr) }} : expr {{ return expr }}</code>
+would turn into code that attempted to match <code>VAR ':=' expr</code>. If 
+it succeeded, it would run <code>{{ return ... }}</code>. If it failed, it
+would match <code>expr {{ return expr }}</code>. Backtracking may make it
+less necessary to write LL(2) grammars.</p>
+<!--TOC section id="sec28" References-->
+<h2 id="sec28" class="section">G&#XA0;&#XA0;References</h2><!--SEC END --><ol class="enumerate" type=1><li class="li-enumerate">
+The <a href="http://www.python.org/sigs/parser-sig/">Python-Parser
+SIG</a> is the first place
+to look for a list of parser systems for Python.</li><li class="li-enumerate">ANTLR/PCCTS, by Terrence Parr, is available at
+<a href="http://www.antlr.org/">The ANTLR Home Page</a>.</li><li class="li-enumerate">PyLR, by Scott Cotton, is at <a href="http://starship.skyport.net/crew/scott/PyLR.html">his Starship
+page</a>.</li><li class="li-enumerate"><a href="http://www.foretec.com/python/workshops/1998-11/proceedings/papers/aycock-little/aycock-little.html">John Aycock&#X2019;s Compiling Little Languages
+Framework</a>.</li><li class="li-enumerate">PyBison, by Scott Hassan, can be found at
+<a href="http://coho.stanford.edu/~hassan/Python/">his Python Projects
+page</a>.</li><li class="li-enumerate">mcf.pars, by Mike C. Fletcher, is available at
+<a href="http://members.rogers.com/mcfletch/programming/simpleparse/simpleparse.html">his web
+page</a>.</li><li class="li-enumerate">kwParsing, by Aaron Watters, is available at
+<a href="http://starship.skyport.net/crew/aaron_watters/kwParsing/">his Starship
+page</a>.
+</li></ol><!--BEGIN NOTES document-->
+<hr class="footnoterule"><dl class="thefootnotes"><dt class="dt-thefootnotes">
+<a id="note1" href="#text1">1</a></dt><dd class="dd-thefootnotes"><div class="footnotetext">When using a context-sensitive scanner, the parser tells the scanner what the valid token types are at each point. If you call <span style="font-family:monospace">token</span> before the parser can tell the scanner the valid token types, the scanner will attempt to match without considering the context.</div></dd></dl>
+<!--END NOTES-->
+<!--CUT END -->
+<!--HTMLFOOT-->
+<!--ENDHTML-->
+<!--FOOTER-->
+<hr style="height:2"><blockquote class="quote"><em>This document was translated from L<sup>A</sup>T<sub>E</sub>X by
+</em><a href="http://hevea.inria.fr/index.html"><em>H</em><em><span style="font-size:small"><sup>E</sup></span></em><em>V</em><em><span style="font-size:small"><sup>E</sup></span></em><em>A</em></a><em>.</em></blockquote></body>
+</html>
--- yapps2-2.1.1.orig/doc/yapps2.htoc
+++ yapps2-2.1.1/doc/yapps2.htoc
@@ -0,0 +1,36 @@
+\begin{tocenv}
+\tocitem \@locref{sec1}{\begin{@norefs}\@print{1}\quad{}Introduction{}\end{@norefs}}
+\tocitem \@locref{sec2}{\begin{@norefs}\@print{2}\quad{}Examples{}\end{@norefs}}
+\begin{tocenv}
+\tocitem \@locref{sec3}{\begin{@norefs}\@print{2.1}\quad{}Introduction to Grammars{}\end{@norefs}}
+\tocitem \@locref{sec4}{\begin{@norefs}\@print{2.2}\quad{}Lisp Expressions{}\end{@norefs}}
+\tocitem \@locref{sec7}{\begin{@norefs}\@print{2.3}\quad{}Calculator{}\end{@norefs}}
+\tocitem \@locref{sec8}{\begin{@norefs}\@print{2.4}\quad{}Calculator with Memory{}\end{@norefs}}
+\end{tocenv}
+\tocitem \@locref{sec9}{\begin{@norefs}\@print{3}\quad{}Grammars{}\end{@norefs}}
+\begin{tocenv}
+\tocitem \@locref{sec10}{\begin{@norefs}\@print{3.1}\quad{}Left Factoring{}\end{@norefs}}
+\tocitem \@locref{sec11}{\begin{@norefs}\@print{3.2}\quad{}Left Recursion{}\end{@norefs}}
+\tocitem \@locref{sec12}{\begin{@norefs}\@print{3.3}\quad{}Ambiguous Grammars{}\end{@norefs}}
+\end{tocenv}
+\tocitem \@locref{sec13}{\begin{@norefs}\@print{4}\quad{}Customization{}\end{@norefs}}
+\begin{tocenv}
+\tocitem \@locref{sec14}{\begin{@norefs}\@print{4.1}\quad{}Customizing Parsers{}\end{@norefs}}
+\tocitem \@locref{sec15}{\begin{@norefs}\@print{4.2}\quad{}Customizing Scanners{}\end{@norefs}}
+\end{tocenv}
+\tocitem \@locref{sec16}{\begin{@norefs}\@print{5}\quad{}Parser Mechanics{}\end{@norefs}}
+\begin{tocenv}
+\tocitem \@locref{sec17}{\begin{@norefs}\@print{5.1}\quad{}Parser Objects{}\end{@norefs}}
+\tocitem \@locref{sec18}{\begin{@norefs}\@print{5.2}\quad{}Context Sensitive Scanner{}\end{@norefs}}
+\tocitem \@locref{sec19}{\begin{@norefs}\@print{5.3}\quad{}Internal Variables{}\end{@norefs}}
+\tocitem \@locref{sec20}{\begin{@norefs}\@print{5.4}\quad{}Pre- and Post-Parser Code{}\end{@norefs}}
+\tocitem \@locref{sec21}{\begin{@norefs}\@print{5.5}\quad{}Representation of Grammars{}\end{@norefs}}
+\end{tocenv}
+\tocitem \@locref{sec22}{\begin{@norefs}\@print{A}\quad{}Grammar for Parsers{}\end{@norefs}}
+\tocitem \@locref{sec23}{\begin{@norefs}\@print{B}\quad{}Upgrading{}\end{@norefs}}
+\tocitem \@locref{sec24}{\begin{@norefs}\@print{C}\quad{}Troubleshooting{}\end{@norefs}}
+\tocitem \@locref{sec25}{\begin{@norefs}\@print{D}\quad{}History{}\end{@norefs}}
+\tocitem \@locref{sec26}{\begin{@norefs}\@print{E}\quad{}Debian Extensions{}\end{@norefs}}
+\tocitem \@locref{sec27}{\begin{@norefs}\@print{F}\quad{}Future Extensions{}\end{@norefs}}
+\tocitem \@locref{sec28}{\begin{@norefs}\@print{G}\quad{}References{}\end{@norefs}}
+\end{tocenv}
--- yapps2-2.1.1.orig/doc/yapps2.tex
+++ yapps2-2.1.1/doc/yapps2.tex
@@ -1177,6 +1177,27 @@
 It is my hope that Yapps 2 will be flexible enough to meet my needs
 for another year, yet simple enough that I do not hesitate to use it.
 
+\mysection{Debian Extensions}
+\label{sec:debian}
+
+The Debian version adds the following enhancements to the original
+Yapps code. They were written by Matthias Urlichs.
+
+\begin{enumerate}
+ \item Yapps can stack input sources (``include files''). A usage example
+ is supplied with the calc.g sample program.
+ \item Yapps now understands augmented ignore-able patterns.
+  This means that Yapps can parse multi-line C comments; this wasn't
+  possible before.
+ \item Better error reporting.
+ \item Yapps now reads its input incrementally.
+\end{enumerate}
+
+The runtime module (formerly \texttt{yappsrt}) has been renamed to \texttt{yapps/runtime.py}.
+In Debian, this file is provided by the \texttt{yapps2-runtime} package.
+You need to depend on it if you Debianize Python programs which use
+yapps.
+
 \mysection{Future Extensions}
 \label{sec:future}
 
--- yapps2-2.1.1.orig/examples/calc.g
+++ yapps2-2.1.1/examples/calc.g
@@ -6,9 +6,15 @@
     if not globalvars.has_key(name): print 'Undefined (defaulting to 0):', name
     return globalvars.get(name, 0)
 
+def stack_input(scanner,ign):
+    """Grab more input"""
+    scanner.stack_input(raw_input(">?> "))
+
 %%
 parser Calculator:
     ignore:    "[ \r\t\n]+"
+    ignore:    "[?]"         {{ stack_input }}
+
     token END: "$"
     token NUM: "[0-9]+"
     token VAR: "[a-zA-Z_]+"
@@ -34,7 +40,7 @@
 
     # A term is a number, variable, or an expression surrounded by parentheses
     rule term<<V>>:   
-                 NUM                      {{ return atoi(NUM) }}
+                 NUM                      {{ return int(NUM) }}
                | VAR                      {{ return lookup(V, VAR) }}
                | "\\(" expr "\\)"         {{ return expr }}
                | "let" VAR "=" expr<<V>>  {{ V = [(VAR, expr)] + V }}
@@ -51,8 +57,8 @@
     # one expression, get the result, enter another expression, etc.)
     while 1:
         try: s = raw_input('>>> ')
-	except EOFError: break
-        if not strip(s): break
+        except EOFError: break
+        if not s.strip(): break
         parse('goal', s)
     print 'Bye.'
 
--- yapps2-2.1.1.orig/examples/notes
+++ yapps2-2.1.1/examples/notes
@@ -0,0 +1,44 @@
+Hints
+#####
+
+Some additional hints for your edification.
+
+Author: Matthias Urlichs <smurf@debian.org>
+
+How to process C preprocessor codes:
+====================================
+
+I have added rudimentary include handling to the parser.
+
+However, if you want to do anything fancy, like for instance whatever
+the C preprocessor does, things get more complicated. Fortunately,
+there's already a nice tool to handle C preprocessing -- CPP itself.
+
+If you want to report errors correctly in that situation, do this:
+
+	def set_line(s,m):
+		"""Fixup the scanner's idea of the current line"""
+		s.filename = m.group(2)
+		line = int(m.group(1))
+		s.del_line = line - s.line
+
+	%%
+	parser whatever:
+		ignore:    '^#\s*(\d+)\s*"([^"\n]+)"\s*\n' {{ set_line }}
+		ignore:    '^#.*\n'
+
+	[...]
+	%%
+	if __name__=='__main__':
+		import sys,os
+		for a in sys.argv[1:]:
+			f=os.popen("cpp "+repr(a),"r")
+
+			P = whatever(whateverScanner("", filename=a, file=f))
+			try: P.goal()
+			except runtime.SyntaxError, e:
+				runtime.print_error(e, P._scanner)
+				sys.exit(1)
+
+			f.close()
+
--- yapps2-2.1.1.orig/setup.py
+++ yapps2-2.1.1/setup.py
@@ -0,0 +1,42 @@
+#!/usr/bin/env python
+
+"""Setup script for 'yapps'"""
+
+from distutils.core import setup
+
+description = "Yet Another Python Parser System"
+long_description = \
+"""
+YAPPS is an easy to use parser generator that is written in Python and
+generates Python code.  There are several parser generator systems
+already available for Python, but this parser has different goals:
+Yapps is simple, very easy to use, and produces human-readable parsers.
+
+It is not the fastest or most powerful parser.  Yapps is designed to be
+used when regular expressions are not enough and other parser systems
+are too much: situations where you might otherwise write your own
+recursive descent parser.
+
+This package contains several upward-compatible enhancements to the
+original YAPPS source:
+- Handle stacked input ("include files")
+- augmented ignore-able patterns (can parse multi-line C comments correctly)
+- better error reporting
+- read input incrementally
+"""
+
+setup (name = "python-yapps",
+       version = "2.1.1",
+       description = description,
+       long_description = long_description,
+       author = "Amit J. Patel",
+       author_email = "amitp@cs.stanford.edu",
+       maintainer = "Matthias Urlichs",
+       maintainer_email = "smurf@debian.org",
+       url = "http://theory.stanford.edu/~amitp/yapps/",
+       license = 'MIT',
+       platforms = ['POSIX'],
+       keywords = ['parsing'],
+       packages = ['yapps'],
+       #cmdclass = {'bdist_rpm': MyBDist_RPM},
+      )
--- yapps2-2.1.1.orig/yapps/__init__.py
+++ yapps2-2.1.1/yapps/__init__.py
@@ -0,0 +1 @@
+# empty
--- yapps2-2.1.1.orig/yapps/grammar.py
+++ yapps2-2.1.1/yapps/grammar.py
@@ -1,5 +1,3 @@
-#!/usr/bin/python2
-#
 # grammar.py, part of Yapps 2 - yet another python parser system
 # Copyright 1999-2003 by Amit J. Patel <amitp@cs.stanford.edu>
 #
@@ -19,7 +17,7 @@
 """
 
 import sys, re
-import parsetree
+from yapps import parsetree
 
 ######################################################################
 def cleanup_choice(rule, lst):
@@ -33,9 +31,9 @@
 
 def resolve_name(rule, tokens, id, args):
     if id in [x[0] for x in tokens]:
-        # It's a token
-        if args:
-            print 'Warning: ignoring parameters on TOKEN %s<<%s>>' % (id, args)
+	# It's a token
+	if args:
+	    print 'Warning: ignoring parameters on TOKEN %s<<%s>>' % (id, args)
         return parsetree.Terminal(rule, id)
     else:
         # It's a name, so assume it's a nonterminal
@@ -44,9 +42,9 @@
 
 # Begin -- grammar generated by Yapps
 import sys, re
-import yappsrt
+from yapps import runtime
 
-class ParserDescriptionScanner(yappsrt.Scanner):
+class ParserDescriptionScanner(runtime.Scanner):
     patterns = [
         ('"rule"', re.compile('rule')),
         ('"ignore"', re.compile('ignore')),
@@ -71,163 +69,142 @@
         ('QUEST', re.compile('[?]')),
         ('COLON', re.compile(':')),
     ]
-    def __init__(self, str):
-        yappsrt.Scanner.__init__(self,None,['[ \t\r\n]+', '#.*?\r?\n'],str)
-
-class ParserDescription(yappsrt.Parser):
-    Context = yappsrt.Context
-    def LINENO(self, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'LINENO', [])
-        return 1 + self._scanner.get_input_scanned().count('\n')
+    def __init__(self, str,*args,**kw):
+        runtime.Scanner.__init__(self,None,{'[ \t\r\n]+':None,'#.*?\r?\n':None,},str,*args,**kw)
 
+class ParserDescription(runtime.Parser):
+    Context = runtime.Context
     def Parser(self, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'Parser', [])
-        self._scan('"parser"')
-        ID = self._scan('ID')
-        self._scan('":"')
+        _context = self.Context(_parent, self._scanner, 'Parser', [])
+        self._scan('"parser"', context=_context)
+        ID = self._scan('ID', context=_context)
+        self._scan('":"', context=_context)
         Options = self.Options(_context)
         Tokens = self.Tokens(_context)
         Rules = self.Rules(Tokens, _context)
-        EOF = self._scan('EOF')
+        EOF = self._scan('EOF', context=_context)
         return parsetree.Generator(ID,Options,Tokens,Rules)
 
     def Options(self, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'Options', [])
+        _context = self.Context(_parent, self._scanner, 'Options', [])
         opt = {}
-        while self._peek() == '"option"':
-            self._scan('"option"')
-            self._scan('":"')
+        while self._peek('"option"', '"token"', '"ignore"', 'EOF', '"rule"', context=_context) == '"option"':
+            self._scan('"option"', context=_context)
+            self._scan('":"', context=_context)
             Str = self.Str(_context)
             opt[Str] = 1
-        if self._peek() not in ['"option"', '"token"', '"ignore"', 'EOF', '"rule"']:
-            raise yappsrt.SyntaxError(charpos=self._scanner.get_prev_char_pos(), context=_context, msg='Need one of ' + ', '.join(['"option"', '"token"', '"ignore"', 'EOF', '"rule"']))
         return opt
 
     def Tokens(self, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'Tokens', [])
+        _context = self.Context(_parent, self._scanner, 'Tokens', [])
         tok = []
-        while self._peek() in ['"token"', '"ignore"']:
-            _token = self._peek()
+        while self._peek('"token"', '"ignore"', 'EOF', '"rule"', context=_context) in ['"token"', '"ignore"']:
+            _token = self._peek('"token"', '"ignore"', context=_context)
             if _token == '"token"':
-                self._scan('"token"')
-                ID = self._scan('ID')
-                self._scan('":"')
+                self._scan('"token"', context=_context)
+                ID = self._scan('ID', context=_context)
+                self._scan('":"', context=_context)
                 Str = self.Str(_context)
                 tok.append( (ID,Str) )
-            elif _token == '"ignore"':
-                self._scan('"ignore"')
-                self._scan('":"')
+            else: # == '"ignore"'
+                self._scan('"ignore"', context=_context)
+                self._scan('":"', context=_context)
                 Str = self.Str(_context)
-                tok.append( ('#ignore',Str) )
-            else:
-                raise yappsrt.SyntaxError(_token[0], 'Could not match Tokens')
-        if self._peek() not in ['"token"', '"ignore"', 'EOF', '"rule"']:
-            raise yappsrt.SyntaxError(charpos=self._scanner.get_prev_char_pos(), context=_context, msg='Need one of ' + ', '.join(['"token"', '"ignore"', 'EOF', '"rule"']))
+                ign = ('#ignore',Str)
+                if self._peek('STMT', '"token"', '"ignore"', 'EOF', '"rule"', context=_context) == 'STMT':
+                    STMT = self._scan('STMT', context=_context)
+                    ign = ign + (STMT[2:-2],)
+                tok.append( ign )
         return tok
 
     def Rules(self, tokens, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'Rules', [tokens])
+        _context = self.Context(_parent, self._scanner, 'Rules', [tokens])
         rul = []
-        while self._peek() == '"rule"':
-            LINENO = self.LINENO(_context)
-            self._scan('"rule"')
-            ID = self._scan('ID')
+        while self._peek('"rule"', 'EOF', context=_context) == '"rule"':
+            self._scan('"rule"', context=_context)
+            ID = self._scan('ID', context=_context)
             OptParam = self.OptParam(_context)
-            self._scan('":"')
+            self._scan('":"', context=_context)
             ClauseA = self.ClauseA(ID, tokens, _context)
             rul.append( (ID, OptParam, ClauseA) )
-        if self._peek() not in ['"rule"', 'EOF']:
-            raise yappsrt.SyntaxError(charpos=self._scanner.get_prev_char_pos(), context=_context, msg='Need one of ' + ', '.join(['"rule"', 'EOF']))
         return rul
 
     def ClauseA(self, rule, tokens, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'ClauseA', [rule, tokens])
-        ClauseB = self.ClauseB(rule, tokens, _context)
+        _context = self.Context(_parent, self._scanner, 'ClauseA', [rule, tokens])
+        ClauseB = self.ClauseB(rule,tokens, _context)
         v = [ClauseB]
-        while self._peek() == 'OR':
-            OR = self._scan('OR')
-            ClauseB = self.ClauseB(rule, tokens, _context)
+        while self._peek('OR', 'RP', 'RB', '"rule"', 'EOF', context=_context) == 'OR':
+            OR = self._scan('OR', context=_context)
+            ClauseB = self.ClauseB(rule,tokens, _context)
             v.append(ClauseB)
-        if self._peek() not in ['OR', 'RP', 'RB', '"rule"', 'EOF']:
-            raise yappsrt.SyntaxError(charpos=self._scanner.get_prev_char_pos(), context=_context, msg='Need one of ' + ', '.join(['OR', 'RP', 'RB', '"rule"', 'EOF']))
-        return cleanup_choice(rule, v)
+        return cleanup_choice(rule,v)
 
-    def ClauseB(self, rule, tokens, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'ClauseB', [rule, tokens])
+    def ClauseB(self, rule,tokens, _parent=None):
+        _context = self.Context(_parent, self._scanner, 'ClauseB', [rule,tokens])
         v = []
-        while self._peek() in ['STR', 'ID', 'LP', 'LB', 'STMT']:
-            ClauseC = self.ClauseC(rule, tokens, _context)
+        while self._peek('STR', 'ID', 'LP', 'LB', 'STMT', 'OR', 'RP', 'RB', '"rule"', 'EOF', context=_context) in ['STR', 'ID', 'LP', 'LB', 'STMT']:
+            ClauseC = self.ClauseC(rule,tokens, _context)
             v.append(ClauseC)
-        if self._peek() not in ['STR', 'ID', 'LP', 'LB', 'STMT', 'OR', 'RP', 'RB', '"rule"', 'EOF']:
-            raise yappsrt.SyntaxError(charpos=self._scanner.get_prev_char_pos(), context=_context, msg='Need one of ' + ', '.join(['STR', 'ID', 'LP', 'LB', 'STMT', 'OR', 'RP', 'RB', '"rule"', 'EOF']))
         return cleanup_sequence(rule, v)
 
-    def ClauseC(self, rule, tokens, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'ClauseC', [rule, tokens])
-        ClauseD = self.ClauseD(rule, tokens, _context)
-        _token = self._peek()
+    def ClauseC(self, rule,tokens, _parent=None):
+        _context = self.Context(_parent, self._scanner, 'ClauseC', [rule,tokens])
+        ClauseD = self.ClauseD(rule,tokens, _context)
+        _token = self._peek('PLUS', 'STAR', 'QUEST', 'STR', 'ID', 'LP', 'LB', 'STMT', 'OR', 'RP', 'RB', '"rule"', 'EOF', context=_context)
         if _token == 'PLUS':
-            PLUS = self._scan('PLUS')
+            PLUS = self._scan('PLUS', context=_context)
             return parsetree.Plus(rule, ClauseD)
         elif _token == 'STAR':
-            STAR = self._scan('STAR')
+            STAR = self._scan('STAR', context=_context)
             return parsetree.Star(rule, ClauseD)
         elif _token == 'QUEST':
-            QUEST = self._scan('QUEST')
+            QUEST = self._scan('QUEST', context=_context)
             return parsetree.Option(rule, ClauseD)
-        elif _token not in ['"ignore"', '"token"', '"option"', '":"', '"parser"', 'ATTR', 'COLON']:
-            return ClauseD
         else:
-            raise yappsrt.SyntaxError(_token[0], 'Could not match ClauseC')
+            return ClauseD
 
-    def ClauseD(self, rule, tokens, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'ClauseD', [rule, tokens])
-        _token = self._peek()
+    def ClauseD(self, rule,tokens, _parent=None):
+        _context = self.Context(_parent, self._scanner, 'ClauseD', [rule,tokens])
+        _token = self._peek('STR', 'ID', 'LP', 'LB', 'STMT', context=_context)
         if _token == 'STR':
-            STR = self._scan('STR')
+            STR = self._scan('STR', context=_context)
             t = (STR, eval(STR,{},{}))
             if t not in tokens: tokens.insert( 0, t )
             return parsetree.Terminal(rule, STR)
         elif _token == 'ID':
-            ID = self._scan('ID')
+            ID = self._scan('ID', context=_context)
             OptParam = self.OptParam(_context)
-            return resolve_name(rule, tokens, ID, OptParam)
+            return resolve_name(rule,tokens, ID, OptParam)
         elif _token == 'LP':
-            LP = self._scan('LP')
-            ClauseA = self.ClauseA(rule, tokens, _context)
-            RP = self._scan('RP')
+            LP = self._scan('LP', context=_context)
+            ClauseA = self.ClauseA(rule,tokens, _context)
+            RP = self._scan('RP', context=_context)
             return ClauseA
         elif _token == 'LB':
-            LB = self._scan('LB')
-            ClauseA = self.ClauseA(rule, tokens, _context)
-            RB = self._scan('RB')
+            LB = self._scan('LB', context=_context)
+            ClauseA = self.ClauseA(rule,tokens, _context)
+            RB = self._scan('RB', context=_context)
             return parsetree.Option(rule, ClauseA)
-        elif _token == 'STMT':
-            STMT = self._scan('STMT')
+        else: # == 'STMT'
+            STMT = self._scan('STMT', context=_context)
             return parsetree.Eval(rule, STMT[2:-2])
-        else:
-            raise yappsrt.SyntaxError(_token[0], 'Could not match ClauseD')
 
     def OptParam(self, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'OptParam', [])
-        _token = self._peek()
-        if _token == 'ATTR':
-            ATTR = self._scan('ATTR')
+        _context = self.Context(_parent, self._scanner, 'OptParam', [])
+        if self._peek('ATTR', '":"', 'PLUS', 'STAR', 'QUEST', 'STR', 'ID', 'LP', 'LB', 'STMT', 'OR', 'RP', 'RB', '"rule"', 'EOF', context=_context) == 'ATTR':
+            ATTR = self._scan('ATTR', context=_context)
             return ATTR[2:-2]
-        elif _token not in ['"ignore"', '"token"', '"option"', '"parser"', 'COLON']:
-            return ''
-        else:
-            raise yappsrt.SyntaxError(_token[0], 'Could not match OptParam')
+        return ''
 
     def Str(self, _parent=None):
-        _context = self.Context(_parent, self._scanner, self._pos, 'Str', [])
-        STR = self._scan('STR')
+        _context = self.Context(_parent, self._scanner, 'Str', [])
+        STR = self._scan('STR', context=_context)
         return eval(STR,{},{})
 
 
 def parse(rule, text):
     P = ParserDescription(ParserDescriptionScanner(text))
-    return yappsrt.wrap_error_reporter(P, rule)
+    return runtime.wrap_error_reporter(P, rule)
 
 # End -- grammar generated by Yapps
 
--- yapps2-2.1.1.orig/yapps/parsetree.py
+++ yapps2-2.1.1/yapps/parsetree.py
@@ -1,5 +1,3 @@
-#!/usr/bin/python2
-#
 # parsetree.py, part of Yapps 2 - yet another python parser system
 # Copyright 1999-2003 by Amit J. Patel <amitp@cs.stanford.edu>
 #
@@ -35,12 +33,18 @@
         self.postparser = None
         
         self.tokens = {} # Map from tokens to regexps
-        self.ignore = [] # List of token names to ignore in parsing
+        self.ignore = {} # List of token names to ignore in parsing, map to statements
         self.terminals = [] # List of token names (to maintain ordering)
-        for n, t in tokens:
+        for t in tokens:
+            if len(t) == 3:
+                n,t,s = t
+            else:
+                n,t = t
+                s = None
+
             if n == '#ignore':
                 n = t
-                self.ignore.append(n)
+                self.ignore[n] = s
             if n in self.tokens.keys() and self.tokens[n] != t:
                 print >>sys.stderr, 'Warning: token %s defined more than once.' % n
             self.tokens[n] = t
@@ -199,7 +203,9 @@
         a_set = (repr(a)[1:-1])
         if self.equal_set(a, self.non_ignored_tokens()): a_set = ''
         if self.has_option('context-insensitive-scanner'): a_set = ''
-        return 'self._peek(%s)' % a_set
+        if a_set: a_set += ","
+        
+        return 'self._peek(%s context=_context)' % a_set
     
     def peek_test(self, a, b):
         """Generate a call to test whether the next token (which could be any of
@@ -252,31 +258,39 @@
                 print '    FOLLOW:', ', '.join(top.follow)
                 for x in top.get_children(): queue.append(x)
                 
+    def repr_ignore(self):
+        out="{"
+        for t,s in self.ignore.iteritems():
+            if s is None: s=repr(s)
+            out += "%s:%s," % (repr(t),s)
+        out += "}"
+        return out
+        
     def generate_output(self):
         self.calculate()
         self.write(self.preparser)
         self.write("# Begin -- grammar generated by Yapps\n")
         self.write("import sys, re\n")
-        self.write("import yappsrt\n")
+        self.write("from yapps import runtime\n")
         self.write("\n")
-        self.write("class ", self.name, "Scanner(yappsrt.Scanner):\n")
+        self.write("class ", self.name, "Scanner(runtime.Scanner):\n")
         self.write("    patterns = [\n")
         for p in self.terminals:
             self.write("        (%s, re.compile(%s)),\n" % (
                 repr(p), repr(self.tokens[p])))
         self.write("    ]\n")
-        self.write("    def __init__(self, str):\n")
-        self.write("        yappsrt.Scanner.__init__(self,None,%s,str)\n" %
-                   repr(self.ignore))
+        self.write("    def __init__(self, str,*args,**kw):\n")
+        self.write("        runtime.Scanner.__init__(self,None,%s,str,*args,**kw)\n" %
+                   self.repr_ignore())
         self.write("\n")
         
-        self.write("class ", self.name, "(yappsrt.Parser):\n")
-        self.write(INDENT, "Context = yappsrt.Context\n")
+        self.write("class ", self.name, "(runtime.Parser):\n")
+        self.write(INDENT, "Context = runtime.Context\n")
         for r in self.goals:
             self.write(INDENT, "def ", r, "(self")
             if self.params[r]: self.write(", ", self.params[r])
             self.write(", _parent=None):\n")
-            self.write(INDENT+INDENT, "_context = self.Context(_parent, self._scanner, self._pos, %s, [%s])\n" %
+            self.write(INDENT+INDENT, "_context = self.Context(_parent, self._scanner, %s, [%s])\n" %
                        (repr(r), self.params.get(r, '')))
             self.rules[r].output(self, INDENT+INDENT)
             self.write("\n")
@@ -284,7 +298,7 @@
         self.write("\n")
         self.write("def parse(rule, text):\n")
         self.write("    P = ", self.name, "(", self.name, "Scanner(text))\n")
-        self.write("    return yappsrt.wrap_error_reporter(P, rule)\n")
+        self.write("    return runtime.wrap_error_reporter(P, rule)\n")
         self.write("\n")
         if self.postparser is not None:
             self.write("# End -- grammar generated by Yapps\n")
@@ -355,7 +369,7 @@
         gen.write(indent)
         if re.match('[a-zA-Z_][a-zA-Z_0-9]*$', self.token):
             gen.write(self.token, " = ")
-        gen.write("self._scan(%s)\n" % repr(self.token))
+        gen.write("self._scan(%s, context=_context)\n" % repr(self.token))
         
 class Eval(Node):
     """This class stores evaluation nodes, from {{ ... }} clauses."""
@@ -547,7 +561,7 @@
 
         if tokens_unseen:
             gen.write(indent, "else:\n")
-            gen.write(indent, INDENT, "raise yappsrt.SyntaxError(_token[0], ")
+            gen.write(indent, INDENT, "raise runtime.SyntaxError(_token[0], ")
             gen.write("'Could not match ", self.rule, "')\n")
         
 class Wrapper(Node):
@@ -586,6 +600,13 @@
         gen.write(indent, "if %s:\n" %
                   gen.peek_test(self.first, self.child.first))
         self.child.output(gen, indent+INDENT)
+
+        if gen.has_option('context-insensitive-scanner'):
+            gen.write(indent, "if %s:\n" %
+                    gen.not_peek_test(gen.non_ignored_tokens(), self.follow))
+            gen.write(indent+INDENT, "raise runtime.SyntaxError(pos=self._scanner.get_pos(), context=_context, msg='Need one of ' + ', '.join(%s))\n" %
+                    repr(self.first))
+
         
 class Plus(Wrapper):
     """This class represents a 1-or-more repetition clause of the form A+"""
@@ -613,6 +634,13 @@
         gen.write(indent+INDENT, "if %s: break\n" %
                   gen.not_peek_test(union, self.child.first))
 
+        if gen.has_option('context-insensitive-scanner'):
+            gen.write(indent, "if %s:\n" %
+                    gen.not_peek_test(gen.non_ignored_tokens(), self.follow))
+            gen.write(indent+INDENT, "raise runtime.SyntaxError(pos=self._scanner.get_pos(), context=_context, msg='Need one of ' + ', '.join(%s))\n" %
+                    repr(self.first))
+
+
 class Star(Wrapper):
     """This class represents a 0-or-more repetition clause of the form A*"""
     def setup(self, gen):
@@ -637,9 +665,9 @@
         self.child.output(gen, indent+INDENT)
 
         # TODO: need to generate tests like this in lots of rules
-        # TODO: do we need to do this only when it's a context-insensitive scanner?
-        gen.write(indent, "if %s:\n" %
-                  gen.not_peek_test(gen.non_ignored_tokens(), self.follow))
-        gen.write(indent+INDENT, "raise yappsrt.SyntaxError(charpos=self._scanner.get_prev_char_pos(), context=_context, msg='Need one of ' + ', '.join(%s))\n" %
-                  repr(self.first))
+        if gen.has_option('context-insensitive-scanner'):
+            gen.write(indent, "if %s:\n" %
+                    gen.not_peek_test(gen.non_ignored_tokens(), self.follow))
+            gen.write(indent+INDENT, "raise runtime.SyntaxError(pos=self._scanner.get_pos(), context=_context, msg='Need one of ' + ', '.join(%s))\n" %
+                    repr(self.first))
 
--- yapps2-2.1.1.orig/yapps/runtime.py
+++ yapps2-2.1.1/yapps/runtime.py
@@ -1,6 +1,6 @@
-#
 # Yapps 2 Runtime, part of Yapps 2 - yet another python parser system
 # Copyright 1999-2003 by Amit J. Patel <amitp@cs.stanford.edu>
+# Enhancements copyright 2003-2004 by Matthias Urlichs <smurf@debian.org>
 #
 # This version of the Yapps 2 Runtime can be distributed under the
 # terms of the MIT open source license, either found in the LICENSE file
@@ -19,278 +19,424 @@
 
 import sys, re
 
+MIN_WINDOW=4096
+# File lookup window
+
 class SyntaxError(Exception):
-    """When we run into an unexpected token, this is the exception to use"""
-    def __init__(self, charpos=-1, msg="Bad Token", context=None):
-        Exception.__init__(self)
-        self.charpos = charpos
-        self.msg = msg
-        self.context = context
-        
-    def __str__(self):
-        if self.charpos < 0: return 'SyntaxError'
-        else: return 'SyntaxError@char%s(%s)' % (repr(self.charpos), self.msg)
+	"""When we run into an unexpected token, this is the exception to use"""
+	def __init__(self, pos=None, msg="Bad Token", context=None):
+		Exception.__init__(self)
+		self.pos = pos
+		self.msg = msg
+		self.context = context
+		
+	def __str__(self):
+		if not self.pos: return 'SyntaxError'
+		else: return 'SyntaxError@%s(%s)' % (repr(self.pos), self.msg)
 
 class NoMoreTokens(Exception):
-    """Another exception object, for when we run out of tokens"""
-    pass
+	"""Another exception object, for when we run out of tokens"""
+	pass
+
+class Token(object):
+	"""Yapps token.
 
-class Scanner:
-    """Yapps scanner.
+	This is a container for a scanned token.
+	"""
 
-    The Yapps scanner can work in context sensitive or context
-    insensitive modes.  The token(i) method is used to retrieve the
-    i-th token.  It takes a restrict set that limits the set of tokens
-    it is allowed to return.  In context sensitive mode, this restrict
-    set guides the scanner.  In context insensitive mode, there is no
-    restriction (the set is always the full set of tokens).
-    
-    """
-    
-    def __init__(self, patterns, ignore, input):
-        """Initialize the scanner.
-
-        Parameters:
-          patterns : [(terminal, uncompiled regex), ...] or None
-          ignore : [terminal,...]
-          input : string
-
-        If patterns is None, we assume that the subclass has
-        defined self.patterns : [(terminal, compiled regex), ...].
-        Note that the patterns parameter expects uncompiled regexes,
-        whereas the self.patterns field expects compiled regexes.
-        """
-        self.tokens = [] # [(begin char pos, end char pos, token name, matched text), ...]
-        self.restrictions = []
-        self.input = input
-        self.pos = 0
-        self.ignore = ignore
-        self.first_line_number = 1
-        
-        if patterns is not None:
-            # Compile the regex strings into regex objects
-            self.patterns = []
-            for terminal, regex in patterns:
-                self.patterns.append( (terminal, re.compile(regex)) )
-
-    def get_token_pos(self):
-        """Get the current token position in the input text."""
-        return len(self.tokens)
-
-    def get_char_pos(self):
-        """Get the current char position in the input text."""
-        return self.pos
-    
-    def get_prev_char_pos(self, i=None):
-        """Get the previous position (one token back) in the input text."""
-        if self.pos == 0: return 0
-        if i is None: i = -1
-        return self.tokens[i][0]
-    
-    def get_line_number(self):
-        """Get the line number of the current position in the input text."""
-        # TODO: make this work at any token/char position
-        return self.first_line_number + self.get_input_scanned().count('\n')
-
-    def get_column_number(self):
-        """Get the column number of the current position in the input text."""
-        s = self.get_input_scanned()
-        i = s.rfind('\n') # may be -1, but that's okay in this case
-        return len(s) - (i+1)
-    
-    def get_input_scanned(self):
-        """Get the portion of the input that has been tokenized."""
-        return self.input[:self.pos]
-
-    def get_input_unscanned(self):
-        """Get the portion of the input that has not yet been tokenized."""
-        return self.input[self.pos:]
-
-    def token(self, i, restrict=None):
-        """Get the i'th token in the input.
-
-        If i is one past the end, then scan for another token.
-        
-        Args:
-
-        restrict : [token, ...] or None; if restrict is None, then any
-        token is allowed.  You may call token(i) more than once.
-        However, the restrict set may never be larger than what was
-        passed in on the first call to token(i).
-        
-        """
-        if i == len(self.tokens):
-            self.scan(restrict)
-        if i < len(self.tokens):
-            # Make sure the restriction is more restricted.  This
-            # invariant is needed to avoid ruining tokenization at
-            # position i+1 and higher.
-            if restrict and self.restrictions[i]:
-                for r in restrict:
-                    if r not in self.restrictions[i]:
-                        raise NotImplementedError("Unimplemented: restriction set changed")
-            return self.tokens[i]
-        raise NoMoreTokens()
-    
-    def __repr__(self):
-        """Print the last 10 tokens that have been scanned in"""
-        output = ''
-        for t in self.tokens[-10:]:
-            output = '%s\n  (@%s)  %s  =  %s' % (output,t[0],t[2],repr(t[3]))
-        return output
-    
-    def scan(self, restrict):
-        """Should scan another token and add it to the list, self.tokens,
-        and add the restriction to self.restrictions"""
-        # Keep looking for a token, ignoring any in self.ignore
-        while 1:
-            # Search the patterns for the longest match, with earlier
-            # tokens in the list having preference
-            best_match = -1
-            best_pat = '(error)'
-            for p, regexp in self.patterns:
-                # First check to see if we're ignoring this token
-                if restrict and p not in restrict and p not in self.ignore:
-                    continue
-                m = regexp.match(self.input, self.pos)
-                if m and len(m.group(0)) > best_match:
-                    # We got a match that's better than the previous one
-                    best_pat = p
-                    best_match = len(m.group(0))
-                    
-            # If we didn't find anything, raise an error
-            if best_pat == '(error)' and best_match < 0:
-                msg = 'Bad Token'
-                if restrict:
-                    msg = 'Trying to find one of '+', '.join(restrict)
-                raise SyntaxError(self.pos, msg)
-
-            # If we found something that isn't to be ignored, return it
-            if best_pat not in self.ignore:
-                # Create a token with this data
-                token = (self.pos, self.pos+best_match, best_pat,
-                         self.input[self.pos:self.pos+best_match])
-                self.pos = self.pos + best_match
-                # Only add this token if it's not in the list
-                # (to prevent looping)
-                if not self.tokens or token != self.tokens[-1]:
-                    self.tokens.append(token)
-                    self.restrictions.append(restrict)
-                return
-            else:
-                # This token should be ignored ..
-                self.pos = self.pos + best_match
-
-class Parser:
-    """Base class for Yapps-generated parsers.
-
-    """
-    
-    def __init__(self, scanner):
-        self._scanner = scanner
-        self._pos = 0
-        
-    def _peek(self, *types):
-        """Returns the token type for lookahead; if there are any args
-        then the list of args is the set of token types to allow"""
-        tok = self._scanner.token(self._pos, types)
-        return tok[2]
-        
-    def _scan(self, type):
-        """Returns the matched text, and moves to the next token"""
-        tok = self._scanner.token(self._pos, [type])
-        if tok[2] != type:
-            raise SyntaxError(tok[0], 'Trying to find '+type+' :'+ ' ,'.join(self._scanner.restrictions[self._pos]))
-        self._pos = 1 + self._pos
-        return tok[3]
-
-class Context:
-    """Class to represent the parser's call stack.
-
-    Every rule creates a Context that links to its parent rule.  The
-    contexts can be used for debugging.
-
-    """
-    
-    def __init__(self, parent, scanner, tokenpos, rule, args=()):
-        """Create a new context.
-
-        Args:
-        parent: Context object or None
-        scanner: Scanner object
-        pos: integer (scanner token position)
-        rule: string (name of the rule)
-        args: tuple listing parameters to the rule
-
-        """
-        self.parent = parent
-        self.scanner = scanner
-        self.tokenpos = tokenpos
-        self.rule = rule
-        self.args = args
-
-    def __str__(self):
-        output = ''
-        if self.parent: output = str(self.parent) + ' > '
-        output += self.rule
-        return output
-    
-def print_line_with_pointer(text, p):
-    """Print the line of 'text' that includes position 'p',
-    along with a second line with a single caret (^) at position p"""
-    # Now try printing part of the line
-    text = text[max(p-80, 0):p+80]
-    p = p - max(p-80, 0)
-
-    # Strip to the left
-    i = text[:p].rfind('\n')
-    j = text[:p].rfind('\r')
-    if i < 0 or (0 <= j < i): i = j
-    if 0 <= i < p:
-        p = p - i - 1
-        text = text[i+1:]
-
-    # Strip to the right
-    i = text.find('\n', p)
-    j = text.find('\r', p)
-    if i < 0 or (0 <= j < i): i = j
-    if i >= 0:
-        text = text[:i]
-
-    # Now shorten the text
-    while len(text) > 70 and p > 60:
-        # Cut off 10 chars
-        text = "..." + text[10:]
-        p = p - 7
-
-    # Now print the string, along with an indicator
-    print >>sys.stderr, '> ',text
-    print >>sys.stderr, '> ',' '*p + '^'
-    
-def print_error(input, err, scanner):
-    """Print error messages, the parser stack, and the input text -- for human-readable error messages."""
-    # NOTE: this function assumes 80 columns :-(
-    # Figure out the line number
-    line_number = scanner.get_line_number()
-    column_number = scanner.get_column_number()
-    print >>sys.stderr, '%d:%d: %s' % (line_number, column_number, err.msg)
-
-    context = err.context
-    if not context:
-        print_line_with_pointer(input, err.charpos)
-        
-    while context:
-        # TODO: add line number
-        print >>sys.stderr, 'while parsing %s%s:' % (context.rule, tuple(context.args))
-        print_line_with_pointer(input, context.scanner.get_prev_char_pos(context.tokenpos))
-        context = context.parent
-
-def wrap_error_reporter(parser, rule):
-    try:
-        return getattr(parser, rule)()
-    except SyntaxError, e:
-        input = parser._scanner.input
-        print_error(input, e, parser._scanner)
-    except NoMoreTokens:
-        print >>sys.stderr, 'Could not complete parsing; stopped around here:'
-        print >>sys.stderr, parser._scanner
+	def __init__(self, type,value, pos=None):
+		"""Initialize a token."""
+		self.type = type
+		self.value = value
+		self.pos = pos
+
+	def __repr__(self):
+		output = '<%s: %s' % (self.type, repr(self.value))
+		if self.pos:
+			output += " @ "
+			if self.pos[0]:
+				output += "%s:" % self.pos[0]
+			if self.pos[1]:
+				output += "%d" % self.pos[1]
+			if self.pos[2] is not None:
+				output += ".%d" % self.pos[2]
+		output += ">"
+		return output
+
+in_name=0
+class Scanner(object):
+	"""Yapps scanner.
+
+	The Yapps scanner can work in context sensitive or context
+	insensitive modes.  The token(i) method is used to retrieve the
+	i-th token.  It takes a restrict set that limits the set of tokens
+	it is allowed to return.  In context sensitive mode, this restrict
+	set guides the scanner.  In context insensitive mode, there is no
+	restriction (the set is always the full set of tokens).
+	
+	"""
+	
+	def __init__(self, patterns, ignore, input="",
+			file=None,filename=None,stacked=False):
+		"""Initialize the scanner.
+
+		Parameters:
+		  patterns : [(terminal, uncompiled regex), ...] or None
+		  ignore : {terminal:None, ...}
+		  input : string
+
+		If patterns is None, we assume that the subclass has
+		defined self.patterns : [(terminal, compiled regex), ...].
+		Note that the patterns parameter expects uncompiled regexes,
+		whereas the self.patterns field expects compiled regexes.
+
+		The 'ignore' value is either None or a callable, which is called
+		with the scanner and the to-be-ignored match object; this can
+		be used for include file or comment handling.
+		"""
+
+		if not filename:
+			global in_name
+			filename="<f.%d>" % in_name
+			in_name += 1
+
+		self.input = input
+		self.ignore = ignore
+		self.file = file
+		self.filename = filename
+		self.pos = 0
+		self.del_pos = 0 # skipped
+		self.line = 1
+		self.del_line = 0 # skipped
+		self.col = 0
+		self.tokens = []
+		self.stack = None
+		self.stacked = stacked
+		
+		self.last_read_token = None
+		self.last_token = None
+		self.last_types = None
+
+		if patterns is not None:
+			# Compile the regex strings into regex objects
+			self.patterns = []
+			for terminal, regex in patterns:
+				self.patterns.append( (terminal, re.compile(regex)) )
+
+	def stack_input(self, input="", file=None, filename=None):
+		"""Temporarily parse from a second file."""
+
+		# Already reading from somewhere else: Go on top of that, please.
+		if self.stack:
+			# autogenerate a recursion-level-identifying filename
+			if not filename:
+				filename = 1
+			else:
+				try:
+					filename += 1
+				except TypeError:
+					pass
+				# now pass off to the include file
+			self.stack.stack_input(input,file,filename)
+		else:
+
+			try:
+				filename += 0
+			except TypeError:
+				pass
+			else:
+				filename = "<str_%d>" % filename
+
+#			self.stack = object.__new__(self.__class__)
+#			Scanner.__init__(self.stack,self.patterns,self.ignore,input,file,filename, stacked=True)
+
+			# Note that the pattern+ignore are added by the generated
+			# scanner code
+			self.stack = self.__class__(input,file,filename, stacked=True)
+
+	def get_pos(self):
+		"""Return a file/line/char tuple."""
+		if self.stack: return self.stack.get_pos()
+
+		return (self.filename, self.line+self.del_line, self.col)
+
+#	def __repr__(self):
+#		"""Print the last few tokens that have been scanned in"""
+#		output = ''
+#		for t in self.tokens:
+#			output += '%s\n' % (repr(t),)
+#		return output
+	
+	def print_line_with_pointer(self, pos, length=0, out=sys.stderr):
+		"""Print the line of 'text' that includes position 'p',
+		along with a second line with a single caret (^) at position p"""
+
+		file,line,p = pos
+		if file != self.filename:
+			if self.stack: return self.stack.print_line_with_pointer(pos,length=length,out=out)
+			print >>out, "(%s: not in input buffer)" % file
+			return
+
+		text = self.input
+		p += length-1 # starts at pos 1
+
+		origline=line
+		line -= self.del_line
+		spos=0
+		if line > 0:
+			while 1:
+				line = line - 1
+				try:
+					cr = text.index("\n",spos)
+				except ValueError:
+					if line:
+						text = ""
+					break
+				if line == 0:
+					text = text[spos:cr]
+					break
+				spos = cr+1
+		else:
+			print >>out, "(%s:%d not in input buffer)" % (file,origline)
+			return
+
+		# Now try printing part of the line
+		text = text[max(p-80, 0):p+80]
+		p = p - max(p-80, 0)
+
+		# Strip to the left
+		i = text[:p].rfind('\n')
+		j = text[:p].rfind('\r')
+		if i < 0 or (0 <= j < i): i = j
+		if 0 <= i < p:
+			p = p - i - 1
+			text = text[i+1:]
+
+		# Strip to the right
+		i = text.find('\n', p)
+		j = text.find('\r', p)
+		if i < 0 or (0 <= j < i): i = j
+		if i >= 0:
+			text = text[:i]
+
+		# Now shorten the text
+		while len(text) > 70 and p > 60:
+			# Cut off 10 chars
+			text = "..." + text[10:]
+			p = p - 7
+
+		# Now print the string, along with an indicator
+		print >>out, '> ',text
+		print >>out, '> ',' '*p + '^'
+	
+	def grab_input(self):
+		"""Top up self.input from self.file when fewer than MIN_WINDOW unread characters remain."""
+		if not self.file: return
+		if len(self.input) - self.pos >= MIN_WINDOW: return
+
+		# read() may yield None or "" (both mean: stop reading); use "" so the appends below cannot fail.
+		data = self.file.read(MIN_WINDOW) or ""
+		if not data:
+			self.file = None
+		# Drop bytes from the start, if necessary.
+		if self.pos > 2*MIN_WINDOW:
+			self.del_pos += MIN_WINDOW
+			self.del_line += self.input[:MIN_WINDOW].count("\n")
+			self.pos -= MIN_WINDOW
+			self.input = self.input[MIN_WINDOW:] + data
+		else:
+			self.input = self.input + data
+
+	def getchar(self):
+		"""Return the next character."""
+		self.grab_input()
+
+		c = self.input[self.pos]
+		self.pos += 1
+		return c
+
+	def token(self, restrict, context=None):
+		"""Scan for another token."""
+
+		while 1:
+			if self.stack:
+				try:
+					return self.stack.token(restrict, context)
+				except StopIteration:
+					self.stack = None
+
+		# Keep looking for a token, ignoring any in self.ignore
+			self.grab_input()
+
+			# special handling for end-of-file
+			if self.stacked and self.pos==len(self.input):
+				raise StopIteration
+
+			# Search the patterns for the longest match, with earlier
+			# tokens in the list having preference
+			best_match = -1
+			best_pat = '(error)'
+			best_m = None
+			for p, regexp in self.patterns:
+				# First check to see if we're ignoring this token
+				if restrict and p not in restrict and p not in self.ignore:
+					continue
+				m = regexp.match(self.input, self.pos)
+				if m and m.end()-m.start() > best_match:
+					# We got a match that's better than the previous one
+					best_pat = p
+					best_match = m.end()-m.start()
+					best_m = m
+					
+			# If we didn't find anything, raise an error
+			if best_pat == '(error)' and best_match < 0:
+				msg = 'Bad Token'
+				if restrict:
+					msg = 'Trying to find one of '+', '.join(restrict)
+				raise SyntaxError(self.get_pos(), msg, context=context)
+
+			ignore = best_pat in self.ignore
+			value = self.input[self.pos:self.pos+best_match]
+			if not ignore:
+				tok=Token(type=best_pat, value=value, pos=self.get_pos())
+
+			self.pos += best_match
+
+			npos = value.rfind("\n")
+			if npos > -1:
+				self.col = best_match-npos
+				self.line += value.count("\n")
+			else:
+				self.col += best_match
+
+			# If we found something that isn't to be ignored, return it
+			if not ignore:
+				if len(self.tokens) >= 10:
+					del self.tokens[0]
+				self.tokens.append(tok)
+				self.last_read_token = tok
+				# print repr(tok)
+				return tok
+			else:
+				ignore = self.ignore[best_pat]
+				if ignore:
+					ignore(self, best_m)
+
+	def peek(self, *types, **kw):
+		"""Returns the token type for lookahead; if there are any args
+		then the list of args is the set of token types to allow"""
+		context = kw.get("context",None)
+		if self.last_token is None:
+			self.last_types = types
+			self.last_token = self.token(types,context)
+		elif self.last_types:
+			for t in types:
+				if t not in self.last_types:
+					raise NotImplementedError("Unimplemented: restriction set changed")
+		return self.last_token.type
+		
+	def scan(self, type, **kw):
+		"""Returns the matched text, and moves to the next token"""
+		context = kw.get("context",None)
+
+		if self.last_token is None:
+			tok = self.token([type],context)
+		else:
+			if self.last_types and type not in self.last_types:
+				raise NotImplementedError("Unimplemented: restriction set changed")
+
+			tok = self.last_token
+			self.last_token = None
+		if tok.type != type:
+			if not self.last_types: self.last_types=[]
+			raise SyntaxError(tok.pos, 'Trying to find '+type+': '+ ', '.join(self.last_types)+", got "+tok.type, context=context)
+		return tok.value
+
+class Parser(object):
+	"""Base class for Yapps-generated parsers.
+
+	"""
+	
+	def __init__(self, scanner):
+		self._scanner = scanner
+		
+	def _stack(self, input="",file=None,filename=None):
+		"""Temporarily read from someplace else"""
+		self._scanner.stack_input(input,file,filename)
+		self._tok = None
+
+	def _peek(self, *types, **kw):
+		"""Returns the token type for lookahead; if there are any args
+		then the list of args is the set of token types to allow"""
+		return self._scanner.peek(*types, **kw)
+		
+	def _scan(self, type, **kw):
+		"""Returns the matched text, and moves to the next token"""
+		return self._scanner.scan(type, **kw)
+
+class Context(object):
+	"""Class to represent the parser's call stack.
+
+	Every rule creates a Context that links to its parent rule.  The
+	contexts can be used for debugging.
+
+	"""
+	
+	def __init__(self, parent, scanner, rule, args=()):
+		"""Create a new context.
+
+		Args:
+		parent: Context object or None
+		scanner: Scanner object
+		rule: string (name of the rule)
+		args: tuple listing parameters to the rule
+
+		"""
+		self.parent = parent
+		self.scanner = scanner
+		self.rule = rule
+		self.args = args
+		while scanner.stack: scanner = scanner.stack
+		self.token = scanner.last_read_token
+
+	def __str__(self):
+		output = ''
+		if self.parent: output = str(self.parent) + ' > '
+		output += self.rule
+		return output
+	
+def print_error(err, scanner, max_ctx=None):
+	"""Print error messages, the parser stack, and the input text -- for human-readable error messages."""
+	# NOTE: this function assumes 80 columns :-(
+	# Figure out the line number
+	pos = err.pos
+	if not pos:
+		pos = scanner.get_pos()
+
+	file_name, line_number, column_number = pos
+	print >>sys.stderr, '%s:%d:%d: %s' % (file_name, line_number, column_number, err.msg)
+
+	scanner.print_line_with_pointer(pos)
+		
+	context = err.context
+	token = None
+	while context:
+		print >>sys.stderr, 'while parsing %s%s:' % (context.rule, tuple(context.args))
+		if context.token:
+			token = context.token
+		if token:
+			scanner.print_line_with_pointer(token.pos, length=len(token.value))
+		context = context.parent
+		if max_ctx:
+			max_ctx = max_ctx-1
+			if not max_ctx:
+				break
+
+def wrap_error_reporter(parser, rule, *args,**kw):
+	try:
+		return getattr(parser, rule)(*args,**kw)
+	except SyntaxError, e:
+		print_error(e, parser._scanner)
+	except NoMoreTokens:
+		print >>sys.stderr, 'Could not complete parsing; stopped around here:'
+		print >>sys.stderr, parser._scanner
--- yapps2-2.1.1.orig/yapps2.py
+++ yapps2-2.1.1/yapps2.py
@@ -1,4 +1,4 @@
-#!/usr/bin/python2
+#!/usr/bin/python
 
 #
 # Yapps 2 - yet another python parser system
@@ -13,7 +13,7 @@
 
 import sys, re
 
-import yappsrt, parsetree
+from yapps import runtime, parsetree
 
 def generate(inputfilename, outputfilename='', dump=0, **flags):
     """Generate a grammar, given an input filename (X.g)
@@ -40,11 +40,12 @@
     if f >= 0: s, postparser = s[:f], '\n\n'+s[f+len(DIVIDER):]
 
     # Create the parser and scanner and parse the text
-    scanner = grammar.ParserDescriptionScanner(s)
-    if preparser: scanner.first_line_number = 1 + preparser.count('\n')
+    scanner = grammar.ParserDescriptionScanner(s, filename=inputfilename)
+    if preparser: scanner.del_line += preparser.count('\n')
+
     parser = grammar.ParserDescription(scanner)
-    t = yappsrt.wrap_error_reporter(parser, 'Parser')
-    if t is None: return # Failure
+    t = runtime.wrap_error_reporter(parser, 'Parser')
+    if t is None: return 1 # Failure
     if preparser is not None: t.preparser = preparser
     if postparser is not None: t.postparser = postparser
 
@@ -63,6 +64,7 @@
     else:
         t.output = open(outputfilename, 'w')
         t.generate_output()
+    return 0
 
 if __name__ == '__main__':
     import doctest
@@ -106,6 +108,6 @@
         if use_devel_grammar:
             import yapps_grammar as grammar
         else:
-            import grammar
+            from yapps import grammar
             
-        generate(*tuple(args), **flags)
+        sys.exit(generate(*tuple(args), **flags))
--- yapps2-2.1.1.orig/yapps_grammar.g
+++ yapps2-2.1.1/yapps_grammar.g
@@ -0,0 +1,121 @@
+# grammar.py, part of Yapps 2 - yet another python parser system
+# Copyright 1999-2003 by Amit J. Patel <amitp@cs.stanford.edu>
+# Enhancements copyright 2003-2004 by Matthias Urlichs <smurf@debian.org>
+#
+# This version of the Yapps 2 grammar can be distributed under the
+# terms of the MIT open source license, either found in the LICENSE
+# file included with the Yapps distribution
+# <http://theory.stanford.edu/~amitp/yapps/> or at
+# <http://www.opensource.org/licenses/mit-license.php>
+#
+
+"""Parser for Yapps grammars.
+
+This file defines the grammar of Yapps grammars.  Naturally, it is
+implemented in Yapps.  The grammar.py module needed by Yapps is built
+by running Yapps on yapps_grammar.g.  (Holy circularity, Batman!)
+
+"""
+
+import sys, re
+from yapps import parsetree
+
+######################################################################
+def cleanup_choice(rule, lst):
+    if len(lst) == 0: return parsetree.Sequence(rule)  # no alternatives: empty sequence (bare `Sequence` was undefined here)
+    if len(lst) == 1: return lst[0]  # a single alternative needs no Choice wrapper
+    return parsetree.Choice(rule, *tuple(lst))
+
+def cleanup_sequence(rule, lst):
+    if len(lst) == 1: return lst[0]
+    return parsetree.Sequence(rule, *tuple(lst))
+
+def resolve_name(rule, tokens, id, args):
+    if id in [x[0] for x in tokens]:
+        # It's a token; any parameters given are ignored, so warn about them
+        if args:
+            print 'Warning: ignoring parameters on TOKEN %s<<%s>>' % (id, args)
+        return parsetree.Terminal(rule, id)
+    else:
+        # It's a name, so assume it's a nonterminal
+        return parsetree.NonTerminal(rule, id, args)
+
+%%
+parser ParserDescription:
+
+    ignore:      "[ \t\r\n]+"
+    ignore:      "#.*?\r?\n"
+    token EOF:   "$"
+    token ATTR:  "<<.+?>>"
+    token STMT:  "{{.+?}}"
+    token ID:    '[a-zA-Z_][a-zA-Z_0-9]*'
+    token STR:   '[rR]?\'([^\\n\'\\\\]|\\\\.)*\'|[rR]?"([^\\n"\\\\]|\\\\.)*"'
+    token LP:    '\\('
+    token RP:    '\\)'
+    token LB:    '\\['
+    token RB:    '\\]'
+    token OR:    '[|]'
+    token STAR:  '[*]'
+    token PLUS:  '[+]'
+    token QUEST: '[?]'
+    token COLON: ':'
+
+    rule Parser: "parser" ID ":"
+                   Options
+                   Tokens
+                   Rules<<Tokens>> 
+                 EOF 
+                 {{ return parsetree.Generator(ID,Options,Tokens,Rules) }}
+
+    rule Options: {{ opt = {} }}
+                  ( "option" ":" Str {{ opt[Str] = 1 }} )*
+                  {{ return opt }}
+
+    rule Tokens:  {{ tok = [] }}
+                  (
+                    "token" ID ":" Str {{ tok.append( (ID,Str) ) }}
+                  | "ignore"  
+				    ":" Str {{ ign = ('#ignore',Str) }}
+				    ( STMT  {{ ign = ign + (STMT[2:-2],) }} )?
+				            {{ tok.append( ign ) }}
+                  )*
+                  {{ return tok }}
+
+    rule Rules<<tokens>>:
+                  {{ rul = [] }}
+                  (
+                    "rule" ID OptParam ":" ClauseA<<ID, tokens>>
+                    {{ rul.append( (ID, OptParam, ClauseA) ) }}
+                  )*
+                  {{ return rul }}
+
+    rule ClauseA<<rule, tokens>>:
+                  ClauseB<<rule,tokens>>
+                  {{ v = [ClauseB] }}
+                  ( OR ClauseB<<rule,tokens>> {{ v.append(ClauseB) }} )*
+                  {{ return cleanup_choice(rule,v) }}
+
+    rule ClauseB<<rule,tokens>>:
+                  {{ v = [] }}
+                  ( ClauseC<<rule,tokens>> {{ v.append(ClauseC) }} )*
+                  {{ return cleanup_sequence(rule, v) }}
+
+    rule ClauseC<<rule,tokens>>:
+                  ClauseD<<rule,tokens>>
+                  ( PLUS {{ return parsetree.Plus(rule, ClauseD) }}
+                  | STAR {{ return parsetree.Star(rule, ClauseD) }}
+                  | QUEST {{ return parsetree.Option(rule, ClauseD) }}
+                  |      {{ return ClauseD }} )
+
+    rule ClauseD<<rule,tokens>>:
+                  STR {{ t = (STR, eval(STR,{},{})) }}
+                      {{ if t not in tokens: tokens.insert( 0, t ) }} 
+                      {{ return parsetree.Terminal(rule, STR) }}
+                | ID OptParam {{ return resolve_name(rule,tokens, ID, OptParam) }}
+                | LP ClauseA<<rule,tokens>> RP {{ return ClauseA }}
+                | LB ClauseA<<rule,tokens>> RB {{ return parsetree.Option(rule, ClauseA) }}
+                | STMT {{ return parsetree.Eval(rule, STMT[2:-2]) }}
+
+    rule OptParam: [ ATTR {{ return ATTR[2:-2] }} ] {{ return '' }}
+    rule Str:   STR {{ return eval(STR,{},{}) }}
+%%