commit 02da7f9e45ba2af967ae1b71575be62763da3bba
Author: Paul Evans <>
Date:   Sat Dec 11 19:46:20 2010 +0000

    Import of PEVANS/Parser-MGC-0.01 from CPAN.
    gitpan-cpan-distribution: Parser-MGC
    gitpan-cpan-version:      0.01
    gitpan-cpan-path:         PEVANS/Parser-MGC-0.01.tar.gz
    gitpan-cpan-author:       PEVANS
    gitpan-cpan-maturity:     released
 Build.PL           |  19 ++
 Changes            |   4 +
 LICENSE            | 377 ++++++++++++++++++++++++++++++++
 MANIFEST           |  24 +++
 META.yml           |  21 ++
 Makefile.PL        |  14 ++
 README             | 194 +++++++++++++++++
 lib/Parser/MGC.pm  | 614 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 t/00use.t          |   3 +
 t/01base.t         |  36 ++++
 t/02expect.t       |  31 +++
 t/03where.t        |  47 ++++
 t/04comment.t      |  32 +++
 t/10token_int.t    |  26 +++
 t/11token_string.t |  32 +++
 t/12token_ident.t  |  38 ++++
 t/13token_kw.t     |  28 +++
 t/20maybe.t        |  32 +++
 t/21scope_of.t     |  28 +++
 t/22list_of.t      |  25 +++
 t/23sequence_of.t  |  24 +++
 t/24one_of.t       |  33 +++
 t/30commit.t       |  39 ++++
 t/99pod.t          |   8 +
 24 files changed, 1729 insertions(+)

diff --git a/Build.PL b/Build.PL
new file mode 100644
index 0000000..f98f30d
--- /dev/null
+++ b/Build.PL
@@ -0,0 +1,19 @@
+use strict;
+use warnings;
+use Module::Build;
+my $build = Module::Build->new(
+   module_name => 'Parser::MGC',
+   requires => {
+   },
+   build_requires => {
+      'Test::More' => 0,
+   },
+   license => 'perl',
+   create_makefile_pl => 'traditional',
+   create_license => 1,
+   create_readme  => 1,
diff --git a/Changes b/Changes
new file mode 100644
index 0000000..086fef5
--- /dev/null
+++ b/Changes
@@ -0,0 +1,4 @@
+Revision history for Parser-MGC
+0.01    First version, released on an unsuspecting world.
diff --git a/MANIFEST b/MANIFEST
new file mode 100644
index 0000000..ace5273
--- /dev/null
@@ -0,0 +1,24 @@
+MANIFEST                       This list of files
diff --git a/META.yml b/META.yml
new file mode 100644
index 0000000..4f0c13c
--- /dev/null
+++ b/META.yml
@@ -0,0 +1,21 @@
+abstract: 'build simple recursive-descent parsers'
+  - 'Paul Evans <>'
+  Test::More: 0
+  Module::Build: 0.36
+generated_by: 'Module::Build version 0.3607'
+license: perl
+  url:
+  version: 1.4
+name: Parser-MGC
+  Parser::MGC:
+    file: lib/Parser/MGC.pm
+    version: 0.01
+  license:
+version: 0.01
diff --git a/Makefile.PL b/Makefile.PL
new file mode 100644
index 0000000..1c06b3a
--- /dev/null
+++ b/Makefile.PL
@@ -0,0 +1,14 @@
+# Note: this file was auto-generated by Module::Build::Compat version 0.3607
+use ExtUtils::MakeMaker;
+          'NAME' => 'Parser::MGC',
+          'VERSION_FROM' => 'lib/Parser/MGC.pm',
+          'PREREQ_PM' => {
+                           'Test::More' => 0
+                         },
+          'INSTALLDIRS' => 'site',
+          'EXE_FILES' => [],
+          'PL_FILES' => {}
+        )
diff --git a/README b/README
new file mode 100644
index 0000000..c1ac37f
--- /dev/null
+++ b/README
@@ -0,0 +1,194 @@
+    "Parser::MGC" - build simple recursive-descent parsers
+     package My::Grammar::Parser;
+     use base qw( Parser::MGC );
+     sub parse
+     {
+        my $self = shift;
+        $self->sequence_of( sub {
+           $self->one_of(
+              sub { $self->token_int },
+              sub { $self->token_string },
+              sub { \$self->token_ident },
+              sub { $self->scope_of( "(", \&parse, ")" ) }
+           );
+        } );
+     }
+     my $parser = My::Grammar::Parser->new;
+     my $tree = $parser->from_file( $ARGV[0] );
+     ...
+    This base class provides a low-level framework for building
+    recursive-descent parsers that consume a given input string from left to
+    right, returning a parse structure. It takes its name from the "m//gc"
+    regexps used to implement the token parsing behaviour.
+    It provides a number of token-parsing methods, which each atomically
+    extract a grammatical token from the string. It also provides wrapping
+    methods that can be used to build up a possibly-recursive grammar
+    structure. Each method, both token and structural, atomically either
+    consumes a prefix of the string and returns its result, or fails and
+    consumes nothing.
+  $parser = Parser::MGC->new( %args )
+    Returns a new instance of a "Parser::MGC" object. This must be called on
+    a subclass that provides a "parse" method.
+    Takes the following named arguments
+    patterns => HASH
+            Keys in this hash should map to quoted regexp ("qr//")
+            references, to override the default patterns used to match
+            tokens. See "PATTERNS" below
+    The following pattern names are recognised. They may be passed to the
+    constructor in the "patterns" hash, or provided as a class method under
+    the name "pattern_*name*".
+    *   ws
+        Pattern used to skip whitespace between tokens. Defaults to
+        "/[\s\n\t]+/"
+    *   comment
+        Pattern used to skip comments between tokens. Undefined by default.
+    *   ident
+        Pattern used to parse an identifier by "token_ident". Defaults to
+        "/[[:alpha:]_]\w*/"
+    *   string_delim
+        Pattern used to delimit a string by "token_string". Defaults to
+        "/["']/".
+  $result = $parser->from_string( $str )
+    Parse the given literal string and return the result from the "parse"
+    method.
+  $result = $parser->from_file( $file )
+    Parse the given file, which may be a pathname in a string, or an opened
+    IO handle, and return the result from the "parse" method.
+  ( $lineno, $col, $text ) = $parser->where
+    Returns the current parse position, as a line and column number, and the
+    entire current line of text. The first line is numbered 1, and the first
+    column is numbered 0.
+  $parser->fail( $message )
+    Aborts the current parse attempt with the given message string. The
+    failure message will include the current line and column position, and
+    will include the line of input that failed.
+  $eos = $parser->at_eos
+    Returns true if the current parse position is at the end of the input
+    string, or at the end-of-scope marker of an enclosing "scope_of".
+    The following methods may be used to build a grammatical structure out
+    of the defined basic token-parsing methods. Each takes at least one code
+    reference, which will be passed the actual $parser object as its first
+    argument.
+  $ret = $parser->maybe( $code )
+    Attempts to execute the given $code reference in scalar context, passing
+    in the $parser object, and returning what it returned. If the code fails to
+    parse by calling the "fail" method then none of the input string will be
+    consumed; the current parsing position will be restored. "undef" will be
+    returned in this case.
+    This may be considered to be similar to the "?" regexp qualifier.
+  $ret = $parser->scope_of( $start, $code, $stop )
+    Expects to find the $start pattern, then attempts to execute the given
+    $code reference, then expects to find the $stop pattern. Returns
+    whatever the code reference returned.
+    While the code is being executed, the $stop pattern will be used by the
+    token parsing methods as an end-of-scope marker; causing them to return
+    "undef".
+  $ret = $parser->list_of( $sep, $code )
+    Expects to find a list of instances of something parsed by $code,
+    separated by the $sep pattern. Returns an ARRAY ref containing a list of
+    the return values from the $code.
+    This method does not consider it an error if the returned list is empty;
+    that is, that the scope ended before any item instances were parsed from
+    it.
+  $ret = $parser->sequence_of( $code )
+    A shortcut for calling "list_of" with an empty string as separator;
+    expects to find at least one instance of something parsed by $code,
+    separated only by skipped whitespace.
+    This may be considered to be similar to the "+" or "*" regexp
+    qualifiers.
+  $ret = $parser->one_of( @codes )
+    Expects that one of the given code references can parse something from
+    the input, returning what it returned. Each code reference may indicate
+    a failure to parse by calling the "fail" method.
+    This may be considered to be similar to the "|" regexp operator for
+    forming alternations of possible parse trees.
+  $parser->commit
+    Calling this method will cancel the backtracking behaviour of the
+    innermost "maybe" or "one_of" structure forming method. That is, if
+    later code then calls "fail", the exception will be propagated out of
+    "maybe", and no further code blocks will be attempted by "one_of".
+    Typically this will be called once the grammatical structure of an
+    alternation has been determined, ensuring that any further failures are
+    raised as real exceptions, rather than by attempting other alternatives.
+     TODO: Code example with commit inside one_of
+    The following methods attempt to consume some part of the input string,
+    to be used as part of the parsing process.
+    As a convenience for parsing, each of these methods will return undef if
+    the string is already at the end (if "at_eos" returns true).
+  $parser->expect( $string )
+  $parser->expect( qr/pattern/ )
+    Expects to find a literal string or regexp pattern match, and consumes
+    it. This method does not return a useful value.
+  $int = $parser->token_int
+    Expects to find an integer in decimal, octal or hexadecimal notation,
+    and consumes it.
+  $str = $parser->token_string
+    Expects to find a quoted string, and consumes it. The string should be
+    quoted using """ or "'" quote marks.
+  $ident = $parser->token_ident
+    Expects to find an identifier, and consumes it.
+  $keyword = $parser->token_kw( @keywords )
+    Expects to find a keyword, and consumes it. A keyword is defined as an
+    identifier which is exactly one of the literal values passed in.
+    *   Unescaping of string constants; customisable
+    *   Easy ability for subclasses to define more token types
+    Paul Evans <>
diff --git a/lib/Parser/MGC.pm b/lib/Parser/MGC.pm
new file mode 100644
index 0000000..1bd12d0
--- /dev/null
+++ b/lib/Parser/MGC.pm
@@ -0,0 +1,614 @@
+#  You may distribute under the terms of either the GNU General Public License
+#  or the Artistic License (the same terms as Perl itself)
+#  (C) Paul Evans, 2010 --
+package Parser::MGC;
+use strict;
+use warnings;
+our $VERSION = '0.01';
+use Carp;
+use File::Slurp qw( slurp );
+=head1 NAME
+C<Parser::MGC> - build simple recursive-descent parsers
+=head1 SYNOPSIS
+ package My::Grammar::Parser;
+ use base qw( Parser::MGC );
+ sub parse
+ {
+    my $self = shift;
+    $self->sequence_of( sub {
+       $self->one_of(
+          sub { $self->token_int },
+          sub { $self->token_string },
+          sub { \$self->token_ident },
+          sub { $self->scope_of( "(", \&parse, ")" ) }
+       );
+    } );
+ }
+ my $parser = My::Grammar::Parser->new;
+ my $tree = $parser->from_file( $ARGV[0] );
+ ...
+This base class provides a low-level framework for building recursive-descent
+parsers that consume a given input string from left to right, returning a
+parse structure. It takes its name from the C<m//gc> regexps used to implement
+the token parsing behaviour.
+It provides a number of token-parsing methods, which each atomically extract a
+grammatical token from the string. It also provides wrapping methods that can
+be used to build up a possibly-recursive grammar structure. Each method, both
+token and structural, atomically either consumes a prefix of the string and
+returns its result, or fails and consumes nothing.
+=head2 $parser = Parser::MGC->new( %args )
+Returns a new instance of a C<Parser::MGC> object. This must be called on a
+subclass that provides a C<parse> method.
+Takes the following named arguments
+=over 8
+=item patterns => HASH
+Keys in this hash should map to quoted regexp (C<qr//>) references, to
+override the default patterns used to match tokens. See C<PATTERNS> below
+=head1 PATTERNS
+The following pattern names are recognised. They may be passed to the
+constructor in the C<patterns> hash, or provided as a class method under the
+name C<pattern_I<name>>.
+=over 4
+=item * ws
+Pattern used to skip whitespace between tokens. Defaults to C</[\s\n\t]+/>
+=item * comment
+Pattern used to skip comments between tokens. Undefined by default.
+=item * ident
+Pattern used to parse an identifier by C<token_ident>. Defaults to
+C</[[:alpha:]_]\w*/>
+=item * string_delim
+Pattern used to delimit a string by C<token_string>. Defaults to C</["']/>.
+my @patterns = qw(
+   ws
+   comment
+   ident
+   string_delim
+use constant {
+   pattern_ws      => qr/[\s\n\t]+/,
+   pattern_comment => undef,
+   pattern_ident   => qr/[[:alpha:]_]\w*/,
+   pattern_string_delim => qr/["']/,
+sub new
+{
+   # Constructor: takes named arguments; 'patterns' is a HASH of qr// overrides
+   # keyed by pattern name. Returns the new parser object.
+   my $class = shift;
+   my %args = @_;
+   # This base class has no grammar of its own; the subclass supplies ->parse
+   $class->can( "parse" ) or
+      croak "Expected to be a subclass that can ->parse";
+   my $self = bless {
+      patterns => {},
+   }, $class;
+   # For each known pattern name, prefer the per-instance override and fall
+   # back to the class's pattern_NAME constant/method
+   $self->{patterns}{$_} = $args{patterns}{$_} || $self->${\"pattern_$_"}
+      for @patterns;
+   return $self;
+}
+=head1 METHODS
+=head2 $result = $parser->from_string( $str )
+Parse the given literal string and return the result from the C<parse> method.
+sub from_string
+   my $self = shift;
+   my ( $str ) = @_;
+   $self->{str} = $str;
+   pos $self->{str} = 0;
+   my $result = $self->parse;
+   $self->at_eos or
+      $self->fail( "Expected end of input" );
+   return $result;
+=head2 $result = $parser->from_file( $file )
+Parse the given file, which may be a pathname in a string, or an opened IO
+handle, and return the result from the C<parse> method.
+sub from_file
+   my $self = shift;
+   my ( $filename ) = @_;
+   $self->{filename} = $filename;
+   $self->from_string( scalar(slurp $filename) );
+=head2 ( $lineno, $col, $text ) = $parser->where
+Returns the current parse position, as a line and column number, and
+the entire current line of text. The first line is numbered 1, and the first
+column is numbered 0.
+sub where
+   my $self = shift;
+   my $pos = pos $self->{str};
+   my $str = $self->{str};
+   my $sol = $pos;
+   $sol-- if $sol > 0 and substr( $str, $sol, 1 ) =~ m/^[\r\n]$/;
+   $sol-- while $sol > 0 and substr( $str, $sol-1, 1 ) !~ m/^[\r\n]$/;
+   my $eol = $pos;
+   $eol++ while $eol < length($str) and substr( $str, $eol, 1 ) !~ m/^[\r\n]$/;
+   my $line = substr( $str, $sol, $eol - $sol );
+   my $col = $pos - $sol;
+   my $lineno = ( () = substr( $str, 0, $pos ) =~ m/\n/g ) + 1;
+   return ( $lineno, $col, $line );
+=head2 $parser->fail( $message )
+Aborts the current parse attempt with the given message string. The failure
+message will include the current line and column position, and will include
+the line of input that failed.
+sub fail
+{
+   # Abort the current parse attempt by throwing a Parser::MGC::Failure that
+   # carries $message plus the position reported by ->where
+   # ( line number, column, text of the current line ).
+   my $self = shift;
+   my ( $message ) = @_;
+   # ->where is evaluated once, in list context, directly into the
+   # constructor's argument list
+   die Parser::MGC::Failure->new( $message, $self->where );
+}
+=head2 $eos = $parser->at_eos
+Returns true if the current parse position is at the end of the input string,
+or at the end-of-scope marker of an enclosing C<scope_of>.
+sub at_eos
+   my $self = shift;
+   $self->skip_ws;
+   my $pos = pos $self->{str};
+   return 1 if defined $pos and $pos >= length $self->{str};
+   return 0 unless defined $self->{endofscope};
+   # No /g so we won't actually alter pos()
+   my $at_eos = $self->{str} =~ m/\G$self->{endofscope}/;
+   return $at_eos;
+The following methods may be used to build a grammatical structure out of the
+defined basic token-parsing methods. Each takes at least one code reference,
+which will be passed the actual C<$parser> object as its first argument.
+=head2 $ret = $parser->maybe( $code )
+Attempts to execute the given C<$code> reference in scalar context, passing in
+the C<$parser> object, and returning what it returned. If the code fails to
+parse by calling the C<fail> method then none of the input string will be
+consumed; the current parsing position will be restored. C<undef> will be
+returned in this case.
+This may be considered to be similar to the C<?> regexp qualifier.
+sub maybe
+   my $self = shift;
+   my ( $code ) = @_;
+   my $pos = pos $self->{str};
+   my $committed = 0;
+   local $self->{committer} = sub { $committed++ };
+   my $ret;
+   eval { $ret = $code->( $self ); 1 } and return $ret;
+   my $e = $@;
+   pos($self->{str}) = $pos;
+   die $e if $committed or not eval { $e->isa( "Parser::MGC::Failure" ) };
+   return undef;
+=head2 $ret = $parser->scope_of( $start, $code, $stop )
+Expects to find the C<$start> pattern, then attempts to execute the given
+C<$code> reference, then expects to find the C<$stop> pattern. Returns
+whatever the code reference returned.
+While the code is being executed, the C<$stop> pattern will be used by the
+token parsing methods as an end-of-scope marker; causing them to return
+C<undef>.
+sub scope_of
+   my $self = shift;
+   my ( $start, $code, $stop ) = @_;
+   ref $stop or $stop = qr/\Q$stop/;
+   $self->expect( $start );
+   local $self->{endofscope} = $stop;
+   my $ret = $code->( $self );
+   $self->expect( $stop );
+   return $ret;
+=head2 $ret = $parser->list_of( $sep, $code )
+Expects to find a list of instances of something parsed by C<$code>,
+separated by the C<$sep> pattern. Returns an ARRAY ref containing a list of
+the return values from the C<$code>.
+This method does not consider it an error if the returned list is empty; that
+is, that the scope ended before any item instances were parsed from it.
+sub list_of
+   my $self = shift;
+   my ( $sep, $code ) = @_;
+   ref $sep or $sep = qr/\Q$sep/;
+   my @ret;
+   while( !$self->at_eos ) {
+      push @ret, scalar $code->( $self );
+      $self->skip_ws;
+      $self->{str} =~ m/\G$sep/gc or last;
+   }
+   return \@ret;
+=head2 $ret = $parser->sequence_of( $code )
+A shortcut for calling C<list_of> with an empty string as separator; expects
+to find at least one instance of something parsed by C<$code>, separated only
+by skipped whitespace.
+This may be considered to be similar to the C<+> or C<*> regexp qualifiers.
+sub sequence_of
+   my $self = shift;
+   my ( $code ) = @_;
+   return $self->list_of( "", $code );
+=head2 $ret = $parser->one_of( @codes )
+Expects that one of the given code references can parse something from the
+input, returning what it returned. Each code reference may indicate a failure
+to parse by calling the C<fail> method.
+This may be considered to be similar to the C<|> regexp operator for forming
+alternations of possible parse trees.
+sub one_of
+{
+   # Try each code reference in @_ in turn, passing it the parser, and return
+   # the scalar result of the first one that completes without throwing.
+   # A Parser::MGC::Failure from an alternative rewinds the position and moves
+   # on to the next; any other exception, or a failure after ->commit, is
+   # rethrown. If every alternative fails, ->fail is called.
+   my $self = shift;
+   while( @_ ) {
+      my $code = shift;
+      my $pos = pos $self->{str};
+      my $committed = 0;
+      local $self->{committer} = sub { $committed++ };
+      my $ret;
+      # Success is signalled by the trailing 1, not by the truth of $ret, so
+      # an alternative may legitimately return 0, "" or undef
+      eval { $ret = $code->( $self ); 1 } and return $ret;
+      my $e = $@;
+      # Backtrack before deciding whether the error is ours to swallow
+      pos( $self->{str} ) = $pos;
+      die $e if $committed or not eval { $e->isa( "Parser::MGC::Failure" ) };
+   }
+   $self->fail( "Found nothing parseable" );
+}
+=head2 $parser->commit
+Calling this method will cancel the backtracking behaviour of the innermost
+C<maybe> or C<one_of> structure forming method. That is, if later code then
+calls C<fail>, the exception will be propagated out of C<maybe>, and no
+further code blocks will be attempted by C<one_of>.
+Typically this will be called once the grammatical structure of an
+alternation has been determined, ensuring that any further failures are raised
+as real exceptions, rather than by attempting other alternatives.
+ TODO: Code example with commit inside one_of
+sub commit
+   my $self = shift;
+   if( $self->{committer} ) {
+      $self->{committer}->();
+   }
+   else {
+      croak "Cannot commit except within a backtrack-able structure";
+   }
+The following methods attempt to consume some part of the input string, to be
+used as part of the parsing process.
+As a convenience for parsing, each of these methods will return undef if the
+string is already at the end (if C<at_eos> returns true).
+sub skip_ws
+   my $self = shift;
+   my $ws = $self->{patterns}{ws};
+   my $c  = $self->{patterns}{comment};
+   1 while $self->{str} =~ m/\G$ws/gc or
+           ( $c and $self->{str} =~ m/\G$c/gc );
+=head2 $parser->expect( $string )
+=head2 $parser->expect( qr/pattern/ )
+Expects to find a literal string or regexp pattern match, and consumes it.
+This method does not return a useful value.
+sub expect
+   my $self = shift;
+   my ( $expect ) = @_;
+   ref $expect or $expect = qr/\Q$expect/;
+   $self->skip_ws;
+   $self->{str} =~ m/\G$expect/gc or
+      $self->fail( "Expected $expect" );
+=head2 $int = $parser->token_int
+Expects to find an integer in decimal, octal or hexadecimal notation, and
+consumes it.
+sub token_int
+   my $self = shift;
+   return undef if $self->at_eos;
+   $self->{str} =~ m/\G(0x[[:xdigit:]]+|[[:digit:]]+)/gc or
+      $self->fail( "Expected integer" );
+   my $int = $1;
+   return oct $int if $int =~ m/^0/;
+   return $int;
+=head2 $str = $parser->token_string
+Expects to find a quoted string, and consumes it. The string should be quoted
+using C<"> or C<'> quote marks.
+sub token_string
+{
+   # Consume a quoted string and return its contents without the delimiters.
+   # Returns undef at end of input/scope; calls ->fail, consuming nothing, if
+   # no well-formed string is found at the current position.
+   my $self = shift;
+   return undef if $self->at_eos;
+   # Remember where the token starts so a half-matched string can be undone
+   my $pos = pos $self->{str};
+   $self->{str} =~ m/\G($self->{patterns}{string_delim})/gc or
+      $self->fail( "Expected string delimiter" );
+   my $delim = $1;
+   # Non-greedy body: stop at the first unescaped closing delimiter rather
+   # than the last one in the input. \Q..\E because $delim is matched text,
+   # not a pattern.
+   $self->{str} =~ m/\G((?:\\.|[^\\])*?)\Q$delim\E/gc or
+      pos($self->{str}) = $pos, $self->fail( "Expected contents of string" );
+   my $string = $1;
+   # TODO: Unescape stuff like \\ and \n and whatnot
+   return $string;
+}
+=head2 $ident = $parser->token_ident
+Expects to find an identifier, and consumes it.
+sub token_ident
+   my $self = shift;
+   return undef if $self->at_eos;
+   $self->{str} =~ m/\G($self->{patterns}{ident})/gc or
+      $self->fail( "Expected identifier" );
+   return $1;
+=head2 $keyword = $parser->token_kw( @keywords )
+Expects to find a keyword, and consumes it. A keyword is defined as an
+identifier which is exactly one of the literal values passed in.
+sub token_kw
+   my $self = shift;
+   my @acceptable = @_;
+   $self->skip_ws;
+   my $pos = pos $self->{str};
+   defined( my $kw = $self->token_ident ) or
+      return undef;
+   grep { $_ eq $kw } @acceptable or
+      pos($self->{str}) = $pos, $self->fail( "Expected any of ".join( ", ", 
@acceptable ) );
+   return $kw;
+package # hide from indexer
+   Parser::MGC::Failure;
+sub new
+   my $class = shift;
+   my $self = bless {}, $class;
+   @{$self}{qw( message linenum col text )} = @_;
+   return $self;
+use overload '""' => "STRING";
+sub STRING
+{
+   # Stringification handler named in the overload table above: renders the
+   # message and line number, the offending line of input, and a caret line
+   # indented by the stored column.
+   my $self = shift;
+   return "$self->{message} on line $self->{linenum} at:\n" .
+          "$self->{text}\n" .
+          ( " " x $self->{col} . "^" ) . "\n";
+}
+# Keep perl happy; keep Britain tidy
+=head1 TODO
+=over 4
+=item *
+Unescaping of string constants; customisable
+=item *
+Easy ability for subclasses to define more token types
+=head1 AUTHOR
+Paul Evans <>
diff --git a/t/00use.t b/t/00use.t
new file mode 100644
index 0000000..d2dc1c4
--- /dev/null
+++ b/t/00use.t
@@ -0,0 +1,3 @@
+use Test::More tests => 1;
+use_ok( "Parser::MGC" );
diff --git a/t/01base.t b/t/01base.t
new file mode 100644
index 0000000..6efca79
--- /dev/null
+++ b/t/01base.t
@@ -0,0 +1,36 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 4;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   # Some slight cheating here
+   pos( $self->{str} ) = length( $self->{str} );
+   return [ split ' ', $self->{str} ];
+package main;
+my $parser = TestParser->new;
+isa_ok( $parser, "TestParser", '$parser' );
+isa_ok( $parser, "Parser::MGC", '$parser' );
+my $tokens = $parser->from_string( "1 2 3" );
+is_deeply( $tokens, [ 1, 2, 3 ], '->from_string' );
+$tokens = $parser->from_file( \*DATA );
+is_deeply( $tokens, [ 4, 5, 6 ], '->from_file(\*DATA)' );
+4 5 6
diff --git a/t/02expect.t b/t/02expect.t
new file mode 100644
index 0000000..df8049b
--- /dev/null
+++ b/t/02expect.t
@@ -0,0 +1,31 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 3;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->expect( "hello" );
+   $self->expect( qr/world/ );
+   return 1;
+package main;
+my $parser = TestParser->new;
+ok( $parser->from_string( "hello world" ), '"hello world"' );
+ok( !eval { $parser->from_string( "goodbye world" ) }, '"goodbye world" fails' 
+is( $@,
+   qq[Expected (?-xism:hello) on line 1 at:\n] . 
+   qq[goodbye world\n] . 
+   qq[^\n],
+   'Exception from "goodbye world" failure' );
diff --git a/t/03where.t b/t/03where.t
new file mode 100644
index 0000000..a955bd2
--- /dev/null
+++ b/t/03where.t
@@ -0,0 +1,47 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 6;
+my @positions;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   main::is_deeply( [ $self->where ],
+      $positions[0],
+      '->where before parsing' );
+   $self->expect( "hello" );
+   main::is_deeply( [ $self->where ],
+      $positions[1],
+      '->where during parsing' );
+   $self->expect( qr/world/ );
+   main::is_deeply( [ $self->where ],
+      $positions[2],
+      '->where after parsing' );
+   return 1;
+package main;
+my $parser = TestParser->new;
+@positions = (
+   [ 1, 0, "hello world" ],
+   [ 1, 5, "hello world" ],
+   [ 1, 11, "hello world" ], );
+$parser->from_string( "hello world" );
+@positions = (
+   [ 1, 0, "hello" ],
+   [ 1, 5, "hello" ],
+   [ 2, 5, "world" ], );
+$parser->from_string( "hello\nworld" );
diff --git a/t/04comment.t b/t/04comment.t
new file mode 100644
index 0000000..a95f780
--- /dev/null
+++ b/t/04comment.t
@@ -0,0 +1,32 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 4;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->expect( "hello" );
+   $self->expect( qr/world/ );
+   return 1;
+package main;
+my $parser = TestParser->new;
+ok( $parser->from_string( "hello world" ), '"hello world"' );
+ok( $parser->from_string( "hello\nworld" ), '"hello\nworld"' );
+ok( !eval { $parser->from_string( "hello\n# Comment\nworld" ) }, '"hello 
world" with comment fails' );
+$parser = TestParser->new(
+   patterns => { comment => qr/#.*\n/ },
+ok( $parser->from_string( "hello\n# Comment\nworld" ), '"hello world" with 
comment passes' );
diff --git a/t/10token_int.t b/t/10token_int.t
new file mode 100644
index 0000000..e5cc0ce
--- /dev/null
+++ b/t/10token_int.t
@@ -0,0 +1,26 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 5;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   return $self->token_int;
+package main;
+my $parser = TestParser->new;
+is( $parser->from_string( "123" ), 123, 'Decimal integer' );
+is( $parser->from_string( "0" ),     0, 'Zero' );
+is( $parser->from_string( "0x20" ), 32, 'Hexadecimal integer' );
+is( $parser->from_string( "010" ),   8, 'Octal integer' );
+ok( !eval { $parser->from_string( "hello" ) }, '"hello" fails' );
diff --git a/t/11token_string.t b/t/11token_string.t
new file mode 100644
index 0000000..8c164c1
--- /dev/null
+++ b/t/11token_string.t
@@ -0,0 +1,32 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 6;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   return $self->token_string;
+package main;
+my $parser = TestParser->new;
+is( $parser->from_string( q['single'] ), "single", 'Single quoted string' );
+is( $parser->from_string( q["double"] ), "double", 'Double quoted string' );
+is( $parser->from_string( q["foo 'bar'"] ), "foo 'bar'", 'Double quoted string 
containing single substr' );
+is( $parser->from_string( q['foo "bar"'] ), 'foo "bar"', 'Single quoted string 
containing double substr' );
+$parser = TestParser->new(
+   patterns => { string_delim => qr/"/ }
+is( $parser->from_string( q["double"] ), "double", 'Double quoted string still 
passes' );
+ok( !eval { $parser->from_string( q['single'] ) }, 'Single quoted string now 
fails' );
diff --git a/t/12token_ident.t b/t/12token_ident.t
new file mode 100644
index 0000000..4785131
--- /dev/null
+++ b/t/12token_ident.t
@@ -0,0 +1,38 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 6;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   return $self->token_ident;
+package main;
+my $parser = TestParser->new;
+is( $parser->from_string( "foo" ), "foo", 'Identifier' );
+is( $parser->from_string( "x" ), "x", 'Single-letter identifier' );
+ok( !eval { $parser->from_string( "123" ) }, '"123" fails' );
+is( $@,
+   qq[Expected identifier on line 1 at:\n] .
+   qq[123\n] .
+   qq[^\n],
+   'Exception from "123" failure' );
+ok( !eval { $parser->from_string( "some-ident" ) }, '"some-ident" fails on 
default identifier' );
+$parser = TestParser->new(
+   patterns => { ident => qr/[[:alpha:]_][\w-]+/ },
+is( $parser->from_string( "some-ident" ), "some-ident", '"some-ident" passes 
with new token pattern' );
diff --git a/t/13token_kw.t b/t/13token_kw.t
new file mode 100644
index 0000000..d534245
--- /dev/null
+++ b/t/13token_kw.t
@@ -0,0 +1,28 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 3;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   return $self->token_kw( qw( foo bar ) );
+package main;
+my $parser = TestParser->new;
+is( $parser->from_string( "foo" ), "foo", 'Keyword' );
+ok( !eval { $parser->from_string( "splot" ) }, '"splot" fails' );
+is( $@,
+   qq[Expected any of foo, bar on line 1 at:\n] .
+   qq[splot\n] .
+   qq[^\n],
+   'Exception from "splot" failure' );
diff --git a/t/20maybe.t b/t/20maybe.t
new file mode 100644
index 0000000..e58235f
--- /dev/null
+++ b/t/20maybe.t
@@ -0,0 +1,32 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 4;
+my $die;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->maybe( sub {
+      die $die if $die;
+      $self->token_ident;
+   } ) ||
+      $self->token_int;
+package main;
+my $parser = TestParser->new;
+is( $parser->from_string( "hello" ), "hello", '"hello"' );
+is( $parser->from_string( "123" ), 123, '"123"' );
+$die = "Now have to fail\n";
+ok( !eval { $parser->from_string( "456" ) }, '"456" with $die fails' );
+is( $@, "Now have to fail\n", 'Exception from failure' );
diff --git a/t/21scope_of.t b/t/21scope_of.t
new file mode 100644
index 0000000..fcb7da9
--- /dev/null
+++ b/t/21scope_of.t
@@ -0,0 +1,28 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 3;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->scope_of(
+      "(",
+      sub { return $self->token_int },
+      ")"
+   );
+package main;
+my $parser = TestParser->new;
+is( $parser->from_string( "(123)" ), 123, '"(123)"' );
+ok( !eval { $parser->from_string( "(abc)" ) }, '"(abc)"' );
+ok( !eval { $parser->from_string( "456" ) }, '"456"' );
diff --git a/t/22list_of.t b/t/22list_of.t
new file mode 100644
index 0000000..d3a48be
--- /dev/null
+++ b/t/22list_of.t
@@ -0,0 +1,25 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 3;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->list_of( ",", sub {
+      return $self->token_int;
+   } );
+package main;
+my $parser = TestParser->new;
+is_deeply( $parser->from_string( "123" ), [ 123 ], '"123"' );
+is_deeply( $parser->from_string( "4,5,6" ), [ 4, 5, 6 ], '"4,5,6"' );
+is_deeply( $parser->from_string( "7, 8" ), [ 7, 8 ], '"7, 8"' );
diff --git a/t/23sequence_of.t b/t/23sequence_of.t
new file mode 100644
index 0000000..e91a6e4
--- /dev/null
+++ b/t/23sequence_of.t
@@ -0,0 +1,24 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 2;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->sequence_of( sub {
+      return $self->token_int;
+   } );
+package main;
+my $parser = TestParser->new;
+is_deeply( $parser->from_string( "123" ), [ 123 ], '"123"' );
+is_deeply( $parser->from_string( "4 5 6" ), [ 4, 5, 6 ], '"4 5 6"' );
diff --git a/t/24one_of.t b/t/24one_of.t
new file mode 100644
index 0000000..665e291
--- /dev/null
+++ b/t/24one_of.t
@@ -0,0 +1,33 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 6;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->one_of(
+      sub { [ int => $self->token_int ] },
+      sub { [ str => $self->token_string ] },
+      sub { [ ident => $self->token_ident ] },
+      sub { $self->expect( "@" ); die "Here I fail\n" },
+   );
+package main;
+my $parser = TestParser->new;
+is_deeply( $parser->from_string( "123" ), [ int => 123 ], '"123"' );
+is_deeply( $parser->from_string( q["hi"] ), [ str => "hi" ], '"hi"' );
+is_deeply( $parser->from_string( "foobar" ), [ ident => "foobar" ], '"foobar"' 
+ok( !eval { $parser->from_string( "@" ) }, '"@" fails' );
+is( $@, "Here I fail\n", 'Exception from "@" failure' );
+ok( !eval { $parser->from_string( "+" ) }, '"+" fails' );
diff --git a/t/30commit.t b/t/30commit.t
new file mode 100644
index 0000000..b9080bb
--- /dev/null
+++ b/t/30commit.t
@@ -0,0 +1,39 @@
+#!/usr/bin/perl -w
+use strict;
+use Test::More tests => 4;
+package TestParser;
+use base qw( Parser::MGC );
+sub parse
+   my $self = shift;
+   $self->one_of(
+      sub { $self->token_int },
+      sub {
+         $self->scope_of( "(",
+            sub {
+               $self->commit;
+               $self->token_string;
+            },
+            ")" );
+      }
+   );
+package main;
+my $parser = TestParser->new;
+is( $parser->from_string( "123" ), 123, '"123"' );
+is( $parser->from_string( '("hi")' ), "hi", '("hi")' );
+ok( !eval { $parser->from_string( "(456)" ) }, '"(456)" fails' );
+is( $@,
+   qq[Expected string delimiter on line 1 at:\n].
+   qq[(456)\n].
+   qq[ ^\n],
+   'Exception from "(456)" failure' );
diff --git a/t/99pod.t b/t/99pod.t
new file mode 100644
index 0000000..339b17d
--- /dev/null
+++ b/t/99pod.t
@@ -0,0 +1,8 @@
+#!/usr/bin/perl -w
+use Test::More;
+eval "use Test::Pod 1.00";
+plan skip_all => "Test::Pod 1.00 required for testing POD" if $@;

Alioth's /usr/local/bin/git-commit-notice on 

Pkg-perl-cvs-commits mailing list

Reply via email to