732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
     1  | 
// Parser Combinators: Simple Version
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
     2  | 
//====================================
  | 
| 
742
 | 
     3  | 
//
  | 
| 
906
 | 
     4  | 
// Call with Ammonite (Scala 2.13.10)
  | 
| 
742
 | 
     5  | 
//
  | 
| 
906
 | 
     6  | 
//  amm comb1-2.sc
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
     7  | 
  | 
| 
742
 | 
     8  | 
 
  | 
| 
906
 | 
     9  | 
//  Note, in the lectures I did not show the implicit type bound
  | 
| 
742
 | 
    10  | 
//  I : IsSeq, which means that the input type 'I' needs to be
  | 
| 
 | 
    11  | 
//  a sequence. 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    12  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    13  | 
// Evidence that a value of type A can be viewed as a sequence. It is used
// as a context bound (`I : IsSeq`) so that a parser can ask whether the
// remaining input is empty.
type IsSeq[A] = A => Seq[_]

// Base class of all parsers: consumes input of type I and produces
// results of type T.
abstract class Parser[I : IsSeq, T] {
  // Every way of parsing a prefix of `in`; each result is paired with the
  // part of the input that was not consumed. The empty set means failure.
  def parse(in: I): Set[(T, I)]

  // Only the results of those parses that consumed the whole input.
  def parse_all(in: I): Set[T] =
    parse(in).collect { case (result, rest) if rest.isEmpty => result }
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    22  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    23  | 
// parser combinators
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    24  | 
  | 
| 
799
 | 
    25  | 
// alternative parser
  | 
| 
 | 
    26  | 
// Alternative of two parsers with the same result type. Both arguments are
// by-name, so they are only evaluated when `parse` is called.
class AltParser[I : IsSeq, T](p: => Parser[I, T],
                              q: => Parser[I, T]) extends Parser[I, T] {
  // Runs both alternatives on the same input and keeps every result of either.
  def parse(in: I): Set[(T, I)] = {
    val leftResults = p.parse(in)
    val rightResults = q.parse(in)
    leftResults union rightResults
  }
}
  | 
| 
 | 
    30  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    31  | 
// sequence parser
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    32  | 
// Sequence of two parsers: first p, then q on whatever input p left over.
// The two results are returned as a pair.
class SeqParser[I : IsSeq, T, S](p: => Parser[I, T],
                                 q: => Parser[I, S]) extends Parser[I, (T, S)] {
  // For every result of p, q is run on the remaining input; all
  // combinations are collected.
  def parse(in: I): Set[((T, S), I)] =
    p.parse(in).flatMap { case (first, afterFirst) =>
      q.parse(afterFirst).map { case (second, afterSecond) =>
        ((first, second), afterSecond)
      }
    }
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    38  | 
  | 
| 
742
 | 
    39  | 
// map parser
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    40  | 
// Post-processes the results of parser p with the function f; the
// unconsumed input of each result is passed through unchanged.
class MapParser[I : IsSeq, T, S](p: => Parser[I, T],
                                 f: T => S) extends Parser[I, S] {
  def parse(in: I): Set[(S, I)] =
    p.parse(in).map { case (result, rest) => (f(result), rest) }
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    44  | 
  | 
| 
742
 | 
    45  | 
  | 
| 
 | 
    46  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    47  | 
// an example of an atomic parser for characters
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    48  | 
// Atomic parser that accepts exactly the character c at the start of the
// input and returns it together with the rest of the string.
case class CharParser(c: Char) extends Parser[String, Char] {
  def parse(in: String): Set[(Char, String)] =
    if (in.headOption.contains(c)) Set((c, in.tail)) else Set.empty
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    52  | 
  | 
| 
897
 | 
    53  | 
// Yields the empty set: the input starts with 'a', not with 'c'.
CharParser('c').parse("abc")
 | 
| 
799
 | 
    54  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    55  | 
// an atomic parser for parsing strings according to a regex
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    56  | 
import scala.util.matching.Regex
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    57  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    58  | 
// Atomic parser that accepts a prefix of the input matching the regular
// expression reg. On success the single result is the matched text paired
// with everything after the match; otherwise the result set is empty.
case class RegexParser(reg: Regex) extends Parser[String, String] {
  def parse(in: String): Set[(String, String)] =
    reg.findPrefixMatchOf(in)
      .map(m => (m.matched, m.after.toString))
      .toSet
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    64  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    65  | 
// atomic parsers for numbers and "verbatim" strings 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    66  | 
// Accepts a non-empty run of decimal digits at the start of the input.
val NumParser = RegexParser(new Regex("[0-9]+"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    67  | 
// Accepts exactly the text s at the start of the input; s is quoted first
// so that regex metacharacters in it are matched literally.
def StrParser(s: String) = {
  val literal = Regex.quote(s)
  RegexParser(literal.r)
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    68  | 
  | 
| 
897
 | 
    69  | 
// Yields the empty set: only a prefix is matched and the input starts with 'a'.
NumParser.parse("a123a123bc") 
 | 
| 
 | 
    70  | 
// Yields the empty set: the input starts with "eels", not with "else".
StrParser("else").parse("eelsethen")
 | 
| 
742
 | 
    71  | 
  | 
| 
799
 | 
    72  | 
  | 
| 
906
 | 
    73  | 
// NumParserInt transforms a "string integer" into a proper Int
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    74  | 
// (needs "new" because MapParser is not a case class)
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    75  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    76  | 
// NumParser with its matched digit string converted to an Int.
// NOTE(review): String.toInt throws NumberFormatException when the digit
// run does not fit into an Int -- confirm that such inputs cannot occur.
val NumParserInt = new MapParser[String, String, Int](NumParser, _.toInt)
  | 
| 
897
 | 
    77  | 
// One result: the number 123 with "abc" left unconsumed.
NumParserInt.parse("123abc")
 | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    78  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    79  | 
// the following string interpolation allows us to write 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    80  | 
// StrParser(_some_string_) more conveniently as 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    81  | 
//
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    82  | 
// p"<_some_string_>" 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    83  | 
  | 
| 
897
 | 
    84  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    85  | 
// Enables the p"..." string interpolator: p"text" is shorthand for
// StrParser("text").
//
// Written as an implicit class instead of `implicit def ... = new { ... }`:
// the anonymous-object form gives the conversion a structural result type,
// so every use of `p` becomes a reflective call (slow, and it needs the
// reflectiveCalls language feature). The lower-case name is kept so that the
// generated implicit conversion is still called `parser_interpolation`.
implicit class parser_interpolation(sc: StringContext) {
  // Interpolated arguments are spliced in with the standard `s`
  // interpolator before the resulting text is turned into a parser.
  def p(args: Any*) = StrParser(sc.s(args: _*))
}
  | 
| 
897
 | 
    88  | 
  | 
| 
 | 
    89  | 
// One result: "else" is consumed and "then" is left over.
(p"else").parse("elsethen")           
 | 
| 
799
 | 
    90  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    91  | 
// more convenient syntax for parser combinators
  | 
| 
906
 | 
    92  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    93  | 
// Infix syntax for building parsers:
//   p || q     alternative  (AltParser)
//   p ~ q      sequence     (SeqParser)
//   p.map(f)   result transformation (MapParser)
//
// Written as an implicit class instead of `implicit def ... = new { ... }`:
// the anonymous-object form gives the conversion a structural result type,
// so each of these operators would be invoked reflectively. The implicit
// class generates a conversion with the same name and type parameters.
implicit class ParserOps[I : IsSeq, T](p: Parser[I, T]) {
  // The right-hand parser is by-name so that grammars may refer to
  // parsers that are still being defined (see the lazy vals below).
  def ||(q: => Parser[I, T]): AltParser[I, T] = new AltParser[I, T](p, q)
  def ~[S](q: => Parser[I, S]): SeqParser[I, T, S] = new SeqParser[I, T, S](p, q)
  def map[S](f: => T => S): MapParser[I, T, S] = new MapParser[I, T, S](p, f)
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
    98  | 
  | 
| 
906
 | 
    99  | 
// example
  | 
| 
897
 | 
   100  | 
// Upper-cases a string character by character.
def toU(s: String): String = for (ch <- s) yield ch.toUpper
  | 
| 
 | 
   101  | 
// One result: "ELSE" (already upper case, so toU leaves it as is) with "ifthen" left over.
(p"ELSE").map(toU(_)).parse("ELSEifthen")  
 | 
| 
 | 
   102  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   103  | 
// these implicits allow us to use an infix notation for
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   104  | 
// sequences and alternatives; we also can write the usual
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   105  | 
// map for a MapParser
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   106  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   107  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   108  | 
// with this NumParserInt can now be written more conveniently
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   109  | 
// as:
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   110  | 
  | 
| 
799
 | 
   111  | 
// Same parser as NumParserInt, built with the `map` syntax from ParserOps.
val NumParserInt2 = NumParser.map((digits: String) => digits.toInt)
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   112  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   113  | 
  | 
| 
897
 | 
   114  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   115  | 
// A parser for palindromes (just returns them as string)
  | 
| 
803
 | 
   116  | 
// Grammar: Pal ::= a Pal a | b Pal b | a | b | epsilon
// The result of a parse is the text of the palindrome that was consumed.
lazy val Pal : Parser[String, String] = {
  // c Pal c, with the three matched pieces glued back together
  def enclosedBy(c: String): Parser[String, String] =
    (p"$c" ~ Pal ~ p"$c").map { case ((left, middle), right) => left + middle + right }

  enclosedBy("a") || enclosedBy("b") || p"a" || p"b" || p""
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   121  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   122  | 
// examples
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   123  | 
// The whole input is a palindrome, so the result is the single string "abaaaba".
Pal.parse_all("abaaaba")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   124  | 
// All partial parses: every prefix that is a palindrome (including the
// empty one), each paired with the input it did not consume.
Pal.parse("abaaaba")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   125  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   126  | 
// Prints "Palindrome: Set(abaaaba)".
println("Palindrome: " + Pal.parse_all("abaaaba"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   127  | 
  | 
| 
799
 | 
   128  | 
// A parser for well-nested parentheses
  | 
| 
 | 
   129  | 
//
  | 
| 
 | 
   130  | 
//   P ::= ( P ) P | epsilon
  | 
| 
 | 
   131  | 
//
  | 
| 
 | 
   132  | 
//   (transforms '(' -> '{' , ')' -> '}' )
 | 
| 
 | 
   133  | 
// P ::= ( P ) P | epsilon
// The result is the parsed text with round brackets replaced by curly ones.
lazy val P : Parser[String, String] = {
  val nested = p"(" ~ P ~ p")" ~ P
  nested.map { case (((_, inner), _), rest) => "{" + inner + "}" + rest } || p""
}
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   137  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   138  | 
// Complete parses of P for balanced and unbalanced inputs, printed in the
// same order as before.
List("(((()()))())", "(((()()))()))", ")(", "()").foreach { input =>
  println(P.parse_all(input))
}
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   142  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   143  | 
// A parser for arithmetic expressions (Terms and Factors)
  | 
| 
898
 | 
   144  | 
  | 
| 
799
 | 
   145  | 
// E ::= T + E | T - E | T
// Expressions are evaluated while parsing; the result is the Int value.
lazy val E: Parser[String, Int] = {
  val sum = (T ~ p"+" ~ E).map { case ((lhs, _), rhs) => lhs + rhs }
  def difference = (T ~ p"-" ~ E).map { case ((lhs, _), rhs) => lhs - rhs }
  sum || difference || T
}
 | 
| 
 | 
   148  | 
// T ::= F * T | F
lazy val T: Parser[String, Int] = {
  val product = (F ~ p"*" ~ T).map { case ((lhs, _), rhs) => lhs * rhs }
  product || F
}
 | 
| 
 | 
   150  | 
// F ::= ( E ) | number
lazy val F: Parser[String, Int] = {
  val bracketed = (p"(" ~ E ~ p")").map { case ((_, inner), _) => inner }
  bracketed || NumParserInt
}
 | 
| 
898
 | 
   152  | 
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   153  | 
// Same inputs and same order of output as before: `true` asks for complete
// parses only (parse_all), `false` for all partial parses (parse).
List(
  ("1+3+4", true),
  ("1+3+4", false),
  ("4*2+3", true),
  ("4*(2+3)", true),
  ("(4)*((2+3))", true),
  ("4/2+3", true),
  ("1 + 2 * 3", false),
  ("(1+2)+3", true),
  ("1+2+3", true)
).foreach { case (input, complete) =>
  println(if (complete) E.parse_all(input) else E.parse(input))
}
 | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   162  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   163  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   164  | 
// with parser combinators (and other parsing algorithms)
  | 
| 
906
 | 
   165  | 
// no left-recursion is allowed, otherwise they will loop
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   166  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   167  | 
// Deliberately left-recursive expression grammar: the first two
// alternatives begin with EL itself. It only illustrates the problem;
// the call that would use it is left commented out below.
lazy val EL: Parser[String, Int] = {
  val plus = (EL ~ p"+" ~ EL).map { case ((lhs, _), rhs) => lhs + rhs }
  def times = (EL ~ p"*" ~ EL).map { case ((lhs, _), rhs) => lhs * rhs }
  def parens = (p"(" ~ EL ~ p")").map { case ((_, inner), _) => inner }
  plus || times || parens || NumParserInt
}
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   172  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   173  | 
// this will run forever:
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   174  | 
//println(EL.parse_all("1+2+3"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   175  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   176  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   177  | 
// non-ambiguous vs ambiguous grammars
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   178  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   179  | 
// ambiguous
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   180  | 
// S ::= 1 S S | epsilon
// The result is the text that was consumed.
lazy val S : Parser[String, String] = {
  val branching = (p"1" ~ S ~ S).map { case ((one, left), right) => s"$one$left$right" }
  branching || p""
}
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   182  | 
  | 
| 
850
 | 
   183  | 
//println(time(S.parse("1" * 10)))
 | 
| 
 | 
   184  | 
//println(time(S.parse_all("1" * 10)))
 | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   185  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   186  | 
// non-ambiguous
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   187  | 
// U ::= 1 U | epsilon
// The result is the run of ones that was consumed.
lazy val U : Parser[String, String] = {
  val oneThenMore = (p"1" ~ U).map { case (one, more) => s"$one$more" }
  oneThenMore || p""
}
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   189  | 
  | 
| 
850
 | 
   190  | 
//println(time(U.parse("1" * 10)))
 | 
| 
 | 
   191  | 
//println(time(U.parse_all("1" * 10)))
 | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   192  | 
// Prints all 26 partial parses: every prefix of ones (including the empty
// one) paired with the ones that were not consumed.
println(U.parse("1" * 25))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   193  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   194  | 
// Three results: zero, one or two ones consumed, each with the rest of the input.
U.parse("11")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   195  | 
// Six results: zero to five ones consumed, each with the rest of the input.
U.parse("11111")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   196  | 
// Three results: parsing stops at the '0', so at most the first two ones
// are consumed and the '0' always remains in the unconsumed input.
U.parse("11011")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   197  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   198  | 
// The only complete parse is the whole string of 100 ones.
U.parse_all("1" * 100)
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   199  | 
// Empty set: the trailing "0" can never be consumed, so no parse covers
// the whole input.
U.parse_all("1" * 100 + "0")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   200  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   201  | 
// you can see the difference in the second example
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   202  | 
//S.parse_all("1" * 100)         // succeeds
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   203  | 
//S.parse_all("1" * 100 + "0")   // fails
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   204  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   205  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   206  | 
// A variant which counts how many 1s are parsed
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   207  | 
// Same grammar as U, but the result is the number of ones consumed.
lazy val UCount : Parser[String, Int] = {
  val oneMore = (p"1" ~ UCount).map { case (_, count) => count + 1 }
  def none = p"".map(_ => 0)
  oneMore || none
}
 | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   209  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   210  | 
// Prints the partial parses: each count from 0 to 5 paired with the ones
// that were not consumed.
println(UCount.parse("11111"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   211  | 
// Prints "Set(5)": the only complete parse counts all five ones.
println(UCount.parse_all("11111"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   212  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   213  | 
// Two single character parsers
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   214  | 
// Accepts the literal "a" at the start of the input.
lazy val One : Parser[String, String] = p"a"
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   215  | 
// Accepts the literal "b" at the start of the input.
lazy val Two : Parser[String, String] = p"b"
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   216  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   217  | 
// One result: "a" consumed, nothing left over.
One.parse("a")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   218  | 
// One result: only the first "a" is consumed, "aa" is left over.
One.parse("aaa")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   219  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   220  | 
// note how the pairs nest to the left with sequence parsers
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   221  | 
// One result: the pair ("a", "a") with "a" left over.
(One ~ One).parse("aaa")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   222  | 
// One result: (("a", "a"), "a") with nothing left over.
(One ~ One ~ One).parse("aaa")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   223  | 
// One result: ((("a", "a"), "a"), "a") with nothing left over.
(One ~ One ~ One ~ One).parse("aaaa")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   224  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   225  | 
// One result, contributed by One: "a" consumed, "aa" left over (Two fails on this input).
(One || Two).parse("aaa")
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   226  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   227  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   228  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   229  | 
// a problem with the arithmetic expression parser: it 
  | 
| 
742
 | 
   230  | 
// gets very slow with deeply nested parentheses
  | 
732
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   231  | 
  | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   232  | 
// Partial parses of E for increasingly nested parentheses; the deeper
// cases are left commented out below.
println("Runtime problem")
for (input <- List("1", "(1)", "((1))")) println(E.parse(input))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   236  | 
//println(E.parse("(((1)))"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   237  | 
//println(E.parse("((((1))))"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   238  | 
//println(E.parse("((((((1))))))"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   239  | 
//println(E.parse("(((((((1)))))))"))
 | 
Christian Urban <christian.urban@kcl.ac.uk> 
parents:  
diff
changeset
 
 | 
   240  | 
//println(E.parse("((((((((1))))))))"))
 | 
| 
828
 | 
   241  | 
  |