thys2/blexer2.sc
author Chengsong
Tue, 17 May 2022 00:54:29 +0100
changeset 514 036600af4c30
parent 500 4d9eecfc936a
child 516 6fecb7fe8cd0
permissions -rw-r--r--
chapter2
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
431
Chengsong
parents:
diff changeset
     1
// A simple lexer inspired by work of Sulzmann & Lu
Chengsong
parents:
diff changeset
     2
//==================================================
Chengsong
parents:
diff changeset
     3
//
Chengsong
parents:
diff changeset
     4
// Call the test cases with 
Chengsong
parents:
diff changeset
     5
//
Chengsong
parents:
diff changeset
     6
//   amm lexer.sc small
Chengsong
parents:
diff changeset
     7
//   amm lexer.sc fib
Chengsong
parents:
diff changeset
     8
//   amm lexer.sc loops
Chengsong
parents:
diff changeset
     9
//   amm lexer.sc email
Chengsong
parents:
diff changeset
    10
//
Chengsong
parents:
diff changeset
    11
//   amm lexer.sc all
Chengsong
parents:
diff changeset
    12
514
036600af4c30 chapter2
Chengsong
parents: 500
diff changeset
    13
431
Chengsong
parents:
diff changeset
    14
Chengsong
parents:
diff changeset
    15
// regular expressions including records
Chengsong
parents:
diff changeset
    16
abstract class Rexp 
Chengsong
parents:
diff changeset
    17
case object ZERO extends Rexp
Chengsong
parents:
diff changeset
    18
case object ONE extends Rexp
Chengsong
parents:
diff changeset
    19
case object ANYCHAR extends Rexp
Chengsong
parents:
diff changeset
    20
case class CHAR(c: Char) extends Rexp
Chengsong
parents:
diff changeset
    21
case class ALTS(r1: Rexp, r2: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    22
case class SEQ(r1: Rexp, r2: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    23
case class STAR(r: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    24
case class RECD(x: String, r: Rexp) extends Rexp  
Chengsong
parents:
diff changeset
    25
case class NTIMES(n: Int, r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    26
case class OPTIONAL(r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    27
case class NOT(r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    28
                // records for extracting strings or tokens
Chengsong
parents:
diff changeset
    29
  
Chengsong
parents:
diff changeset
    30
// values  
Chengsong
parents:
diff changeset
    31
abstract class Val
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    32
case object Failure extends Val
431
Chengsong
parents:
diff changeset
    33
case object Empty extends Val
Chengsong
parents:
diff changeset
    34
case class Chr(c: Char) extends Val
Chengsong
parents:
diff changeset
    35
case class Sequ(v1: Val, v2: Val) extends Val
Chengsong
parents:
diff changeset
    36
case class Left(v: Val) extends Val
Chengsong
parents:
diff changeset
    37
case class Right(v: Val) extends Val
Chengsong
parents:
diff changeset
    38
case class Stars(vs: List[Val]) extends Val
Chengsong
parents:
diff changeset
    39
case class Rec(x: String, v: Val) extends Val
Chengsong
parents:
diff changeset
    40
case class Ntime(vs: List[Val]) extends Val
Chengsong
parents:
diff changeset
    41
case class Optionall(v: Val) extends Val
Chengsong
parents:
diff changeset
    42
case class Nots(s: String) extends Val
Chengsong
parents:
diff changeset
    43
Chengsong
parents:
diff changeset
    44
Chengsong
parents:
diff changeset
    45
Chengsong
parents:
diff changeset
    46
abstract class Bit
Chengsong
parents:
diff changeset
    47
case object Z extends Bit
Chengsong
parents:
diff changeset
    48
case object S extends Bit
Chengsong
parents:
diff changeset
    49
Chengsong
parents:
diff changeset
    50
Chengsong
parents:
diff changeset
    51
type Bits = List[Bit]
Chengsong
parents:
diff changeset
    52
Chengsong
parents:
diff changeset
    53
abstract class ARexp 
Chengsong
parents:
diff changeset
    54
case object AZERO extends ARexp
Chengsong
parents:
diff changeset
    55
case class AONE(bs: Bits) extends ARexp
Chengsong
parents:
diff changeset
    56
case class ACHAR(bs: Bits, c: Char) extends ARexp
Chengsong
parents:
diff changeset
    57
case class AALTS(bs: Bits, rs: List[ARexp]) extends ARexp 
Chengsong
parents:
diff changeset
    58
case class ASEQ(bs: Bits, r1: ARexp, r2: ARexp) extends ARexp 
Chengsong
parents:
diff changeset
    59
case class ASTAR(bs: Bits, r: ARexp) extends ARexp 
Chengsong
parents:
diff changeset
    60
case class ANOT(bs: Bits, r: ARexp) extends ARexp
Chengsong
parents:
diff changeset
    61
case class AANYCHAR(bs: Bits) extends ARexp
Chengsong
parents:
diff changeset
    62
514
036600af4c30 chapter2
Chengsong
parents: 500
diff changeset
    63
import scala.util.Try
036600af4c30 chapter2
Chengsong
parents: 500
diff changeset
    64
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    65
trait Generator[+T] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    66
    self => // an alias for "this"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    67
    def generate(): T
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    68
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    69
    def gen(n: Int) : List[T] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    70
      if (n == 0) Nil else self.generate() :: gen(n - 1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    71
    
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    72
    def map[S](f: T => S): Generator[S] = new Generator[S] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    73
      def generate = f(self.generate())  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    74
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    75
    def flatMap[S](f: T => Generator[S]): Generator[S] = new Generator[S] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    76
      def generate = f(self.generate()).generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    77
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    78
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    79
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    80
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    81
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    82
  // tests a property according to a given random generator
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    83
  def test[T](r: Generator[T], amount: Int = 100)(pred: T => Boolean) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    84
    for (_ <- 0 until amount) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    85
      val value = r.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    86
      assert(pred(value), s"Test failed for: $value")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    87
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    88
    println(s"Test passed $amount times")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    89
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    90
  def test2[T, S](r: Generator[T], s: Generator[S], amount: Int = 100)(pred: (T, S) => Boolean) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    91
    for (_ <- 0 until amount) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    92
      val valueR = r.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    93
      val valueS = s.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    94
      assert(pred(valueR, valueS), s"Test failed for: $valueR, $valueS")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    95
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    96
    println(s"Test passed $amount times")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    97
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    98
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    99
// random integers
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   100
val integers = new Generator[Int] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   101
  val rand = new java.util.Random
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   102
  def generate() = rand.nextInt()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   103
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   104
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   105
// random booleans
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   106
val booleans = integers.map(_ > 0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   107
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   108
// random integers in the range lo and high  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   109
def range(lo: Int, hi: Int): Generator[Int] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   110
  for (x <- integers) yield (lo + x.abs % (hi - lo)).abs
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   111
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   112
// random characters
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   113
def chars_range(lo: Char, hi: Char) = range(lo, hi).map(_.toChar)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   114
val chars = chars_range('a', 'z')
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   115
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   116
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   117
def oneOf[T](xs: T*): Generator[T] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   118
  for (idx <- range(0, xs.length)) yield xs(idx)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   119
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   120
def single[T](x: T) = new Generator[T] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   121
  def generate() = x
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   122
}   
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   123
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   124
def pairs[T, U](t: Generator[T], u: Generator[U]): Generator[(T, U)] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   125
  for (x <- t; y <- u) yield (x, y)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   126
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   127
// lists
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   128
def emptyLists = single(Nil) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   129
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   130
def nonEmptyLists : Generator[List[Int]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   131
  for (head <- integers; tail <- lists) yield head :: tail
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   132
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   133
def lists: Generator[List[Int]] = for {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   134
  kind <- booleans
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   135
  list <- if (kind) emptyLists else nonEmptyLists
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   136
} yield list
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   137
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   138
def char_list(len: Int): Generator[List[Char]] = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   139
  if(len <= 0) single(Nil)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   140
  else{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   141
    for { 
500
Chengsong
parents: 494
diff changeset
   142
      c <- chars_range('a', 'c')
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   143
      tail <- char_list(len - 1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   144
    } yield c :: tail
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   145
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   146
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   147
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   148
def strings(len: Int): Generator[String] = for(cs <- char_list(len)) yield cs.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   149
493
Chengsong
parents: 492
diff changeset
   150
def sampleString(r: Rexp) : List[String] = r match {
Chengsong
parents: 492
diff changeset
   151
  case STAR(r) => stringsFromRexp(r).flatMap(s => List("", s, s ++ s))//only generate 0, 1, 2 reptitions
Chengsong
parents: 492
diff changeset
   152
  case SEQ(r1, r2) => stringsFromRexp(r1).flatMap(s1 => stringsFromRexp(r2).map(s2 => s1 ++ s2) )
Chengsong
parents: 492
diff changeset
   153
  case ALTS(r1, r2) => throw new Error(s" Rexp ${r} not expected: all alternatives are supposed to have been opened up")
Chengsong
parents: 492
diff changeset
   154
  case ONE => "" :: Nil
Chengsong
parents: 492
diff changeset
   155
  case ZERO => Nil
Chengsong
parents: 492
diff changeset
   156
  case CHAR(c) => c.toString :: Nil
Chengsong
parents: 492
diff changeset
   157
Chengsong
parents: 492
diff changeset
   158
}
Chengsong
parents: 492
diff changeset
   159
Chengsong
parents: 492
diff changeset
   160
def stringsFromRexp(r: Rexp) : List[String] = 
Chengsong
parents: 492
diff changeset
   161
  breakIntoTerms(r).flatMap(r => sampleString(r))
Chengsong
parents: 492
diff changeset
   162
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   163
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   164
// (simple) binary trees
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   165
trait Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   166
case class Inner[T](left: Tree[T], right: Tree[T]) extends Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   167
case class Leaf[T](x: T) extends Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   168
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   169
def leafs[T](t: Generator[T]): Generator[Leaf[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   170
  for (x <- t) yield Leaf(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   171
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   172
def inners[T](t: Generator[T]): Generator[Inner[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   173
  for (l <- trees(t); r <- trees(t)) yield Inner(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   174
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   175
def trees[T](t: Generator[T]): Generator[Tree[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   176
  for (kind <- range(0, 2);  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   177
       tree <- if (kind == 0) leafs(t) else inners(t)) yield tree
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   178
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   179
// regular expressions
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   180
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   181
// generates random leaf-regexes; prefers CHAR-regexes
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   182
def leaf_rexp() : Generator[Rexp] =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   183
  for (kind <- range(0, 5);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   184
       c <- chars_range('a', 'd')) yield
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   185
    kind match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   186
      case 0 => ZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   187
      case 1 => ONE
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   188
      case _ => CHAR(c) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   189
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   190
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   191
// generates random inner regexes with maximum depth d
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   192
def inner_rexp(d: Int) : Generator[Rexp] =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   193
  for (kind <- range(0, 3);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   194
       l <- rexp(d); 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   195
       r <- rexp(d))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   196
  yield kind match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   197
    case 0 => ALTS(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   198
    case 1 => SEQ(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   199
    case 2 => STAR(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   200
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   201
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   202
// generates random regexes with maximum depth d;
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   203
// prefers inner regexes in 2/3 of the cases
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   204
def rexp(d: Int = 100): Generator[Rexp] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   205
  for (kind <- range(0, 3);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   206
       r <- if (d <= 0 || kind == 0) leaf_rexp() else inner_rexp(d - 1)) yield r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   207
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   208
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   209
// some test functions for rexps
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   210
def height(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   211
  case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   212
  case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   213
  case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   214
  case ALTS(r1, r2) => 1 + List(height(r1), height(r2)).max
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   215
  case SEQ(r1, r2) =>  1 + List(height(r1), height(r2)).max
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   216
  case STAR(r) => 1 + height(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   217
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   218
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   219
// def size(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   220
//   case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   221
//   case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   222
//   case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   223
//   case ALTS(r1, r2) => 1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   224
//   case SEQ(r1, r2) =>  1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   225
//   case STAR(r) => 1 + size(r) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   226
// }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   227
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   228
// randomly subtracts 1 or 2 from the STAR case
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   229
def size_faulty(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   230
  case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   231
  case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   232
  case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   233
  case ALTS(r1, r2) => 1 + size_faulty(r1) + size_faulty(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   234
  case SEQ(r1, r2) =>  1 + size_faulty(r1) + size_faulty(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   235
  case STAR(r) => 1 + size_faulty(r) - range(0, 2).generate
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   236
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   237
431
Chengsong
parents:
diff changeset
   238
Chengsong
parents:
diff changeset
   239
   
Chengsong
parents:
diff changeset
   240
// some convenience for typing in regular expressions
Chengsong
parents:
diff changeset
   241
Chengsong
parents:
diff changeset
   242
def charlist2rexp(s : List[Char]): Rexp = s match {
Chengsong
parents:
diff changeset
   243
  case Nil => ONE
Chengsong
parents:
diff changeset
   244
  case c::Nil => CHAR(c)
Chengsong
parents:
diff changeset
   245
  case c::s => SEQ(CHAR(c), charlist2rexp(s))
Chengsong
parents:
diff changeset
   246
}
Chengsong
parents:
diff changeset
   247
implicit def string2rexp(s : String) : Rexp = 
Chengsong
parents:
diff changeset
   248
  charlist2rexp(s.toList)
Chengsong
parents:
diff changeset
   249
Chengsong
parents:
diff changeset
   250
implicit def RexpOps(r: Rexp) = new {
Chengsong
parents:
diff changeset
   251
  def | (s: Rexp) = ALTS(r, s)
Chengsong
parents:
diff changeset
   252
  def % = STAR(r)
Chengsong
parents:
diff changeset
   253
  def ~ (s: Rexp) = SEQ(r, s)
Chengsong
parents:
diff changeset
   254
}
Chengsong
parents:
diff changeset
   255
Chengsong
parents:
diff changeset
   256
implicit def stringOps(s: String) = new {
Chengsong
parents:
diff changeset
   257
  def | (r: Rexp) = ALTS(s, r)
Chengsong
parents:
diff changeset
   258
  def | (r: String) = ALTS(s, r)
Chengsong
parents:
diff changeset
   259
  def % = STAR(s)
Chengsong
parents:
diff changeset
   260
  def ~ (r: Rexp) = SEQ(s, r)
Chengsong
parents:
diff changeset
   261
  def ~ (r: String) = SEQ(s, r)
Chengsong
parents:
diff changeset
   262
  def $ (r: Rexp) = RECD(s, r)
Chengsong
parents:
diff changeset
   263
}
Chengsong
parents:
diff changeset
   264
Chengsong
parents:
diff changeset
   265
def nullable(r: Rexp) : Boolean = r match {
Chengsong
parents:
diff changeset
   266
  case ZERO => false
Chengsong
parents:
diff changeset
   267
  case ONE => true
Chengsong
parents:
diff changeset
   268
  case CHAR(_) => false
Chengsong
parents:
diff changeset
   269
  case ANYCHAR => false
Chengsong
parents:
diff changeset
   270
  case ALTS(r1, r2) => nullable(r1) || nullable(r2)
Chengsong
parents:
diff changeset
   271
  case SEQ(r1, r2) => nullable(r1) && nullable(r2)
Chengsong
parents:
diff changeset
   272
  case STAR(_) => true
Chengsong
parents:
diff changeset
   273
  case RECD(_, r1) => nullable(r1)
Chengsong
parents:
diff changeset
   274
  case NTIMES(n, r) => if (n == 0) true else nullable(r)
Chengsong
parents:
diff changeset
   275
  case OPTIONAL(r) => true
Chengsong
parents:
diff changeset
   276
  case NOT(r) => !nullable(r)
Chengsong
parents:
diff changeset
   277
}
Chengsong
parents:
diff changeset
   278
Chengsong
parents:
diff changeset
   279
def der(c: Char, r: Rexp) : Rexp = r match {
Chengsong
parents:
diff changeset
   280
  case ZERO => ZERO
Chengsong
parents:
diff changeset
   281
  case ONE => ZERO
Chengsong
parents:
diff changeset
   282
  case CHAR(d) => if (c == d) ONE else ZERO
Chengsong
parents:
diff changeset
   283
  case ANYCHAR => ONE 
Chengsong
parents:
diff changeset
   284
  case ALTS(r1, r2) => ALTS(der(c, r1), der(c, r2))
Chengsong
parents:
diff changeset
   285
  case SEQ(r1, r2) => 
Chengsong
parents:
diff changeset
   286
    if (nullable(r1)) ALTS(SEQ(der(c, r1), r2), der(c, r2))
Chengsong
parents:
diff changeset
   287
    else SEQ(der(c, r1), r2)
Chengsong
parents:
diff changeset
   288
  case STAR(r) => SEQ(der(c, r), STAR(r))
Chengsong
parents:
diff changeset
   289
  case RECD(_, r1) => der(c, r1)
Chengsong
parents:
diff changeset
   290
  case NTIMES(n, r) => if(n > 0) SEQ(der(c, r), NTIMES(n - 1, r)) else ZERO
Chengsong
parents:
diff changeset
   291
  case OPTIONAL(r) => der(c, r)
Chengsong
parents:
diff changeset
   292
  case NOT(r) =>  NOT(der(c, r))
Chengsong
parents:
diff changeset
   293
}
Chengsong
parents:
diff changeset
   294
Chengsong
parents:
diff changeset
   295
Chengsong
parents:
diff changeset
   296
// extracts a string from a value
Chengsong
parents:
diff changeset
   297
def flatten(v: Val) : String = v match {
Chengsong
parents:
diff changeset
   298
  case Empty => ""
Chengsong
parents:
diff changeset
   299
  case Chr(c) => c.toString
Chengsong
parents:
diff changeset
   300
  case Left(v) => flatten(v)
Chengsong
parents:
diff changeset
   301
  case Right(v) => flatten(v)
Chengsong
parents:
diff changeset
   302
  case Sequ(v1, v2) => flatten(v1) ++ flatten(v2)
Chengsong
parents:
diff changeset
   303
  case Stars(vs) => vs.map(flatten).mkString
Chengsong
parents:
diff changeset
   304
  case Ntime(vs) => vs.map(flatten).mkString
Chengsong
parents:
diff changeset
   305
  case Optionall(v) => flatten(v)
Chengsong
parents:
diff changeset
   306
  case Rec(_, v) => flatten(v)
Chengsong
parents:
diff changeset
   307
}
Chengsong
parents:
diff changeset
   308
Chengsong
parents:
diff changeset
   309
Chengsong
parents:
diff changeset
   310
// extracts an environment from a value;
Chengsong
parents:
diff changeset
   311
// used for tokenising a string
Chengsong
parents:
diff changeset
   312
def env(v: Val) : List[(String, String)] = v match {
Chengsong
parents:
diff changeset
   313
  case Empty => Nil
Chengsong
parents:
diff changeset
   314
  case Chr(c) => Nil
Chengsong
parents:
diff changeset
   315
  case Left(v) => env(v)
Chengsong
parents:
diff changeset
   316
  case Right(v) => env(v)
Chengsong
parents:
diff changeset
   317
  case Sequ(v1, v2) => env(v1) ::: env(v2)
Chengsong
parents:
diff changeset
   318
  case Stars(vs) => vs.flatMap(env)
Chengsong
parents:
diff changeset
   319
  case Ntime(vs) => vs.flatMap(env)
Chengsong
parents:
diff changeset
   320
  case Rec(x, v) => (x, flatten(v))::env(v)
Chengsong
parents:
diff changeset
   321
  case Optionall(v) => env(v)
Chengsong
parents:
diff changeset
   322
  case Nots(s) => ("Negative", s) :: Nil
Chengsong
parents:
diff changeset
   323
}
Chengsong
parents:
diff changeset
   324
Chengsong
parents:
diff changeset
   325
Chengsong
parents:
diff changeset
   326
// The injection and mkeps part of the lexer
Chengsong
parents:
diff changeset
   327
//===========================================
Chengsong
parents:
diff changeset
   328
Chengsong
parents:
diff changeset
   329
def mkeps(r: Rexp) : Val = r match {
Chengsong
parents:
diff changeset
   330
  case ONE => Empty
Chengsong
parents:
diff changeset
   331
  case ALTS(r1, r2) => 
Chengsong
parents:
diff changeset
   332
    if (nullable(r1)) Left(mkeps(r1)) else Right(mkeps(r2))
Chengsong
parents:
diff changeset
   333
  case SEQ(r1, r2) => Sequ(mkeps(r1), mkeps(r2))
Chengsong
parents:
diff changeset
   334
  case STAR(r) => Stars(Nil)
Chengsong
parents:
diff changeset
   335
  case RECD(x, r) => Rec(x, mkeps(r))
Chengsong
parents:
diff changeset
   336
  case NTIMES(n, r) => Ntime(List.fill(n)(mkeps(r)))
Chengsong
parents:
diff changeset
   337
  case OPTIONAL(r) => Optionall(Empty)
Chengsong
parents:
diff changeset
   338
  case NOT(rInner) => if(nullable(rInner)) throw new Exception("error")  
Chengsong
parents:
diff changeset
   339
                         else Nots("")//Nots(s.reverse.toString)
Chengsong
parents:
diff changeset
   340
//   case NOT(ZERO) => Empty
Chengsong
parents:
diff changeset
   341
//   case NOT(CHAR(c)) => Empty
Chengsong
parents:
diff changeset
   342
//   case NOT(SEQ(r1, r2)) => Sequ(mkeps(NOT(r1)), mkeps(NOT(r2)))
Chengsong
parents:
diff changeset
   343
//   case NOT(ALTS(r1, r2)) => if(!nullable(r1)) Left(mkeps(NOT(r1))) else Right(mkeps(NOT(r2)))
Chengsong
parents:
diff changeset
   344
//   case NOT(STAR(r)) => Stars(Nil) 
Chengsong
parents:
diff changeset
   345
Chengsong
parents:
diff changeset
   346
}
Chengsong
parents:
diff changeset
   347
Chengsong
parents:
diff changeset
   348
def inj(r: Rexp, c: Char, v: Val) : Val = (r, v) match {
Chengsong
parents:
diff changeset
   349
  case (STAR(r), Sequ(v1, Stars(vs))) => Stars(inj(r, c, v1)::vs)
Chengsong
parents:
diff changeset
   350
  case (SEQ(r1, r2), Sequ(v1, v2)) => Sequ(inj(r1, c, v1), v2)
Chengsong
parents:
diff changeset
   351
  case (SEQ(r1, r2), Left(Sequ(v1, v2))) => Sequ(inj(r1, c, v1), v2)
Chengsong
parents:
diff changeset
   352
  case (SEQ(r1, r2), Right(v2)) => Sequ(mkeps(r1), inj(r2, c, v2))
Chengsong
parents:
diff changeset
   353
  case (ALTS(r1, r2), Left(v1)) => Left(inj(r1, c, v1))
Chengsong
parents:
diff changeset
   354
  case (ALTS(r1, r2), Right(v2)) => Right(inj(r2, c, v2))
Chengsong
parents:
diff changeset
   355
  case (CHAR(d), Empty) => Chr(c) 
Chengsong
parents:
diff changeset
   356
  case (RECD(x, r1), _) => Rec(x, inj(r1, c, v))
Chengsong
parents:
diff changeset
   357
  case (NTIMES(n, r), Sequ(v1, Ntime(vs))) => Ntime(inj(r, c, v1)::vs)
Chengsong
parents:
diff changeset
   358
  case (OPTIONAL(r), v) => Optionall(inj(r, c, v))
Chengsong
parents:
diff changeset
   359
  case (NOT(r), Nots(s)) => Nots(c.toString ++ s)
Chengsong
parents:
diff changeset
   360
  case (ANYCHAR, Empty) => Chr(c)
Chengsong
parents:
diff changeset
   361
}
Chengsong
parents:
diff changeset
   362
Chengsong
parents:
diff changeset
   363
// some "rectification" functions for simplification
Chengsong
parents:
diff changeset
   364
Chengsong
parents:
diff changeset
   365
Chengsong
parents:
diff changeset
   366
Chengsong
parents:
diff changeset
   367
Chengsong
parents:
diff changeset
   368
// The Lexing Rules for the WHILE Language
Chengsong
parents:
diff changeset
   369
Chengsong
parents:
diff changeset
   370
  // bnullable function: tests whether the aregular 
Chengsong
parents:
diff changeset
   371
  // expression can recognise the empty string
Chengsong
parents:
diff changeset
   372
def bnullable (r: ARexp) : Boolean = r match {
Chengsong
parents:
diff changeset
   373
    case AZERO => false
Chengsong
parents:
diff changeset
   374
    case AONE(_) => true
Chengsong
parents:
diff changeset
   375
    case ACHAR(_,_) => false
Chengsong
parents:
diff changeset
   376
    case AALTS(_, rs) => rs.exists(bnullable)
Chengsong
parents:
diff changeset
   377
    case ASEQ(_, r1, r2) => bnullable(r1) && bnullable(r2)
Chengsong
parents:
diff changeset
   378
    case ASTAR(_, _) => true
Chengsong
parents:
diff changeset
   379
    case ANOT(_, rn) => !bnullable(rn)
Chengsong
parents:
diff changeset
   380
  }
Chengsong
parents:
diff changeset
   381
Chengsong
parents:
diff changeset
   382
def mkepsBC(r: ARexp) : Bits = r match {
Chengsong
parents:
diff changeset
   383
    case AONE(bs) => bs
Chengsong
parents:
diff changeset
   384
    case AALTS(bs, rs) => {
Chengsong
parents:
diff changeset
   385
      val n = rs.indexWhere(bnullable)
Chengsong
parents:
diff changeset
   386
      bs ++ mkepsBC(rs(n))
Chengsong
parents:
diff changeset
   387
    }
Chengsong
parents:
diff changeset
   388
    case ASEQ(bs, r1, r2) => bs ++ mkepsBC(r1) ++ mkepsBC(r2)
Chengsong
parents:
diff changeset
   389
    case ASTAR(bs, r) => bs ++ List(Z)
Chengsong
parents:
diff changeset
   390
    case ANOT(bs, rn) => bs
Chengsong
parents:
diff changeset
   391
  }
Chengsong
parents:
diff changeset
   392
Chengsong
parents:
diff changeset
   393
Chengsong
parents:
diff changeset
   394
def bder(c: Char, r: ARexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   395
    case AZERO => AZERO
Chengsong
parents:
diff changeset
   396
    case AONE(_) => AZERO
Chengsong
parents:
diff changeset
   397
    case ACHAR(bs, f) => if (c == f) AONE(bs) else AZERO
Chengsong
parents:
diff changeset
   398
    case AALTS(bs, rs) => AALTS(bs, rs.map(bder(c, _)))
Chengsong
parents:
diff changeset
   399
    case ASEQ(bs, r1, r2) => 
Chengsong
parents:
diff changeset
   400
      if (bnullable(r1)) AALTS(bs, ASEQ(Nil, bder(c, r1), r2) :: fuse(mkepsBC(r1), bder(c, r2)) :: Nil )
Chengsong
parents:
diff changeset
   401
      else ASEQ(bs, bder(c, r1), r2)
Chengsong
parents:
diff changeset
   402
    case ASTAR(bs, r) => ASEQ(bs, fuse(List(S), bder(c, r)), ASTAR(Nil, r))
Chengsong
parents:
diff changeset
   403
    case ANOT(bs, rn) => ANOT(bs, bder(c, rn))
Chengsong
parents:
diff changeset
   404
    case AANYCHAR(bs) => AONE(bs)
Chengsong
parents:
diff changeset
   405
  } 
Chengsong
parents:
diff changeset
   406
Chengsong
parents:
diff changeset
   407
def fuse(bs: Bits, r: ARexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   408
    case AZERO => AZERO
Chengsong
parents:
diff changeset
   409
    case AONE(cs) => AONE(bs ++ cs)
Chengsong
parents:
diff changeset
   410
    case ACHAR(cs, f) => ACHAR(bs ++ cs, f)
Chengsong
parents:
diff changeset
   411
    case AALTS(cs, rs) => AALTS(bs ++ cs, rs)
Chengsong
parents:
diff changeset
   412
    case ASEQ(cs, r1, r2) => ASEQ(bs ++ cs, r1, r2)
Chengsong
parents:
diff changeset
   413
    case ASTAR(cs, r) => ASTAR(bs ++ cs, r)
Chengsong
parents:
diff changeset
   414
    case ANOT(cs, r) => ANOT(bs ++ cs, r)
Chengsong
parents:
diff changeset
   415
  }
Chengsong
parents:
diff changeset
   416
Chengsong
parents:
diff changeset
   417
Chengsong
parents:
diff changeset
   418
def internalise(r: Rexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   419
    case ZERO => AZERO
Chengsong
parents:
diff changeset
   420
    case ONE => AONE(Nil)
Chengsong
parents:
diff changeset
   421
    case CHAR(c) => ACHAR(Nil, c)
Chengsong
parents:
diff changeset
   422
    //case PRED(f) => APRED(Nil, f)
Chengsong
parents:
diff changeset
   423
    case ALTS(r1, r2) => 
Chengsong
parents:
diff changeset
   424
      AALTS(Nil, List(fuse(List(Z), internalise(r1)), fuse(List(S), internalise(r2))))
Chengsong
parents:
diff changeset
   425
    // case ALTS(r1::rs) => {
Chengsong
parents:
diff changeset
   426
    //   val AALTS(Nil, rs2) = internalise(ALTS(rs))
Chengsong
parents:
diff changeset
   427
    //   AALTS(Nil, fuse(List(Z), internalise(r1)) :: rs2.map(fuse(List(S), _)))
Chengsong
parents:
diff changeset
   428
    // }
Chengsong
parents:
diff changeset
   429
    case SEQ(r1, r2) => ASEQ(Nil, internalise(r1), internalise(r2))
Chengsong
parents:
diff changeset
   430
    case STAR(r) => ASTAR(Nil, internalise(r))
Chengsong
parents:
diff changeset
   431
    case RECD(x, r) => internalise(r)
Chengsong
parents:
diff changeset
   432
    case NOT(r) => ANOT(Nil, internalise(r))
Chengsong
parents:
diff changeset
   433
    case ANYCHAR => AANYCHAR(Nil)
Chengsong
parents:
diff changeset
   434
  }
Chengsong
parents:
diff changeset
   435
Chengsong
parents:
diff changeset
   436
Chengsong
parents:
diff changeset
   437
def bsimp(r: ARexp): ARexp = 
Chengsong
parents:
diff changeset
   438
  {
Chengsong
parents:
diff changeset
   439
    r match {
Chengsong
parents:
diff changeset
   440
      case ASEQ(bs1, r1, r2) => (bsimp(r1), bsimp(r2)) match {
Chengsong
parents:
diff changeset
   441
          case (AZERO, _) => AZERO
Chengsong
parents:
diff changeset
   442
          case (_, AZERO) => AZERO
Chengsong
parents:
diff changeset
   443
          case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
Chengsong
parents:
diff changeset
   444
          case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
Chengsong
parents:
diff changeset
   445
      }
Chengsong
parents:
diff changeset
   446
      case AALTS(bs1, rs) => {
Chengsong
parents:
diff changeset
   447
            val rs_simp = rs.map(bsimp(_))
Chengsong
parents:
diff changeset
   448
            val flat_res = flats(rs_simp)
Chengsong
parents:
diff changeset
   449
            val dist_res = distinctBy(flat_res, erase)//strongDB(flat_res)//distinctBy(flat_res, erase)
Chengsong
parents:
diff changeset
   450
            dist_res match {
Chengsong
parents:
diff changeset
   451
              case Nil => AZERO
Chengsong
parents:
diff changeset
   452
              case s :: Nil => fuse(bs1, s)
Chengsong
parents:
diff changeset
   453
              case rs => AALTS(bs1, rs)  
Chengsong
parents:
diff changeset
   454
            }
Chengsong
parents:
diff changeset
   455
          
Chengsong
parents:
diff changeset
   456
      }
Chengsong
parents:
diff changeset
   457
      case r => r
Chengsong
parents:
diff changeset
   458
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   459
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   460
def strongBsimp(r: ARexp): ARexp =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   461
{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   462
  r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   463
    case ASEQ(bs1, r1, r2) => (strongBsimp(r1), strongBsimp(r2)) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   464
        case (AZERO, _) => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   465
        case (_, AZERO) => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   466
        case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   467
        case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
431
Chengsong
parents:
diff changeset
   468
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   469
    case AALTS(bs1, rs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   470
          val rs_simp = rs.map(strongBsimp(_))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   471
          val flat_res = flats(rs_simp)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   472
          val dist_res = distinctBy4(flat_res)//distinctBy(flat_res, erase)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   473
          dist_res match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   474
            case Nil => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   475
            case s :: Nil => fuse(bs1, s)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   476
            case rs => AALTS(bs1, rs)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   477
          }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   478
        
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   479
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   480
    case r => r
431
Chengsong
parents:
diff changeset
   481
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   482
}
431
Chengsong
parents:
diff changeset
   483
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   484
def strongBsimp5(r: ARexp): ARexp =
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   485
{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   486
  // println("was this called?")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   487
  r match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   488
    case ASEQ(bs1, r1, r2) => (strongBsimp5(r1), strongBsimp5(r2)) match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   489
        case (AZERO, _) => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   490
        case (_, AZERO) => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   491
        case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   492
        case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   493
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   494
    case AALTS(bs1, rs) => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   495
        // println("alts case")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   496
          val rs_simp = rs.map(strongBsimp5(_))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   497
          val flat_res = flats(rs_simp)
500
Chengsong
parents: 494
diff changeset
   498
          var dist_res = distinctBy5(flat_res)//distinctBy(flat_res, erase)
Chengsong
parents: 494
diff changeset
   499
          var dist2_res = distinctBy5(dist_res)
Chengsong
parents: 494
diff changeset
   500
          while(dist_res != dist2_res){
Chengsong
parents: 494
diff changeset
   501
            dist_res = dist2_res
Chengsong
parents: 494
diff changeset
   502
            dist2_res = distinctBy5(dist_res)
Chengsong
parents: 494
diff changeset
   503
          }
Chengsong
parents: 494
diff changeset
   504
          (dist2_res) match {
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   505
            case Nil => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   506
            case s :: Nil => fuse(bs1, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   507
            case rs => AALTS(bs1, rs)  
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   508
          }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   509
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   510
    case r => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   511
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   512
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   513
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   514
def bders (s: List[Char], r: ARexp) : ARexp = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   515
  case Nil => r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   516
  case c::s => bders(s, bder(c, r))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   517
}
431
Chengsong
parents:
diff changeset
   518
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   519
def flats(rs: List[ARexp]): List[ARexp] = rs match {
431
Chengsong
parents:
diff changeset
   520
    case Nil => Nil
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   521
    case AZERO :: rs1 => flats(rs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   522
    case AALTS(bs, rs1) :: rs2 => rs1.map(fuse(bs, _)) ::: flats(rs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   523
    case r1 :: rs2 => r1 :: flats(rs2)
431
Chengsong
parents:
diff changeset
   524
  }
Chengsong
parents:
diff changeset
   525
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   526
def distinctBy[B, C](xs: List[B], f: B => C, acc: List[C] = Nil): List[B] = xs match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   527
  case Nil => Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   528
  case (x::xs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   529
    val res = f(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   530
    if (acc.contains(res)) distinctBy(xs, f, acc)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   531
    else x::distinctBy(xs, f, res::acc)
431
Chengsong
parents:
diff changeset
   532
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   533
} 
431
Chengsong
parents:
diff changeset
   534
Chengsong
parents:
diff changeset
   535
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   536
def pruneRexp(r: ARexp, allowableTerms: List[Rexp]) : ARexp = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   537
  r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   538
    case ASEQ(bs, r1, r2) => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   539
      val termsTruncated = allowableTerms.collect(rt => rt match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   540
        case SEQ(r1p, r2p) if(r2p == erase(r2)) => r1p//if(r2p == erase(r2)) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   541
      })
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   542
      val pruned : ARexp = pruneRexp(r1, termsTruncated)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   543
      pruned match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   544
        case AZERO => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   545
        case AONE(bs1) => fuse(bs ++ bs1, r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   546
        case pruned1 => ASEQ(bs, pruned1, r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   547
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   548
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   549
    case AALTS(bs, rs) => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   550
      //allowableTerms.foreach(a => println(shortRexpOutput(a)))        
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   551
      val rsp = rs.map(r => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   552
                    pruneRexp(r, allowableTerms)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   553
                  )
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   554
                  .filter(r => r != AZERO)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   555
      rsp match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   556
        case Nil => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   557
        case r1::Nil => fuse(bs, r1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   558
        case rs1 => AALTS(bs, rs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   559
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   560
    case r => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   561
      if(allowableTerms.contains(erase(r))) r else AZERO //assert(r != AZERO)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   562
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   563
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   564
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   565
def oneSimp(r: Rexp) : Rexp = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   566
  case SEQ(ONE, r) => r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   567
  case SEQ(r1, r2) => SEQ(oneSimp(r1), r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   568
  case r => r//assert r != 0 
432
994403dbbed5 strong!
Chengsong
parents: 431
diff changeset
   569
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   570
}
431
Chengsong
parents:
diff changeset
   571
Chengsong
parents:
diff changeset
   572
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   573
def distinctBy4(xs: List[ARexp], acc: List[Rexp] = Nil) : List[ARexp] = xs match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   574
  case Nil => Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   575
  case x :: xs =>
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   576
    //assert(acc.distinct == acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   577
    val erased = erase(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   578
    if(acc.contains(erased))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   579
      distinctBy4(xs, acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   580
    else{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   581
      val addToAcc =  breakIntoTerms(erased).filter(r => !acc.contains(oneSimp(r)))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   582
      //val xp = pruneRexp(x, addToAcc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   583
      pruneRexp(x, addToAcc) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   584
        case AZERO => distinctBy4(xs, addToAcc.map(oneSimp(_)) ::: acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   585
        case xPrime => xPrime :: distinctBy4(xs, addToAcc.map(oneSimp(_)) ::: acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   586
      }
431
Chengsong
parents:
diff changeset
   587
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   588
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   589
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   590
// fun pAKC_aux :: "arexp list ⇒ arexp ⇒ rexp ⇒ arexp"
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   591
//   where
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   592
// "pAKC_aux rsa r ctx = (if (L (SEQ (erase r) ( ctx) )) ⊆ (L (erase (AALTs [] rsa))) then AZERO else
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   593
//                           case r of (ASEQ bs r1 r2) ⇒ 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   594
//                             bsimp_ASEQ bs (pAKC_aux rsa r1 (SEQ  (erase r2) ( ctx) )) r2   |
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   595
//                                     (AALTs bs rs) ⇒ 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   596
//                             bsimp_AALTs bs (flts (map (λr. pAKC_aux rsa r ( ctx) ) rs) )    |
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   597
//                                     r             ⇒ r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   598
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   599
// def canonicalSeq(rs: List[Rexp], acc: Rexp) = rs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   600
//   case r::Nil => SEQ(r, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   601
//   case Nil => acc
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   602
//   case r1::r2::Nil => SEQ(SEQ(r1, r2), acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   603
// }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   604
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   605
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   606
//the "fake" Language interpretation: just concatenates!
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   607
def L(acc: Rexp, rs: List[Rexp]) : Rexp = rs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   608
  case Nil => acc
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   609
  case r :: rs1 => 
500
Chengsong
parents: 494
diff changeset
   610
    // if(acc == ONE) 
Chengsong
parents: 494
diff changeset
   611
    //   L(r, rs1) 
Chengsong
parents: 494
diff changeset
   612
    // else
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   613
      L(SEQ(acc, r), rs1)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   614
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   615
500
Chengsong
parents: 494
diff changeset
   616
def rprint(r: Rexp) : Unit = println(shortRexpOutput(r))
Chengsong
parents: 494
diff changeset
   617
def rsprint(rs: List[Rexp]) = rs.foreach(r => println(shortRexpOutput(r)))
Chengsong
parents: 494
diff changeset
   618
def aprint(a: ARexp) = println(shortRexpOutput(erase(a)))
Chengsong
parents: 494
diff changeset
   619
def asprint(as: List[ARexp]) = as.foreach(a => println(shortRexpOutput(erase(a))))
Chengsong
parents: 494
diff changeset
   620
Chengsong
parents: 494
diff changeset
   621
def pAKC(acc: List[Rexp], r: ARexp, ctx: List[Rexp]) : ARexp = {
Chengsong
parents: 494
diff changeset
   622
  // println("pakc")
Chengsong
parents: 494
diff changeset
   623
  // println(shortRexpOutput(erase(r)))
Chengsong
parents: 494
diff changeset
   624
  // println("acc")
Chengsong
parents: 494
diff changeset
   625
  // rsprint(acc)
Chengsong
parents: 494
diff changeset
   626
  // println("ctx---------")
Chengsong
parents: 494
diff changeset
   627
  // rsprint(ctx)
Chengsong
parents: 494
diff changeset
   628
  // println("ctx---------end")
Chengsong
parents: 494
diff changeset
   629
  // rsprint(breakIntoTerms(L(erase(r), ctx)).map(oneSimp))
Chengsong
parents: 494
diff changeset
   630
Chengsong
parents: 494
diff changeset
   631
  if (breakIntoTerms(L(erase(r), ctx)).map(oneSimp).forall(acc.contains)) {//acc.flatMap(breakIntoTerms
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   632
    AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   633
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   634
  else{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   635
    r match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   636
      case ASEQ(bs, r1, r2) => 
500
Chengsong
parents: 494
diff changeset
   637
      (pAKC(acc, r1, erase(r2) :: ctx)) match{
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   638
        case AZERO => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   639
          AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   640
        case AONE(bs1) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   641
          fuse(bs1, r2)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   642
        case r1p => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   643
          ASEQ(bs, r1p, r2)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   644
      }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   645
      case AALTS(bs, rs0) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   646
        // println("before pruning")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   647
        // println(s"ctx is ")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   648
        // ctx.foreach(r => println(shortRexpOutput(r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   649
        // println(s"rs0 is ")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   650
        // rs0.foreach(r => println(shortRexpOutput(erase(r))))
500
Chengsong
parents: 494
diff changeset
   651
        // println(s"acc is ")
Chengsong
parents: 494
diff changeset
   652
        // acc.foreach(r => println(shortRexpOutput(r)))
Chengsong
parents: 494
diff changeset
   653
        rs0.map(r => pAKC(acc, r, ctx)).filter(_ != AZERO) match {
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   654
          case Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   655
            // println("after pruning Nil")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   656
            AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   657
          case r :: Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   658
            // println("after pruning singleton")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   659
            // println(shortRexpOutput(erase(r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   660
            r 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   661
          case rs0p => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   662
          // println("after pruning non-singleton")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   663
            AALTS(bs, rs0p)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   664
        }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   665
      case r => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   666
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   667
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   668
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   669
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   670
def distinctBy5(xs: List[ARexp], acc: List[Rexp] = Nil) : List[ARexp] = xs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   671
  case Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   672
    Nil
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   673
  case x :: xs => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   674
    val erased = erase(x)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   675
    if(acc.contains(erased)){
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   676
      distinctBy5(xs, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   677
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   678
    else{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   679
      val pruned = pAKC(acc, x, Nil)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   680
      val newTerms = breakIntoTerms(erase(pruned))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   681
      pruned match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   682
        case AZERO => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   683
          distinctBy5(xs, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   684
        case xPrime => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   685
          xPrime :: distinctBy5(xs, newTerms.map(oneSimp) ::: acc)//distinctBy5(xs, addToAcc.map(oneSimp(_)) ::: acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   686
      }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   687
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   688
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   689
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   690
431
Chengsong
parents:
diff changeset
   691
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   692
def breakIntoTerms(r: Rexp) : List[Rexp] = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   693
  case SEQ(r1, r2)  => breakIntoTerms(r1).map(r11 => SEQ(r11, r2))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   694
  case ALTS(r1, r2) => breakIntoTerms(r1) ::: breakIntoTerms(r2)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   695
  case ZERO => Nil
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   696
  case _ => r::Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   697
}
431
Chengsong
parents:
diff changeset
   698
Chengsong
parents:
diff changeset
   699
Chengsong
parents:
diff changeset
   700
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   701
def decode_aux(r: Rexp, bs: Bits) : (Val, Bits) = (r, bs) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   702
  case (ONE, bs) => (Empty, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   703
  case (CHAR(f), bs) => (Chr(f), bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   704
  case (ALTS(r1, r2), Z::bs1) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   705
      val (v, bs2) = decode_aux(r1, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   706
      (Left(v), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   707
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   708
  case (ALTS(r1, r2), S::bs1) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   709
      val (v, bs2) = decode_aux(r2, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   710
      (Right(v), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   711
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   712
  case (SEQ(r1, r2), bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   713
    val (v1, bs1) = decode_aux(r1, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   714
    val (v2, bs2) = decode_aux(r2, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   715
    (Sequ(v1, v2), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   716
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   717
  case (STAR(r1), S::bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   718
    val (v, bs1) = decode_aux(r1, bs)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   719
    //(v)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   720
    val (Stars(vs), bs2) = decode_aux(STAR(r1), bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   721
    (Stars(v::vs), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   722
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   723
  case (STAR(_), Z::bs) => (Stars(Nil), bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   724
  case (RECD(x, r1), bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   725
    val (v, bs1) = decode_aux(r1, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   726
    (Rec(x, v), bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   727
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   728
  case (NOT(r), bs) => (Nots(r.toString), bs)
431
Chengsong
parents:
diff changeset
   729
}
Chengsong
parents:
diff changeset
   730
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   731
def decode(r: Rexp, bs: Bits) = decode_aux(r, bs) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   732
  case (v, Nil) => v
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   733
  case _ => throw new Exception("Not decodable")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   734
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   735
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   736
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   737
431
Chengsong
parents:
diff changeset
   738
def blexing_simp(r: Rexp, s: String) : Val = {
Chengsong
parents:
diff changeset
   739
    val bit_code = blex_simp(internalise(r), s.toList)
Chengsong
parents:
diff changeset
   740
    decode(r, bit_code)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   741
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   742
def simpBlexer(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   743
  Try(blexing_simp(r, s)).getOrElse(Failure)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   744
}
431
Chengsong
parents:
diff changeset
   745
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   746
def strong_blexing_simp(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   747
  decode(r, strong_blex_simp(internalise(r), s.toList))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   748
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   749
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   750
def strong_blexing_simp5(r: Rexp, s: String) : Val = {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   751
  decode(r, strong_blex_simp5(internalise(r), s.toList))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   752
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   753
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   754
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   755
def strongBlexer(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   756
  Try(strong_blexing_simp(r, s)).getOrElse(Failure)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   757
}
431
Chengsong
parents:
diff changeset
   758
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   759
def strongBlexer5(r: Rexp, s: String): Val = {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   760
  Try(strong_blexing_simp5(r, s)).getOrElse(Failure)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   761
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   762
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   763
def strong_blex_simp(r: ARexp, s: List[Char]) : Bits = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   764
  case Nil => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   765
    if (bnullable(r)) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   766
      //println(asize(r))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   767
      val bits = mkepsBC(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   768
      bits
431
Chengsong
parents:
diff changeset
   769
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   770
    else 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   771
      throw new Exception("Not matched")
431
Chengsong
parents:
diff changeset
   772
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   773
  case c::cs => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   774
    val der_res = bder(c,r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   775
    val simp_res = strongBsimp(der_res)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   776
    strong_blex_simp(simp_res, cs)      
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   777
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   778
}
431
Chengsong
parents:
diff changeset
   779
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   780
def strong_blex_simp5(r: ARexp, s: List[Char]) : Bits = s match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   781
  case Nil => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   782
    if (bnullable(r)) {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   783
      //println(asize(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   784
      val bits = mkepsBC(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   785
      bits
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   786
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   787
    else 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   788
      throw new Exception("Not matched")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   789
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   790
  case c::cs => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   791
    val der_res = bder(c,r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   792
    val simp_res = strongBsimp5(der_res)  
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   793
    strong_blex_simp5(simp_res, cs)      
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   794
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   795
}
431
Chengsong
parents:
diff changeset
   796
Chengsong
parents:
diff changeset
   797
Chengsong
parents:
diff changeset
   798
  def bders_simp(s: List[Char], r: ARexp) : ARexp = s match {
Chengsong
parents:
diff changeset
   799
    case Nil => r
435
Chengsong
parents: 432
diff changeset
   800
    case c::s => 
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   801
      //println(erase(r))
435
Chengsong
parents: 432
diff changeset
   802
      bders_simp(s, bsimp(bder(c, r)))
431
Chengsong
parents:
diff changeset
   803
  }
Chengsong
parents:
diff changeset
   804
  
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   805
  def bdersStrong5(s: List[Char], r: ARexp) : ARexp = s match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   806
    case Nil => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   807
    case c::s => bdersStrong5(s, strongBsimp5(bder(c, r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   808
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   809
431
Chengsong
parents:
diff changeset
   810
  def bdersSimp(s: String, r: Rexp) : ARexp = bders_simp(s.toList, internalise(r))
Chengsong
parents:
diff changeset
   811
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   812
  def bdersStrong(s: List[Char], r: ARexp) : ARexp = s match {
431
Chengsong
parents:
diff changeset
   813
    case Nil => r 
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   814
    case c::s => bdersStrong(s, strongBsimp(bder(c, r)))
431
Chengsong
parents:
diff changeset
   815
  }
Chengsong
parents:
diff changeset
   816
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   817
  def bdersStrongRexp(s: String, r: Rexp) : ARexp = bdersStrong(s.toList, internalise(r))
431
Chengsong
parents:
diff changeset
   818
Chengsong
parents:
diff changeset
   819
  def erase(r:ARexp): Rexp = r match{
Chengsong
parents:
diff changeset
   820
    case AZERO => ZERO
Chengsong
parents:
diff changeset
   821
    case AONE(_) => ONE
Chengsong
parents:
diff changeset
   822
    case ACHAR(bs, c) => CHAR(c)
Chengsong
parents:
diff changeset
   823
    case AALTS(bs, Nil) => ZERO
Chengsong
parents:
diff changeset
   824
    case AALTS(bs, a::Nil) => erase(a)
Chengsong
parents:
diff changeset
   825
    case AALTS(bs, a::as) => ALTS(erase(a), erase(AALTS(bs, as)))
Chengsong
parents:
diff changeset
   826
    case ASEQ(bs, r1, r2) => SEQ (erase(r1), erase(r2))
Chengsong
parents:
diff changeset
   827
    case ASTAR(cs, r)=> STAR(erase(r))
Chengsong
parents:
diff changeset
   828
    case ANOT(bs, r) => NOT(erase(r))
Chengsong
parents:
diff changeset
   829
    case AANYCHAR(bs) => ANYCHAR
Chengsong
parents:
diff changeset
   830
  }
Chengsong
parents:
diff changeset
   831
Chengsong
parents:
diff changeset
   832
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   833
  def allCharSeq(r: Rexp) : Boolean = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   834
    case CHAR(c) => true
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   835
    case SEQ(r1, r2) => allCharSeq(r1) && allCharSeq(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   836
    case _ => false
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   837
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   838
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   839
  def flattenSeq(r: Rexp) : String = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   840
    case CHAR(c) => c.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   841
    case SEQ(r1, r2) => flattenSeq(r1) ++ flattenSeq(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   842
    case _ => throw new Error("flatten unflattenable rexp")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   843
  } 
431
Chengsong
parents:
diff changeset
   844
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   845
  def shortRexpOutput(r: Rexp) : String = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   846
      case CHAR(c) => c.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   847
      case ONE => "1"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   848
      case ZERO => "0"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   849
      case SEQ(r1, r2) if(allCharSeq(r)) => flattenSeq(r)//"[" ++ shortRexpOutput(r1) ++ "~" ++ shortRexpOutput(r2) ++ "]"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   850
      case SEQ(r1, r2) => "[" ++ shortRexpOutput(r1) ++ "~" ++ shortRexpOutput(r2) ++ "]"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   851
      case ALTS(r1, r2) => "(" ++ shortRexpOutput(r1) ++ "+" ++ shortRexpOutput(r2) ++ ")"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   852
      case STAR(STAR(r)) => "(..)*"// ++ shortRexpOutput(r) ++ "]*"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   853
      case STAR(r) => "STAR(" ++ shortRexpOutput(r) ++ ")"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   854
      //case RTOP => "RTOP"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   855
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   856
431
Chengsong
parents:
diff changeset
   857
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   858
  def blex_simp(r: ARexp, s: List[Char]) : Bits = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   859
      case Nil => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   860
        if (bnullable(r)) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   861
          val bits = mkepsBC(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   862
          bits
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   863
        }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   864
        else 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   865
          throw new Exception("Not matched")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   866
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   867
      case c::cs => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   868
        val der_res = bder(c,r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   869
        val simp_res = bsimp(der_res)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   870
        blex_simp(simp_res, cs)      
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   871
      }
431
Chengsong
parents:
diff changeset
   872
  }
Chengsong
parents:
diff changeset
   873
Chengsong
parents:
diff changeset
   874
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   875
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   876
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   877
    def size(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   878
      case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   879
      case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   880
      case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   881
      case ANYCHAR => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   882
      case NOT(r0) => 1 + size(r0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   883
      case SEQ(r1, r2) => 1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   884
      case ALTS(r1, r2) => 1 + List(r1, r2).map(size).sum
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   885
      case STAR(r) => 1 + size(r)
431
Chengsong
parents:
diff changeset
   886
    }
Chengsong
parents:
diff changeset
   887
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   888
    def asize(a: ARexp) = size(erase(a))
431
Chengsong
parents:
diff changeset
   889
Chengsong
parents:
diff changeset
   890
//pder related
Chengsong
parents:
diff changeset
   891
type Mon = (Char, Rexp)
Chengsong
parents:
diff changeset
   892
type Lin = Set[Mon]
Chengsong
parents:
diff changeset
   893
Chengsong
parents:
diff changeset
   894
def dot_prod(rs: Set[Rexp], r: Rexp): Set[Rexp] = r match {
Chengsong
parents:
diff changeset
   895
    case ZERO => Set()
Chengsong
parents:
diff changeset
   896
    case ONE => rs
Chengsong
parents:
diff changeset
   897
    case r => rs.map((re) => if (re == ONE) r else SEQ(re, r)  )   
Chengsong
parents:
diff changeset
   898
  }
Chengsong
parents:
diff changeset
   899
  def cir_prod(l: Lin, t: Rexp): Lin = t match {//remember this Lin is different from the Lin in Antimirov's paper. Here it does not mean the set of all subsets of linear forms that does not contain zero, but rather the type a set of linear forms
Chengsong
parents:
diff changeset
   900
    case ZERO => Set()
Chengsong
parents:
diff changeset
   901
    case ONE => l
Chengsong
parents:
diff changeset
   902
    case t => l.map( m => m._2 match {case ZERO => m case ONE => (m._1, t) case p => (m._1, SEQ(p, t)) }  )
Chengsong
parents:
diff changeset
   903
  }
Chengsong
parents:
diff changeset
   904
  def lf(r: Rexp): Lin = r match {
Chengsong
parents:
diff changeset
   905
    case ZERO => Set()
Chengsong
parents:
diff changeset
   906
    case ONE => Set()
Chengsong
parents:
diff changeset
   907
    case CHAR(f) => {
Chengsong
parents:
diff changeset
   908
      //val Some(c) = alphabet.find(f) 
Chengsong
parents:
diff changeset
   909
      Set((f, ONE))
Chengsong
parents:
diff changeset
   910
    }
Chengsong
parents:
diff changeset
   911
    case ALTS(r1, r2) => {
Chengsong
parents:
diff changeset
   912
      lf(r1 ) ++ lf(r2)
Chengsong
parents:
diff changeset
   913
    }
Chengsong
parents:
diff changeset
   914
    case STAR(r1) => cir_prod(lf(r1), STAR(r1)) //may try infix notation later......
Chengsong
parents:
diff changeset
   915
    case SEQ(r1, r2) =>{
Chengsong
parents:
diff changeset
   916
      if (nullable(r1))
Chengsong
parents:
diff changeset
   917
        cir_prod(lf(r1), r2) ++ lf(r2)
Chengsong
parents:
diff changeset
   918
      else
Chengsong
parents:
diff changeset
   919
        cir_prod(lf(r1), r2) 
Chengsong
parents:
diff changeset
   920
    }
Chengsong
parents:
diff changeset
   921
  }
Chengsong
parents:
diff changeset
   922
  def lfs(r: Set[Rexp]): Lin = {
Chengsong
parents:
diff changeset
   923
    r.foldLeft(Set[Mon]())((acc, r) => acc ++ lf(r))
Chengsong
parents:
diff changeset
   924
  }
Chengsong
parents:
diff changeset
   925
Chengsong
parents:
diff changeset
   926
  def pder(x: Char, t: Rexp): Set[Rexp] = {
Chengsong
parents:
diff changeset
   927
    val lft = lf(t)
Chengsong
parents:
diff changeset
   928
    (lft.filter(mon => if(mon._1 == x) true else false)).map(mon => mon._2)
Chengsong
parents:
diff changeset
   929
  }
Chengsong
parents:
diff changeset
   930
  def pders_single(s: List[Char], t: Rexp) : Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   931
    case x::xs => pders(xs, pder(x, t))
Chengsong
parents:
diff changeset
   932
    case Nil => Set(t)
Chengsong
parents:
diff changeset
   933
  }
Chengsong
parents:
diff changeset
   934
  def pders(s: List[Char], ts: Set[Rexp]) : Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   935
    case x::xs => pders(xs, ts.foldLeft(Set[Rexp]())((acc, t) => acc ++ pder(x, t)))
Chengsong
parents:
diff changeset
   936
    case Nil => ts 
Chengsong
parents:
diff changeset
   937
  }
Chengsong
parents:
diff changeset
   938
  def pderss(ss: List[List[Char]], t: Rexp): Set[Rexp] = ss.foldLeft( Set[Rexp]() )( (acc, s) => pders_single(s, t) ++ acc )
Chengsong
parents:
diff changeset
   939
  def pdera(t: Rexp): Set[Rexp] = lf(t).map(mon => mon._2)
Chengsong
parents:
diff changeset
   940
  //all implementation of partial derivatives that involve set union are potentially buggy
Chengsong
parents:
diff changeset
   941
  //because they don't include the original regular term before they are pdered.
Chengsong
parents:
diff changeset
   942
  //now only pderas is fixed.
Chengsong
parents:
diff changeset
   943
  def pderas(t: Set[Rexp], d: Int): Set[Rexp] = if(d > 0) pderas(lfs(t).map(mon => mon._2), d - 1) ++ t else lfs(t).map(mon => mon._2) ++ t//repeated application of pderas over the newest set of pders.
Chengsong
parents:
diff changeset
   944
  def pderUNIV(r: Rexp) : Set[Rexp] = pderas(Set(r), awidth(r) + 1)
Chengsong
parents:
diff changeset
   945
  def awidth(r: Rexp) : Int = r match {
Chengsong
parents:
diff changeset
   946
    case CHAR(c) => 1
Chengsong
parents:
diff changeset
   947
    case SEQ(r1, r2) => awidth(r1) + awidth(r2)
Chengsong
parents:
diff changeset
   948
    case ALTS(r1, r2) => awidth(r1) + awidth(r2)
Chengsong
parents:
diff changeset
   949
    case ONE => 0
Chengsong
parents:
diff changeset
   950
    case ZERO => 0
Chengsong
parents:
diff changeset
   951
    case STAR(r) => awidth(r)
Chengsong
parents:
diff changeset
   952
  }
Chengsong
parents:
diff changeset
   953
  //def sigma_lf(l: Set[Mon]) : Rexp = ALTS(l.map(mon => SEQ(CHAR(mon._1),mon._2)).toList)
Chengsong
parents:
diff changeset
   954
  //def sigma(rs: Set[Rexp]) : Rexp = ALTS(rs.toList)
Chengsong
parents:
diff changeset
   955
  def o(r: Rexp) = if (nullable(r)) ONE else ZERO
Chengsong
parents:
diff changeset
   956
  //def nlf(t: Rexp) : Rexp = ALTS(List( o(t), sigma_lf(lf(t)) ))
Chengsong
parents:
diff changeset
   957
  def pdp(x: Char, r: Rexp) : Set[Rexp] = r match {
Chengsong
parents:
diff changeset
   958
    case ZERO => Set[Rexp]()
Chengsong
parents:
diff changeset
   959
    case ONE => Set[Rexp]()
Chengsong
parents:
diff changeset
   960
    case CHAR(f) => if(x == f) Set(ONE) else Set[Rexp]()
Chengsong
parents:
diff changeset
   961
    case ALTS(r1, r2) => pdp(x, r1) ++ pdp(x, r2)
Chengsong
parents:
diff changeset
   962
    case STAR(r1) => pdp(x, r).map(a => SEQ(a, STAR(r1)))
Chengsong
parents:
diff changeset
   963
    case SEQ(a0, b) => if(nullable(a0)) pdp(x, a0).map(a => SEQ(a, b)) ++ pdp(x, b) else pdp(x, a0).map(a => SEQ(a, b))
Chengsong
parents:
diff changeset
   964
  }
Chengsong
parents:
diff changeset
   965
  def pdps(s: List[Char], ts: Set[Rexp]): Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   966
    case x::xs => pdps(xs, ts.foldLeft(Set[Rexp]())((acc, t) => acc ++ pder(x, t)))
Chengsong
parents:
diff changeset
   967
    case Nil => ts   
Chengsong
parents:
diff changeset
   968
  }
Chengsong
parents:
diff changeset
   969
  def pdpss(ss: List[List[Char]], t: Rexp): Set[Rexp] = ss.foldLeft( Set[Rexp]())((acc, s) => pdps(s, Set(t)) ++ acc)
Chengsong
parents:
diff changeset
   970
Chengsong
parents:
diff changeset
   971
Chengsong
parents:
diff changeset
   972
Chengsong
parents:
diff changeset
   973
def starPrint(r: Rexp) : Unit = r match {
Chengsong
parents:
diff changeset
   974
        
Chengsong
parents:
diff changeset
   975
          case SEQ(head, rstar) =>
Chengsong
parents:
diff changeset
   976
            println(shortRexpOutput(head) ++ "~STARREG")
Chengsong
parents:
diff changeset
   977
          case STAR(rstar) =>
Chengsong
parents:
diff changeset
   978
            println("STARREG")
Chengsong
parents:
diff changeset
   979
          case ALTS(r1, r2) =>  
Chengsong
parents:
diff changeset
   980
            println("(")
Chengsong
parents:
diff changeset
   981
            starPrint(r1)
Chengsong
parents:
diff changeset
   982
            println("+")
Chengsong
parents:
diff changeset
   983
            starPrint(r2)
Chengsong
parents:
diff changeset
   984
            println(")")
Chengsong
parents:
diff changeset
   985
          case ZERO => println("0")
Chengsong
parents:
diff changeset
   986
        
Chengsong
parents:
diff changeset
   987
      }
Chengsong
parents:
diff changeset
   988
Chengsong
parents:
diff changeset
   989
// @arg(doc = "small tests")
Chengsong
parents:
diff changeset
   990
val STARREG = //((( (STAR("aa")) | STAR("aaa") ).%).%)
Chengsong
parents:
diff changeset
   991
(((STAR("a") | ( STAR("aaa")) | STAR("aaaaa"| ( STAR("aaaaaaa")) | STAR("aaaaaaaaaaa"))).%).%).%
Chengsong
parents:
diff changeset
   992
Chengsong
parents:
diff changeset
   993
// @main
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   994
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   995
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   996
431
Chengsong
parents:
diff changeset
   997
def small() = {
Chengsong
parents:
diff changeset
   998
Chengsong
parents:
diff changeset
   999
Chengsong
parents:
diff changeset
  1000
//   println(lexing_simp(NOTREG, prog0))
Chengsong
parents:
diff changeset
  1001
//   val v = lex_simp(NOTREG, prog0.toList)
Chengsong
parents:
diff changeset
  1002
//   println(v)
Chengsong
parents:
diff changeset
  1003
Chengsong
parents:
diff changeset
  1004
//   val d =  (lex_simp(NOTREG, prog0.toList))
Chengsong
parents:
diff changeset
  1005
//   println(d)
Chengsong
parents:
diff changeset
  1006
  val pderSTAR = pderUNIV(STARREG)
Chengsong
parents:
diff changeset
  1007
Chengsong
parents:
diff changeset
  1008
  val refSize = pderSTAR.map(size(_)).sum
435
Chengsong
parents: 432
diff changeset
  1009
  // println("different partial derivative terms:")
Chengsong
parents: 432
diff changeset
  1010
  // pderSTAR.foreach(r => r match {
431
Chengsong
parents:
diff changeset
  1011
      
435
Chengsong
parents: 432
diff changeset
  1012
  //       case SEQ(head, rstar) =>
Chengsong
parents: 432
diff changeset
  1013
  //         println(shortRexpOutput(head) ++ "~STARREG")
Chengsong
parents: 432
diff changeset
  1014
  //       case STAR(rstar) =>
Chengsong
parents: 432
diff changeset
  1015
  //         println("STARREG")
431
Chengsong
parents:
diff changeset
  1016
      
435
Chengsong
parents: 432
diff changeset
  1017
  //   }
Chengsong
parents: 432
diff changeset
  1018
  //   )
Chengsong
parents: 432
diff changeset
  1019
  // println("the total number of terms is")
Chengsong
parents: 432
diff changeset
  1020
  // //println(refSize)
Chengsong
parents: 432
diff changeset
  1021
  // println(pderSTAR.size)
431
Chengsong
parents:
diff changeset
  1022
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1023
  // val A : Rexp= ("c" | (ONE | "b") ~ "d") ~((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1024
  // val B : Rexp = ((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1025
  // val C : Rexp = ("d") ~ ((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1026
  // val PRUNE_REG : Rexp = (C | B | A)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1027
  // val APRUNE_REG = internalise(PRUNE_REG)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1028
  // val program_solution = pruneRexp(APRUNE_REG, breakIntoTerms(PRUNE_REG))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1029
  // println("program executes and gives: as disired!")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1030
  // println(shortRexpOutput(erase(program_solution)))
435
Chengsong
parents: 432
diff changeset
  1031
  // val simpedPruneReg = strongBsimp(APRUNE_REG)
Chengsong
parents: 432
diff changeset
  1032
Chengsong
parents: 432
diff changeset
  1033
  // println(shortRexpOutput(erase(simpedPruneReg)))
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1034
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1035
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1036
  for(i <- List(1,2,3,4,10, 100, 400, 841, 900 ) ){// 100, 400, 800, 840, 841, 900
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1037
    val prog0 = "a" * i
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1038
    //println(s"test: $prog0")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1039
    println(s"testing with $i a's" )
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1040
    //val bd = bdersSimp(prog0, STARREG)//DB
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1041
    val sbd = bdersStrongRexp(prog0, STARREG)//strongDB
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1042
    starPrint(erase(sbd))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1043
    val subTerms = breakIntoTerms(erase(sbd))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1044
    //val subTermsLarge = breakIntoTerms(erase(bd))
431
Chengsong
parents:
diff changeset
  1045
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1046
    println(s"subterms of regex with strongDB: ${subTerms.length}")//, standard DB: ${subTermsLarge.length}")
431
Chengsong
parents:
diff changeset
  1047
Chengsong
parents:
diff changeset
  1048
Chengsong
parents:
diff changeset
  1049
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1050
    println("the number of distinct subterms for bsimp with strongDB")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1051
    println(subTerms.distinct.size)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1052
    //println(subTermsLarge.distinct.size)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1053
    if(pderSTAR.size > subTerms.length)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1054
      println(s"which is less than or equal to the number of PDER terms: ${pderSTAR.size}")
431
Chengsong
parents:
diff changeset
  1055
Chengsong
parents:
diff changeset
  1056
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1057
    // println(shortRexpOutput(erase(sbd)))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1058
    // println(shortRexpOutput(erase(bd)))
431
Chengsong
parents:
diff changeset
  1059
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1060
    println("pdersize, original, strongSimp")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1061
    println(refSize, size(STARREG),  asize(sbd))
431
Chengsong
parents:
diff changeset
  1062
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1063
    //val vres = strong_blexing_simp( STARREG, prog0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1064
    //println(vres)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1065
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1066
  // println(vs.length)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1067
  // println(vs)
431
Chengsong
parents:
diff changeset
  1068
   
Chengsong
parents:
diff changeset
  1069
Chengsong
parents:
diff changeset
  1070
  // val prog1 = """read  n; write n"""  
Chengsong
parents:
diff changeset
  1071
  // println(s"test: $prog1")
Chengsong
parents:
diff changeset
  1072
  // println(lexing_simp(WHILE_REGS, prog1))
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1073
  // val display = ("a"| "ab").%
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1074
  // val adisplay = internalise(display)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1075
  // bders_simp( "aaaaa".toList, adisplay)
431
Chengsong
parents:
diff changeset
  1076
}
Chengsong
parents:
diff changeset
  1077
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1078
def generator_test() {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1079
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1080
  // test(rexp(7), 1000) { (r: Rexp) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1081
  //   val ss = stringsFromRexp(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1082
  //   val boolList = ss.map(s => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1083
  //     val simpVal = simpBlexer(r, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1084
  //     val strongVal = strongBlexer(r, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1085
  //     // println(simpVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1086
  //     // println(strongVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1087
  //     (simpVal == strongVal) && (simpVal != None) 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1088
  //   })
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1089
  //   !boolList.exists(b => b == false)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1090
  // }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1091
  // test(single(STAR(ALTS(STAR(CHAR('c')),ALTS(CHAR('c'),ZERO)))), 100000) { (r: Rexp) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1092
  //   val ss = stringsFromRexp(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1093
  //   val boolList = ss.map(s => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1094
  //     val bdStrong = bdersStrong(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1095
  //     val bdStrong5 = bdersStrong5(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1096
  //     // println(shortRexpOutput(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1097
  //     // println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1098
  //     // println(strongVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1099
  //     // println(strongVal5)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1100
  //     // (strongVal == strongVal5) 
493
Chengsong
parents: 492
diff changeset
  1101
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1102
  //     if(asize(bdStrong5) > asize(bdStrong)){
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1103
  //       println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1104
  //       println(shortRexpOutput(erase(bdStrong5)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1105
  //       println(shortRexpOutput(erase(bdStrong)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1106
  //     }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1107
  //     asize(bdStrong5) <= asize(bdStrong)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1108
  //   })
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1109
  //   !boolList.exists(b => b == false)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1110
  // }
500
Chengsong
parents: 494
diff changeset
  1111
  //*** example where bdStrong5 has a smaller size than bdStrong
Chengsong
parents: 494
diff changeset
  1112
  // test(single(STAR(SEQ(ALTS(SEQ(STAR(CHAR('a')),ALTS(ALTS(ONE,ZERO),SEQ(ONE,ONE))),CHAR('a')),ONE))), 1) { (r: Rexp) => 
Chengsong
parents: 494
diff changeset
  1113
  //*** depth 5 example bdStrong5 larger size than bdStrong
Chengsong
parents: 494
diff changeset
  1114
  // test(single(STAR(SEQ(SEQ(ALTS(CHAR('b'),STAR(CHAR('b'))),CHAR('b')),(ALTS(STAR(CHAR('c')), ONE))))), 1) {(r: Rexp) =>
Chengsong
parents: 494
diff changeset
  1115
 
Chengsong
parents: 494
diff changeset
  1116
 
Chengsong
parents: 494
diff changeset
  1117
 
Chengsong
parents: 494
diff changeset
  1118
  //sanity check from Christian's request
Chengsong
parents: 494
diff changeset
  1119
  // val r = ("a" | "ab") ~ ("bc" | "c")
Chengsong
parents: 494
diff changeset
  1120
  // val a = internalise(r)
Chengsong
parents: 494
diff changeset
  1121
  // val aval = blexing_simp(r, "abc")
Chengsong
parents: 494
diff changeset
  1122
  // println(aval)
Chengsong
parents: 494
diff changeset
  1123
Chengsong
parents: 494
diff changeset
  1124
  //sample counterexample:(depth 7)
Chengsong
parents: 494
diff changeset
  1125
  //STAR(SEQ(ALTS(STAR(STAR(STAR(STAR(CHAR(c))))),ALTS(CHAR(c),CHAR(b))),ALTS(ZERO,SEQ(ALTS(ALTS(STAR(CHAR(c)),SEQ(CHAR(b),CHAR(a))),CHAR(c)),STAR(ALTS(ALTS(ONE,CHAR(a)),STAR(CHAR(c))))))))
Chengsong
parents: 494
diff changeset
  1126
  //(depth5)
Chengsong
parents: 494
diff changeset
  1127
  //STAR(SEQ(ALTS(ALTS(STAR(CHAR(b)),SEQ(ONE,CHAR(b))),SEQ(STAR(CHAR(a)),CHAR(b))),ALTS(ZERO,ALTS(STAR(CHAR(b)),STAR(CHAR(a))))))
Chengsong
parents: 494
diff changeset
  1128
  test(rexp(4), 10000000) { (r: Rexp) => 
Chengsong
parents: 494
diff changeset
  1129
  // ALTS(SEQ(SEQ(ONE,CHAR('a')),STAR(CHAR('a'))),SEQ(ALTS(CHAR('c'),ONE),STAR(ZERO))))))), 1) { (r: Rexp) => 
493
Chengsong
parents: 492
diff changeset
  1130
    val ss = stringsFromRexp(r)
Chengsong
parents: 492
diff changeset
  1131
    val boolList = ss.map(s => {
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1132
      val bdStrong = bdersStrong(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1133
      val bdStrong5 = bdersStrong5(s.toList, internalise(r))
500
Chengsong
parents: 494
diff changeset
  1134
      val bdFurther5 = strongBsimp5(bdStrong5)
Chengsong
parents: 494
diff changeset
  1135
      val sizeFurther5 = asize(bdFurther5)
Chengsong
parents: 494
diff changeset
  1136
      val pdersSet = pderUNIV(r)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1137
      val size5 = asize(bdStrong5)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1138
      val size0 = asize(bdStrong)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1139
      // println(s)
500
Chengsong
parents: 494
diff changeset
  1140
      // println("pdersSet size")
Chengsong
parents: 494
diff changeset
  1141
      // println(pdersSet.size)
Chengsong
parents: 494
diff changeset
  1142
      // pdersSet.foreach(r => println(shortRexpOutput(r)))
Chengsong
parents: 494
diff changeset
  1143
      // println("after bdStrong5")
Chengsong
parents: 494
diff changeset
  1144
      
Chengsong
parents: 494
diff changeset
  1145
      // println(shortRexpOutput(erase(bdStrong5)))
Chengsong
parents: 494
diff changeset
  1146
      // println(breakIntoTerms(erase(bdStrong5)).size)
Chengsong
parents: 494
diff changeset
  1147
      
Chengsong
parents: 494
diff changeset
  1148
      // println("after bdStrong")
Chengsong
parents: 494
diff changeset
  1149
      // println(shortRexpOutput(erase(bdStrong)))
Chengsong
parents: 494
diff changeset
  1150
      // println(breakIntoTerms(erase(bdStrong)).size)
Chengsong
parents: 494
diff changeset
  1151
      // println(size5, size0, sizeFurther5)
Chengsong
parents: 494
diff changeset
  1152
      // aprint(strongBsimp5(bdStrong))
Chengsong
parents: 494
diff changeset
  1153
      // println(asize(strongBsimp5(bdStrong5)))
Chengsong
parents: 494
diff changeset
  1154
      // println(s)
Chengsong
parents: 494
diff changeset
  1155
      size5 <= size0 
493
Chengsong
parents: 492
diff changeset
  1156
    })
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1157
    // println(boolList)
500
Chengsong
parents: 494
diff changeset
  1158
    //!boolList.exists(b => b == false)
493
Chengsong
parents: 492
diff changeset
  1159
    !boolList.exists(b => b == false)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1160
  }
493
Chengsong
parents: 492
diff changeset
  1161
Chengsong
parents: 492
diff changeset
  1162
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1163
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1164
// small()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1165
generator_test()
493
Chengsong
parents: 492
diff changeset
  1166
Chengsong
parents: 492
diff changeset
  1167
1
Chengsong
parents: 492
diff changeset
  1168
Chengsong
parents: 492
diff changeset
  1169
SEQ(SEQ(SEQ(ONE,CHAR('b')),STAR(CHAR('b'))),
Chengsong
parents: 492
diff changeset
  1170
SEQ(ALTS(ALTS(ZERO,STAR(CHAR('b'))),
Chengsong
parents: 492
diff changeset
  1171
STAR(ALTS(CHAR('a'),SEQ(SEQ(STAR(ALTS(STAR(CHAR('c')),CHAR('a'))),
Chengsong
parents: 492
diff changeset
  1172
SEQ(CHAR('a'),SEQ(ALTS(CHAR('b'),ZERO),SEQ(ONE,CHAR('b'))))),ONE)))),ONE))
Chengsong
parents: 492
diff changeset
  1173
Chengsong
parents: 492
diff changeset
  1174
Chengsong
parents: 492
diff changeset
  1175
// Sequ(Sequ(Sequ(Empty,Chr(b)),Stars(List(Chr(b), Chr(b)))),Sequ(Right(Stars(List(Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty)), Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty))))),Empty))
Chengsong
parents: 492
diff changeset
  1176
// Sequ(Sequ(Sequ(Empty,Chr(b)),Stars(List(Chr(b), Chr(b)))),Sequ(Right(Stars(List(Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty)), Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty))))),Empty))